Spaces:
Running
Running
Commit
·
15fccb8
1
Parent(s):
fa55b66
Refactor forgery detection process and improve result aggregation in forgery_routes.py
Browse files- app/api/forgery_routes.py +63 -34
- app/services/deepfake_video_detection.py +43 -0
- models/deepfake_videos.h5 +3 -0
app/api/forgery_routes.py
CHANGED
@@ -6,8 +6,9 @@ from app.services.gan_detection_service import GANDetectionService
|
|
6 |
from app.utils.file_utils import download_file, remove_temp_file, get_file_content
|
7 |
from app.utils.forgery_image_utils import detect_face
|
8 |
from app.utils.forgery_video_utils import extract_audio, extract_frames, compress_and_process_video, detect_speech # Adjust the import path if necessary
|
9 |
-
|
10 |
import os
|
|
|
11 |
import logging
|
12 |
import traceback
|
13 |
from pydantic import BaseModel
|
@@ -22,6 +23,8 @@ image_manipulation_service = ImageManipulationService()
|
|
22 |
face_manipulation_service = FaceManipulationService()
|
23 |
audio_deepfake_service = AudioDeepfakeService()
|
24 |
gan_detection_service = GANDetectionService()
|
|
|
|
|
25 |
|
26 |
def parse_confidence(value):
|
27 |
if isinstance(value, str):
|
@@ -86,6 +89,17 @@ async def process_image(firebase_filename: str):
|
|
86 |
logging.info(f"Image processing completed for: {firebase_filename}")
|
87 |
return results
|
88 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
89 |
async def process_video(firebase_filename: str):
|
90 |
logging.info(f"Starting video processing for: {firebase_filename}")
|
91 |
try:
|
@@ -100,14 +114,13 @@ async def process_video(firebase_filename: str):
|
|
100 |
audio_content = get_file_content(audio_filename)
|
101 |
if detect_speech(audio_content):
|
102 |
logging.info("Speech detected in the audio")
|
103 |
-
|
104 |
-
is_audio_deepfake = audio_deepfake_result["prediction"] == "Fake"
|
105 |
else:
|
106 |
logging.info("No speech detected in the audio")
|
107 |
await remove_temp_file(audio_filename)
|
108 |
logging.info(f"Temporary audio file removed: {audio_filename}")
|
109 |
else:
|
110 |
-
logging.
|
111 |
|
112 |
results = {"is_audio_deepfake": is_audio_deepfake}
|
113 |
|
@@ -115,45 +128,61 @@ async def process_video(firebase_filename: str):
|
|
115 |
logging.info(f"Frames extracted: {len(frames)} frames")
|
116 |
|
117 |
results.update({
|
118 |
-
"image_manipulation":
|
119 |
-
|
120 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
121 |
})
|
122 |
|
123 |
face_frames = []
|
124 |
-
|
125 |
-
|
126 |
-
|
127 |
-
|
128 |
-
has_face = detect_face(frame_content)
|
129 |
-
logging.info(f"Face detection result for {frame_filename}: {'Face detected' if has_face else 'No face detected'}")
|
130 |
-
|
131 |
-
results["image_manipulation"].append(image_manipulation_service.detect_manipulation(frame_filename))
|
132 |
-
results["gan_detection"].append(gan_detection_service.detect_gan(frame_filename))
|
133 |
|
|
|
|
|
|
|
134 |
if has_face:
|
135 |
-
face_frames.append(
|
136 |
-
|
137 |
-
|
138 |
-
|
139 |
-
|
140 |
-
|
141 |
-
|
142 |
-
|
143 |
-
|
144 |
-
|
145 |
-
for
|
146 |
-
|
147 |
-
|
148 |
-
|
149 |
-
|
150 |
-
|
151 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
152 |
logging.info(f"Aggregated results: {results}")
|
153 |
|
154 |
await remove_temp_file(compressed_video_filename)
|
155 |
-
|
|
|
|
|
156 |
logging.info(f"Video processing completed for: {firebase_filename}")
|
|
|
157 |
return results
|
158 |
except Exception as e:
|
159 |
logging.error(f"Error processing video: {e}")
|
|
|
6 |
from app.utils.file_utils import download_file, remove_temp_file, get_file_content
|
7 |
from app.utils.forgery_image_utils import detect_face
|
8 |
from app.utils.forgery_video_utils import extract_audio, extract_frames, compress_and_process_video, detect_speech # Adjust the import path if necessary
|
9 |
+
from app.services.deepfake_video_detection import DeepfakeVideoDetectionService
|
10 |
import os
|
11 |
+
import numpy as np
|
12 |
import logging
|
13 |
import traceback
|
14 |
from pydantic import BaseModel
|
|
|
23 |
face_manipulation_service = FaceManipulationService()
|
24 |
audio_deepfake_service = AudioDeepfakeService()
|
25 |
gan_detection_service = GANDetectionService()
|
26 |
+
deepfake_video_detection_service = DeepfakeVideoDetectionService()
|
27 |
+
|
28 |
|
29 |
def parse_confidence(value):
|
30 |
if isinstance(value, str):
|
|
|
89 |
logging.info(f"Image processing completed for: {firebase_filename}")
|
90 |
return results
|
91 |
|
92 |
+
def convert_to_python_types(obj):
    """Recursively convert numpy values inside *obj* to plain Python types.

    numpy scalars become Python scalars, numpy arrays become (nested) lists,
    dicts and lists/tuples are walked recursively (tuples come back as lists),
    and anything else is returned unchanged.
    """
    if isinstance(obj, np.ndarray):
        return obj.tolist()
    if isinstance(obj, np.generic):
        return obj.item()
    if isinstance(obj, dict):
        return {k: convert_to_python_types(v) for k, v in obj.items()}
    if isinstance(obj, (list, tuple)):
        return [convert_to_python_types(x) for x in obj]
    return obj
|
102 |
+
|
103 |
async def process_video(firebase_filename: str):
|
104 |
logging.info(f"Starting video processing for: {firebase_filename}")
|
105 |
try:
|
|
|
114 |
audio_content = get_file_content(audio_filename)
|
115 |
if detect_speech(audio_content):
|
116 |
logging.info("Speech detected in the audio")
|
117 |
+
# Audio deepfake detection logic here if needed
|
|
|
118 |
else:
|
119 |
logging.info("No speech detected in the audio")
|
120 |
await remove_temp_file(audio_filename)
|
121 |
logging.info(f"Temporary audio file removed: {audio_filename}")
|
122 |
else:
|
123 |
+
logging.info("No audio detected or extracted from the video")
|
124 |
|
125 |
results = {"is_audio_deepfake": is_audio_deepfake}
|
126 |
|
|
|
128 |
logging.info(f"Frames extracted: {len(frames)} frames")
|
129 |
|
130 |
results.update({
|
131 |
+
"image_manipulation": {
|
132 |
+
"collective_detection": False,
|
133 |
+
"collective_confidence": 0.0
|
134 |
+
},
|
135 |
+
"face_manipulation": None,
|
136 |
+
"gan_detection": {
|
137 |
+
"collective_detection": False,
|
138 |
+
"collective_confidence": 0.0
|
139 |
+
}
|
140 |
})
|
141 |
|
142 |
face_frames = []
|
143 |
+
img_manip_detections = []
|
144 |
+
img_manip_confidences = []
|
145 |
+
gan_detections = []
|
146 |
+
gan_confidences = []
|
|
|
|
|
|
|
|
|
|
|
147 |
|
148 |
+
for frame in frames:
|
149 |
+
frame_content = get_file_content(frame)
|
150 |
+
has_face = detect_face(frame_content)
|
151 |
if has_face:
|
152 |
+
face_frames.append(frame)
|
153 |
+
|
154 |
+
img_manip_result = image_manipulation_service.detect_manipulation(frame)
|
155 |
+
gan_result = gan_detection_service.detect_gan(frame)
|
156 |
+
|
157 |
+
img_manip_detections.append(img_manip_result.get("is_manipulated", False))
|
158 |
+
img_manip_confidences.append(parse_confidence(img_manip_result.get("confidence", "0%")))
|
159 |
+
gan_detections.append(gan_result.get("is_gan", False))
|
160 |
+
gan_confidences.append(parse_confidence(gan_result.get("confidence", "0%")))
|
161 |
+
|
162 |
+
# Aggregate results for image manipulation and GAN detection
|
163 |
+
results["image_manipulation"]["collective_detection"] = any(img_manip_detections)
|
164 |
+
results["image_manipulation"]["collective_confidence"] = sum(img_manip_confidences) / len(img_manip_confidences) if img_manip_confidences else 0.0
|
165 |
+
|
166 |
+
results["gan_detection"]["collective_detection"] = any(gan_detections)
|
167 |
+
results["gan_detection"]["collective_confidence"] = sum(gan_confidences) / len(gan_confidences) if gan_confidences else 0.0
|
168 |
+
|
169 |
+
# Perform deepfake detection if faces were detected
|
170 |
+
if face_frames:
|
171 |
+
deepfake_result = deepfake_video_detection_service.detect_deepfake(face_frames)
|
172 |
+
deepfake_result = convert_to_python_types(deepfake_result)
|
173 |
+
results["face_manipulation"] = {
|
174 |
+
"collective_detection": bool(deepfake_result["is_deepfake"]),
|
175 |
+
"collective_confidence": deepfake_result['confidence']
|
176 |
+
}
|
177 |
+
|
178 |
logging.info(f"Aggregated results: {results}")
|
179 |
|
180 |
await remove_temp_file(compressed_video_filename)
|
181 |
+
for frame in frames:
|
182 |
+
await remove_temp_file(frame)
|
183 |
+
logging.info(f"Temporary files removed")
|
184 |
logging.info(f"Video processing completed for: {firebase_filename}")
|
185 |
+
|
186 |
return results
|
187 |
except Exception as e:
|
188 |
logging.error(f"Error processing video: {e}")
|
app/services/deepfake_video_detection.py
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import tensorflow as tf
|
2 |
+
import numpy as np
|
3 |
+
import cv2
|
4 |
+
from app.utils.file_utils import get_file_content
|
5 |
+
import io
|
6 |
+
|
7 |
+
class DeepfakeVideoDetectionService:
    """Scores video frames for deepfake content with a pretrained Keras model.

    The model is loaded once at construction and reused across calls. Frames
    are preprocessed with the Xception pipeline, so the checkpoint is
    presumably an Xception-based classifier emitting a single fake-probability
    per frame (TODO confirm against the training code).
    """

    def __init__(self):
        # Forward-slash path is portable and avoids the invalid "\d" escape
        # that the backslash form ("models\deepfake_videos.h5") produced.
        self.model = tf.keras.models.load_model("models/deepfake_videos.h5")

    def process_frame(self, frame):
        """Prepare one decoded BGR frame for prediction.

        Resizes to 224x224, converts BGR -> RGB, applies Xception
        preprocessing, and returns a (1, 224, 224, 3) float32 batch.
        """
        frame = cv2.resize(frame, (224, 224))
        frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        frame = tf.keras.applications.xception.preprocess_input(
            tf.convert_to_tensor(frame, dtype=tf.float32))
        return np.expand_dims(frame, axis=0)

    def calculate_weighted_average(self, predictions, threshold=0.5):
        """Aggregate per-frame scores, emphasizing frames above *threshold*.

        Frames scoring above the threshold are weighted by their margin over
        it; if no frame exceeds the threshold, falls back to the plain mean.
        """
        weights = np.maximum(predictions - threshold, 0)
        if np.sum(weights) == 0:
            return np.mean(predictions)
        return np.average(predictions, weights=weights)

    def detect_deepfake(self, frame_filenames):
        """Score each frame file and aggregate into a deepfake verdict.

        Args:
            frame_filenames: filenames resolvable by ``get_file_content``,
                each containing one encoded image.

        Returns:
            dict with ``is_deepfake`` (bool), ``confidence``,
            ``max_confidence``, ``min_confidence`` (floats) and
            ``frames_analyzed`` (int). All values are plain Python types.
        """
        if not frame_filenames:
            # Guard: np.max/np.min raise on an empty array; report a benign
            # "nothing analyzed" result instead of crashing the pipeline.
            return {
                "is_deepfake": False,
                "confidence": 0.0,
                "max_confidence": 0.0,
                "min_confidence": 0.0,
                "frames_analyzed": 0,
            }

        predictions = []
        for filename in frame_filenames:
            frame_content = get_file_content(filename)
            frame = cv2.imdecode(
                np.frombuffer(frame_content, np.uint8), cv2.IMREAD_COLOR)
            processed_frame = self.process_frame(frame)
            predictions.append(
                float(self.model.predict(processed_frame, verbose=0)[0][0]))

        predictions = np.array(predictions)
        weighted_avg_confidence = self.calculate_weighted_average(predictions)

        return {
            # bool() so the value is JSON-serializable (np.bool_ is not).
            "is_deepfake": bool(weighted_avg_confidence > 0.5),
            "confidence": float(weighted_avg_confidence),
            "max_confidence": float(np.max(predictions)),
            "min_confidence": float(np.min(predictions)),
            "frames_analyzed": len(predictions),
        }
|
models/deepfake_videos.h5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab66e33cd80e38b3642994c16a271af3b2519ae1e189a792014e6607cb57beed
|
3 |
+
size 149835704
|