Spaces:

truens66
/

deepfake-video-detector

Running

App Files Files Community

truens66 commited on Feb 5

Commit

9797501

verified ·

1 Parent(s): fa179db

Update app.py

Browse files

Files changed (1) hide show

app.py +171 -80

app.py CHANGED Viewed

@@ -124,103 +124,194 @@ import numpy as np
 import mediapipe as mp
 from torchvision import models, transforms
 from tempfile import NamedTemporaryFile
-# Initialize MediaPipe Face Detection and Face Mesh
-mp_face_detection = mp.solutions.face_detection
-mp_face_mesh = mp.solutions.face_mesh
-face_detection = mp_face_detection.FaceDetection(model_selection=1, min_detection_confidence=0.5)
-face_mesh = mp_face_mesh.FaceMesh(static_image_mode=False, max_num_faces=1, min_detection_confidence=0.5)
-# Initialize ResNet-34 model with random weights
-def create_model():
-    model = models.resnet34(pretrained=False)
-    model.fc = torch.nn.Linear(model.fc.in_features, 2)
-    return model
-model = create_model()
-model.eval()
-# Define transformation for face images
-transform = transforms.Compose([
-    transforms.ToPILImage(),
-    transforms.Resize((224, 224)),
-    transforms.ToTensor(),
-    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
-])
-def get_face_bbox(landmarks, frame_shape):
-    h, w = frame_shape[:2]
-    xs = [lm.x * w for lm in landmarks.landmark]
-    ys = [lm.y * h for lm in landmarks.landmark]
-    return int(min(xs)), int(min(ys)), int(max(xs)), int(max(ys))
-def process_video(video_path: str):
-    cap = cv2.VideoCapture(video_path)
-    width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
-    height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
-    fps = int(cap.get(cv2.CAP_PROP_FPS))
-    output_path = video_path.replace(".mp4", "_processed.mp4")
-    output_video = cv2.VideoWriter(output_path, cv2.VideoWriter_fourcc(*'mp4v'), fps, (width, height))
-    while cap.isOpened():
-        ret, frame = cap.read()
-        if not ret:
-            break
         rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
-        # Face detection
-        results = face_detection.process(rgb_frame)
-        if results.detections:
-            for detection in results.detections:
-                # Get face landmarks
-                mesh_results = face_mesh.process(rgb_frame)
-                if mesh_results.multi_face_landmarks:
-                    for face_landmarks in mesh_results.multi_face_landmarks:
-                        x_min, y_min, x_max, y_max = get_face_bbox(face_landmarks, frame.shape)
-                        face_crop = rgb_frame[y_min:y_max, x_min:x_max]
-                        if face_crop.size == 0:
-                            continue
-                        face_tensor = transform(face_crop).unsqueeze(0)
-                        with torch.no_grad():
-                            output = torch.softmax(model(face_tensor), dim=1)
-                            fake_confidence = output[0, 1].item() * 100
-                            label = "Fake" if fake_confidence > 50 else "Real"
-                            color = (0, 0, 255) if label == "Fake" else (0, 255, 0)
-                            label_text = f"{label} ({fake_confidence:.2f}%)"
-                        cv2.rectangle(frame, (x_min, y_min), (x_max, y_max), color, 2)
-                        cv2.putText(frame, label_text, (x_min, y_min - 10),
-                                  cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 1)
-        output_video.write(frame)
-    cap.release()
-    output_video.release()
-    return output_path
 def gradio_interface(video_file):
     if video_file is None:
         return "Error: No video uploaded."
     with NamedTemporaryFile(delete=False, suffix=".mp4") as temp_file:
         temp_file_path = temp_file.name
         with open(video_file, "rb") as uploaded_file:
             temp_file.write(uploaded_file.read())
-    output_path = process_video(temp_file_path)
     return output_path
 iface = gr.Interface(
     fn=gradio_interface,
     inputs=gr.Video(label="Upload Video"),
     outputs=gr.Video(label="Processed Video"),
     title="Deepfake Detection",
-    description="Upload a video to detect deepfakes using MediaPipe face detection and ResNet-34 model."
 )
 if __name__ == "__main__":
-    iface.launch()

 import mediapipe as mp
 from torchvision import models, transforms
 from tempfile import NamedTemporaryFile
+from pathlib import Path
+import logging
+from typing import Tuple, Optional
+# Set up logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+class DeepfakeDetector:
+    def __init__(self, detection_confidence: float = 0.5, max_faces: int = 1):
+        """Initialize the DeepfakeDetector with MediaPipe and ResNet model."""
+        self.mp_face_detection = mp.solutions.face_detection
+        self.mp_face_mesh = mp.solutions.face_mesh
+        # Initialize face detection and mesh
+        self.face_detection = self.mp_face_detection.FaceDetection(
+            model_selection=1,
+            min_detection_confidence=detection_confidence
+        )
+        self.face_mesh = self.mp_face_mesh.FaceMesh(
+            static_image_mode=False,
+            max_num_faces=max_faces,
+            min_detection_confidence=detection_confidence
+        )
+        # Initialize model and transform
+        self.model = self._create_model()
+        self.transform = self._create_transform()
+    @staticmethod
+    def _create_model() -> torch.nn.Module:
+        """Create and configure the ResNet model."""
+        model = models.resnet34(weights=None)
+        model.fc = torch.nn.Linear(model.fc.in_features, 2)
+        model.eval()
+        return model
+    @staticmethod
+    def _create_transform() -> transforms.Compose:
+        """Create the image transformation pipeline."""
+        return transforms.Compose([
+            transforms.ToPILImage(),
+            transforms.Resize((224, 224)),
+            transforms.ToTensor(),
+            transforms.Normalize(
+                mean=[0.485, 0.456, 0.406],
+                std=[0.229, 0.224, 0.225]
+            )
+        ])
+    def get_face_bbox(self, landmarks, frame_shape: Tuple[int, int]) -> Tuple[int, int, int, int]:
+        """Extract face bounding box from landmarks."""
+        h, w = frame_shape[:2]
+        xs = [lm.x * w for lm in landmarks.landmark]
+        ys = [lm.y * h for lm in landmarks.landmark]
+        return (
+            max(0, int(min(xs))),
+            max(0, int(min(ys))),
+            min(w, int(max(xs))),
+            min(h, int(max(ys)))
+        )
+    def process_frame(self, frame: np.ndarray) -> np.ndarray:
+        """Process a single frame to detect deepfakes."""
         rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
+        # Detect faces
+        detection_results = self.face_detection.process(rgb_frame)
+        if not detection_results.detections:
+            return frame
+        # Process each detected face
+        for detection in detection_results.detections:
+            mesh_results = self.face_mesh.process(rgb_frame)
+            if not mesh_results.multi_face_landmarks:
+                continue
+            for face_landmarks in mesh_results.multi_face_landmarks:
+                frame = self._analyze_face(frame, rgb_frame, face_landmarks)
+        return frame
+    def _analyze_face(self, frame: np.ndarray, rgb_frame: np.ndarray,
+                     face_landmarks) -> np.ndarray:
+        """Analyze a single face and draw results on frame."""
+        # Get face bbox
+        x_min, y_min, x_max, y_max = self.get_face_bbox(
+            face_landmarks, frame.shape
+        )
+        # Crop and transform face
+        face_crop = rgb_frame[y_min:y_max, x_min:x_max]
+        if face_crop.size == 0:
+            return frame
+        # Run inference
+        try:
+            face_tensor = self.transform(face_crop).unsqueeze(0)
+            with torch.no_grad():
+                output = torch.softmax(self.model(face_tensor), dim=1)
+                fake_confidence = output[0, 1].item() * 100
+        except Exception as e:
+            logger.error(f"Error during inference: {str(e)}")
+            return frame
+        # Draw results
+        label = "Fake" if fake_confidence > 50 else "Real"
+        color = (0, 0, 255) if label == "Fake" else (0, 255, 0)
+        label_text = f"{label} ({fake_confidence:.2f}%)"
+        cv2.rectangle(frame, (x_min, y_min), (x_max, y_max), color, 2)
+        cv2.putText(frame, label_text, (x_min, y_min - 10),
+                   cv2.FONT_HERSHEY_SIMPLEX, 0.5, color, 1)
+        return frame
+    def process_video(self, video_path: str) -> Optional[str]:
+        """Process a video file and return path to processed video."""
+        try:
+            cap = cv2.VideoCapture(video_path)
+            if not cap.isOpened():
+                logger.error("Error opening video file")
+                return None
+            # Get video properties
+            width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+            height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+            fps = int(cap.get(cv2.CAP_PROP_FPS))
+            # Set up output video
+            output_path = str(Path(video_path).with_suffix('')) + "_processed.mp4"
+            output_video = cv2.VideoWriter(
+                output_path,
+                cv2.VideoWriter_fourcc(*'mp4v'),
+                fps,
+                (width, height)
+            )
+            # Process frames
+            while cap.isOpened():
+                ret, frame = cap.read()
+                if not ret:
+                    break
+                processed_frame = self.process_frame(frame)
+                output_video.write(processed_frame)
+            # Clean up
+            cap.release()
+            output_video.release()
+            return output_path
+        except Exception as e:
+            logger.error(f"Error processing video: {str(e)}")
+            return None
 def gradio_interface(video_file):
+    """Gradio interface function."""
     if video_file is None:
         return "Error: No video uploaded."
+    detector = DeepfakeDetector()
     with NamedTemporaryFile(delete=False, suffix=".mp4") as temp_file:
         temp_file_path = temp_file.name
         with open(video_file, "rb") as uploaded_file:
             temp_file.write(uploaded_file.read())
+    output_path = detector.process_video(temp_file_path)
+    if output_path is None:
+        return "Error processing video"
     return output_path
+# Create Gradio interface
 iface = gr.Interface(
     fn=gradio_interface,
     inputs=gr.Video(label="Upload Video"),
     outputs=gr.Video(label="Processed Video"),
     title="Deepfake Detection",
+    description="Upload a video to detect deepfakes using MediaPipe face detection and ResNet-34 model.",
+    examples=[],  # Add example videos here if available
 )
 if __name__ == "__main__":
+    iface.launch(
+        server_name="0.0.0.0",
+        share=True,  # Set to True to create a public link
+        debug=True
+    )