fix(face_swapper): replacing with new code

2024-10-24 00:55:18 +05:30 · 2024-10-24 00:55:18 +05:30 · f2894470a7
parent d616c513c9
commit f2894470a7
1 changed files with 93 additions and 45 deletions
--- a/modules/processors/frame/face_swapper.py
+++ b/modules/processors/frame/face_swapper.py
@@ -1,8 +1,8 @@
-from typing import Any, List, Tuple
+from typing import Any, List, Tuple, Optional
 import cv2
-import numpy as np
 import insightface
 import threading
+import numpy as np

 import modules.globals
 import modules.processors.frame.core
@@ -20,11 +20,7 @@ from modules.cluster_analysis import find_closest_centroid
 FACE_SWAPPER = None
 THREAD_LOCK = threading.Lock()
 NAME = "DLC.FACE-SWAPPER"
-
-# Add mouth landmarks indices for masking
-MOUTH_LANDMARKS = list(
-    range(46, 68)
-)  # Common indices for mouth landmarks in facial detection
+BLUR_AMOUNT = 12


 def pre_check() -> bool:
@@ -67,47 +63,105 @@ def get_face_swapper() -> Any:
    return FACE_SWAPPER


-def create_mouth_mask(face: Face, frame_shape: Tuple[int, int]) -> np.ndarray:
-    """Create a mask for the mouth region"""
-    mask = np.zeros(frame_shape[:2], dtype=np.uint8)
-
-    # Get mouth landmarks from the face
-    landmarks = face.kps
-    mouth_points = landmarks[MOUTH_LANDMARKS].astype(np.int32)
-
-    # Create a polygon around the mouth region
-    cv2.fillPoly(mask, [mouth_points], 255)
-
-    # Dilate the mask slightly to ensure smooth blending
-    kernel = np.ones((5, 5), np.uint8)
-    mask = cv2.dilate(mask, kernel, iterations=2)
-
-    # Blur the mask edges
-    mask = cv2.GaussianBlur(mask, (15, 15), 10)
-
+def create_face_mask(face: Face, frame: Frame) -> np.ndarray:
+    """Create a binary mask for the face region."""
+    mask = np.zeros(frame.shape[:2], dtype=np.uint8)
+    landmarks = face.landmark_2d_106
+    if landmarks is not None:
+        hull = cv2.convexHull(landmarks.astype(np.int32))
+        cv2.fillConvexPoly(mask, hull, 255)
    return mask


-def blend_with_mask(
-    swapped_frame: Frame, original_frame: Frame, mask: np.ndarray
-) -> Frame:
-    """Blend the swapped face with the original frame using the mouth mask"""
-    mask_3channel = cv2.cvtColor(mask, cv2.COLOR_GRAY2BGR) / 255.0
+def create_lower_mouth_mask(
+    face: Face, frame: Frame
+) -> Tuple[np.ndarray, np.ndarray, Tuple[int, int, int, int], np.ndarray]:
+    """Create a mask for the lower mouth region."""
+    mask = np.zeros(frame.shape[:2], dtype=np.uint8)
+    landmarks = face.landmark_2d_106

-    # Blend the images based on the mask
-    blended = swapped_frame * (1 - mask_3channel) + original_frame * mask_3channel
-    return blended.astype(np.uint8)
+    if landmarks is not None:
+        # Extract mouth landmarks
+        mouth_points = landmarks[84:96]  # Adjust indices based on your landmark format
+        lower_lip = mouth_points[6:12]  # Lower lip points
+
+        # Create polygon for lower mouth area
+        lower_lip_polygon = cv2.convexHull(lower_lip.astype(np.int32))
+        cv2.fillConvexPoly(mask, lower_lip_polygon, 255)
+
+        # Get bounding box
+        x, y, w, h = cv2.boundingRect(lower_lip_polygon)
+        mouth_box = (x, y, w, h)
+
+        # Extract the mouth region
+        mouth_cutout = frame[y : y + h, x : x + w].copy()
+
+        return mask, mouth_cutout, mouth_box, lower_lip_polygon
+
+    return None, None, None, None
+
+
+def apply_mouth_area(
+    frame: Frame,
+    mouth_cutout: np.ndarray,
+    mouth_box: Tuple[int, int, int, int],
+    face_mask: np.ndarray,
+    lower_lip_polygon: Optional[np.ndarray],
+) -> Frame:
+    """Apply the original mouth area back to the face-swapped frame."""
+    if mouth_cutout is None or mouth_box is None:
+        return frame
+
+    x, y, w, h = mouth_box
+
+    # Build a hard-edged mask of the mouth region; it is blurred further down
+    mask = np.zeros(frame.shape[:2], dtype=np.uint8)
+    if lower_lip_polygon is not None:
+        cv2.fillConvexPoly(mask, lower_lip_polygon, 255)
+    else:
+        mask[y : y + h, x : x + w] = 255
+
+    # Blur the mask
+    blurred_mask = cv2.GaussianBlur(mask, (BLUR_AMOUNT * 2 + 1, BLUR_AMOUNT * 2 + 1), 0)
+    blurred_mask = blurred_mask / 255.0
+
+    # Create 3-channel mask
+    blurred_mask_3channel = np.repeat(blurred_mask[:, :, np.newaxis], 3, axis=2)
+
+    # Paste the original mouth cutout into a copy of the swapped frame
+    frame_copy = frame.copy()
+    frame_copy[y : y + h, x : x + w] = mouth_cutout
+
+    # Combine using the blurred mask
+    result = (
+        frame_copy * blurred_mask_3channel + frame * (1 - blurred_mask_3channel)
+    ).astype(np.uint8)
+
+    return result


 def swap_face(source_face: Face, target_face: Face, temp_frame: Frame) -> Frame:
-    # Store the original frame for mouth preservation
-    original_frame = temp_frame.copy()
-
-    # Perform the face swap
-    swapped_frame = get_face_swapper().get(
+    face_swapper = get_face_swapper()
+    # Apply the face swap
+    swapped_frame = face_swapper.get(
        temp_frame, target_face, source_face, paste_back=True
    )

+    if modules.globals.mouth_mask:
+        # Create masks
+        face_mask = create_face_mask(target_face, temp_frame)
+        mouth_mask, mouth_cutout, mouth_box, lower_lip_polygon = (
+            create_lower_mouth_mask(target_face, temp_frame)
+        )
+
+        if mouth_mask is not None:
+            # Apply the mouth area preservation
+            swapped_frame = apply_mouth_area(
+                swapped_frame, mouth_cutout, mouth_box, face_mask, lower_lip_polygon
+            )
+
+    return swapped_frame
+

 def process_frame(source_face: Face, temp_frame: Frame) -> Frame:
    # Ensure the frame is in RGB format if color correction is enabled
@@ -123,6 +177,7 @@ def process_frame(source_face: Face, temp_frame: Frame) -> Frame:
        target_face = get_one_face(temp_frame)
        if target_face:
            temp_frame = swap_face(source_face, target_face, temp_frame)
+
    return temp_frame


@@ -133,7 +188,6 @@ def process_frame_v2(temp_frame: Frame, temp_frame_path: str = "") -> Frame:
            for map in modules.globals.souce_target_map:
                target_face = map["target"]["face"]
                temp_frame = swap_face(source_face, target_face, temp_frame)
-
        elif not modules.globals.many_faces:
            for map in modules.globals.souce_target_map:
                if "source" in map:
@@ -150,11 +204,9 @@ def process_frame_v2(temp_frame: Frame, temp_frame_path: str = "") -> Frame:
                    for f in map["target_faces_in_frame"]
                    if f["location"] == temp_frame_path
                ]
-
                for frame in target_frame:
                    for target_face in frame["faces"]:
                        temp_frame = swap_face(source_face, target_face, temp_frame)
-
        elif not modules.globals.many_faces:
            for map in modules.globals.souce_target_map:
                if "source" in map:
@@ -164,7 +216,6 @@ def process_frame_v2(temp_frame: Frame, temp_frame_path: str = "") -> Frame:
                        if f["location"] == temp_frame_path
                    ]
                    source_face = map["source"]["face"]
-
                    for frame in target_frame:
                        for target_face in frame["faces"]:
                            temp_frame = swap_face(source_face, target_face, temp_frame)
@@ -175,7 +226,6 @@ def process_frame_v2(temp_frame: Frame, temp_frame_path: str = "") -> Frame:
                source_face = default_source_face()
                for target_face in detected_faces:
                    temp_frame = swap_face(source_face, target_face, temp_frame)
-
        elif not modules.globals.many_faces:
            if detected_faces:
                if len(detected_faces) <= len(
@@ -186,7 +236,6 @@ def process_frame_v2(temp_frame: Frame, temp_frame_path: str = "") -> Frame:
                            modules.globals.simple_map["target_embeddings"],
                            detected_face.normed_embedding,
                        )
-
                        temp_frame = swap_face(
                            modules.globals.simple_map["source_faces"][
                                closest_centroid_index
@@ -205,7 +254,6 @@ def process_frame_v2(temp_frame: Frame, temp_frame_path: str = "") -> Frame:
                        closest_centroid_index, _ = find_closest_centroid(
                            detected_faces_centroids, target_embedding
                        )
-
                        temp_frame = swap_face(
                            modules.globals.simple_map["source_faces"][i],
                            detected_faces[closest_centroid_index],