Merge d4905c6bd9 into 9086072b8e

Fix: Prevent per-frame source image reload in live preview.
- Modified `update_webcam_frame_after` in `modules/ui.py` to use the source_image passed from `create_webcam_preview` without attempting to reload it on every frame if it was initially None. - This fixes an FPS drop regression that occurred when starting the live preview with a problematic or non-existent source image.
2025-06-27 17:56:07 -03:00 · 2025-06-27 20:33:44 +00:00 · 2025-06-27 20:25:26 +00:00 · 2025-06-27 19:25:06 +00:00
2 changed files with 195 additions and 101 deletions
--- a/modules/ui.py
+++ b/modules/ui.py
@ -880,84 +880,119 @@ def create_webcam_preview(camera_index: int):
    PREVIEW.deiconify()

    frame_processors = get_frame_processors_modules(modules.globals.frame_processors)
+    # Get initial source image if not mapping faces
    source_image = None
-    prev_time = time.time()
-    fps_update_interval = 0.5
-    frame_count = 0
-    fps = 0
+    if not modules.globals.map_faces and modules.globals.source_path:
+        try:
+            loaded_cv_image = cv2.imread(modules.globals.source_path)
+            if loaded_cv_image is None:
+                update_status(f"Error: Could not read source image at {modules.globals.source_path}")
+                # source_image remains None
+            else:
+                source_image = get_one_face(loaded_cv_image)
+                if source_image is None:
+                    update_status(f"Error: No face detected in source image {os.path.basename(modules.globals.source_path)}")
+        except Exception as e:
+            update_status(f"Exception loading source image: {str(e)[:100]}")
+            source_image = None # Ensure source_image is None on any error

-    while True:
-        ret, frame = cap.read()
-        if not ret:
-            break
+    # If source_image is still None AND a source_path was provided (meaning user intended a swap)
+    # AND we are not using map_faces (which handles its own source logic for sources)
+    if source_image is None and modules.globals.source_path and not modules.globals.map_faces:
+        update_status("Warning: Live preview started, but source image is invalid or has no face. No swap will occur.")
+        # The live preview will start, but no swap will occur if source_image is None.

-        temp_frame = frame.copy()
+    # Start the update loop
+    fps_data = { # Moved fps_data initialization here to be passed to the loop
+        "prev_time": time.time(),
+        "frame_count": 0,
+        "fps": 0.0,
+        "fps_update_interval": 0.5
+    }
+    update_webcam_frame_after(cap, frame_processors, source_image, fps_data)

-        if modules.globals.live_mirror:
-            temp_frame = cv2.flip(temp_frame, 1)

-        if modules.globals.live_resizable:
-            temp_frame = fit_image_to_size(
-                temp_frame, PREVIEW.winfo_width(), PREVIEW.winfo_height()
-            )
+def update_webcam_frame_after(cap, frame_processors, source_image, fps_data, delay_ms=15): # Approx 66 FPS target for UI updates
+    global preview_label, ROOT, PREVIEW

-        else:
-            temp_frame = fit_image_to_size(
-                temp_frame, PREVIEW.winfo_width(), PREVIEW.winfo_height()
-            )
+    if PREVIEW.state() == "withdrawn":
+        cap.release()
+        PREVIEW.withdraw() # Ensure it's withdrawn if loop exits
+        return

-        if not modules.globals.map_faces:
-            if source_image is None and modules.globals.source_path:
-                source_image = get_one_face(cv2.imread(modules.globals.source_path))
+    ret, frame = cap.read()
+    if not ret:
+        # Handle camera read failure or end of stream (though for webcam, it's usually continuous)
+        ROOT.after(delay_ms, lambda: update_webcam_frame_after(cap, frame_processors, source_image, fps_data, delay_ms))
+        return

-            for frame_processor in frame_processors:
-                if frame_processor.NAME == "DLC.FACE-ENHANCER":
-                    if modules.globals.fp_ui["face_enhancer"]:
-                        temp_frame = frame_processor.process_frame(None, temp_frame)
-                else:
-                    temp_frame = frame_processor.process_frame(source_image, temp_frame)
-        else:
-            modules.globals.target_path = None
-            for frame_processor in frame_processors:
-                if frame_processor.NAME == "DLC.FACE-ENHANCER":
-                    if modules.globals.fp_ui["face_enhancer"]:
-                        temp_frame = frame_processor.process_frame_v2(temp_frame)
-                else:
+    temp_frame = frame.copy()
+
+    if modules.globals.live_mirror:
+        temp_frame = cv2.flip(temp_frame, 1)
+
+    # Resizing based on PREVIEW window dimensions.
+    preview_width = PREVIEW.winfo_width()
+    preview_height = PREVIEW.winfo_height()
+    if preview_width > 1 and preview_height > 1: # Ensure valid dimensions
+         temp_frame = fit_image_to_size(temp_frame, preview_width, preview_height)
+
+
+    if not modules.globals.map_faces:
+        # current_source_image is the source_image passed in from create_webcam_preview
+        # It's determined once before the loop starts. No reloading here.
+        current_source_image = source_image
+
+        for frame_processor in frame_processors:
+            if frame_processor.NAME == "DLC.FACE-ENHANCER":
+                if modules.globals.fp_ui["face_enhancer"]:
+                    temp_frame = frame_processor.process_frame(None, temp_frame)
+            else: # This is the face_swapper processor or other default
+                if current_source_image: # Only process if source_image (from create_webcam_preview) is valid
+                    temp_frame = frame_processor.process_frame(current_source_image, temp_frame)
+                # If current_source_image is None, the frame is not processed by face_swapper, effectively no swap.
+    else:
+        modules.globals.target_path = None
+        for frame_processor in frame_processors:
+            if frame_processor.NAME == "DLC.FACE-ENHANCER":
+                if modules.globals.fp_ui["face_enhancer"]:
                    temp_frame = frame_processor.process_frame_v2(temp_frame)
+            else:
+                temp_frame = frame_processor.process_frame_v2(temp_frame)

-        # Calculate and display FPS
-        current_time = time.time()
-        frame_count += 1
-        if current_time - prev_time >= fps_update_interval:
-            fps = frame_count / (current_time - prev_time)
-            frame_count = 0
-            prev_time = current_time
+    current_time = time.time()
+    fps_data["frame_count"] += 1
+    time_diff = current_time - fps_data["prev_time"]

-        if modules.globals.show_fps:
-            cv2.putText(
-                temp_frame,
-                f"FPS: {fps:.1f}",
-                (10, 30),
-                cv2.FONT_HERSHEY_SIMPLEX,
-                1,
-                (0, 255, 0),
-                2,
-            )
+    if time_diff >= fps_data.get("fps_update_interval", 0.5):
+        fps_data["fps"] = fps_data["frame_count"] / time_diff
+        fps_data["frame_count"] = 0
+        fps_data["prev_time"] = current_time

-        image = cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB)
-        image = Image.fromarray(image)
-        image = ImageOps.contain(
-            image, (temp_frame.shape[1], temp_frame.shape[0]), Image.LANCZOS
+    if modules.globals.show_fps:
+        cv2.putText(
+            temp_frame,
+            f"FPS: {fps_data['fps']:.1f}",
+            (10, 30),
+            cv2.FONT_HERSHEY_SIMPLEX,
+            1,
+            (0, 255, 0),
+            2,
        )
-        image = ctk.CTkImage(image, size=image.size)
-        preview_label.configure(image=image)
-        ROOT.update()

-        if PREVIEW.state() == "withdrawn":
-            break
+    if temp_frame is not None and temp_frame.size > 0:
+        image = cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB)
+        pil_image = Image.fromarray(image)

-    cap.release()
-    PREVIEW.withdraw()
+        contained_image = ImageOps.contain(
+            pil_image, (temp_frame.shape[1], temp_frame.shape[0]), Image.LANCZOS
+        )
+        ctk_image = ctk.CTkImage(contained_image, size=contained_image.size)
+        preview_label.configure(image=ctk_image)
+    else:
+        pass
+
+    ROOT.after(delay_ms, lambda: update_webcam_frame_after(cap, frame_processors, source_image, fps_data, delay_ms))


 def create_source_target_popup_for_webcam(
--- a/modules/video_capture.py
+++ b/modules/video_capture.py
@ -12,83 +12,142 @@ if platform.system() == "Windows":
 class VideoCapturer:
    def __init__(self, device_index: int):
        self.device_index = device_index
-        self.frame_callback = None
-        self._current_frame = None
-        self._frame_ready = threading.Event()
+        self._latest_frame: Optional[np.ndarray] = None
+        self._frame_lock = threading.Lock()
        self.is_running = False
-        self.cap = None
+        self.cap: Optional[cv2.VideoCapture] = None
+        self._capture_thread: Optional[threading.Thread] = None

        # Initialize Windows-specific components if on Windows
        if platform.system() == "Windows":
-            self.graph = FilterGraph()
-            # Verify device exists
-            devices = self.graph.get_input_devices()
-            if self.device_index >= len(devices):
-                raise ValueError(
-                    f"Invalid device index {device_index}. Available devices: {len(devices)}"
-                )
+            try:
+                self.graph = FilterGraph()
+                # Verify device exists
+                devices = self.graph.get_input_devices()
+                if self.device_index >= len(devices):
+                    # Fallback or logging, rather than immediate raise for flexibility
+                    print(f"Warning: Device index {device_index} might be out of range. Available: {len(devices)}. Will attempt to open anyway.")
+            except Exception as e:
+                print(f"Warning: Could not initialize FilterGraph for device enumeration: {e}")
+                self.graph = None
+
+
+    def _capture_loop(self) -> None:
+        while self.is_running and self.cap is not None:
+            try:
+                ret, frame = self.cap.read()
+                if ret:
+                    with self._frame_lock:
+                        self._latest_frame = frame
+                else:
+                    # Handle camera read failure, e.g., camera disconnected
+                    print("Warning: Failed to read frame from camera in capture loop.")
+                    # Small sleep to prevent tight loop on continuous read errors
+                    threading.Event().wait(0.1)
+            except Exception as e:
+                print(f"Error in capture loop: {e}")
+                self.is_running = False # Stop loop on critical error
+                break
+            # Small sleep to yield execution and not busy-wait if camera FPS is low
+            # Adjust sleep time as needed; too high adds latency, too low uses more CPU.
+            threading.Event().wait(0.001) # 1 ms sleep

    def start(self, width: int = 960, height: int = 540, fps: int = 60) -> bool:
-        """Initialize and start video capture"""
+        """Initialize and start video capture in a separate thread."""
+        if self.is_running:
+            print("Capture already running.")
+            return True
        try:
            if platform.system() == "Windows":
-                # Windows-specific capture methods
                capture_methods = [
-                    (self.device_index, cv2.CAP_DSHOW),  # Try DirectShow first
-                    (self.device_index, cv2.CAP_ANY),  # Then try default backend
-                    (-1, cv2.CAP_ANY),  # Try -1 as fallback
-                    (0, cv2.CAP_ANY),  # Finally try 0 without specific backend
+                    (self.device_index, cv2.CAP_DSHOW),
+                    (self.device_index, cv2.CAP_MSMF),
+                    (self.device_index, cv2.CAP_ANY),
+                    (-1, cv2.CAP_ANY),
+                    (0, cv2.CAP_ANY)
                ]
-
                for dev_id, backend in capture_methods:
                    try:
                        self.cap = cv2.VideoCapture(dev_id, backend)
-                        if self.cap.isOpened():
+                        if self.cap and self.cap.isOpened():
+                            print(f"Successfully opened camera {dev_id} with backend {backend}")
                            break
-                        self.cap.release()
+                        if self.cap:
+                            self.cap.release()
+                            self.cap = None
                    except Exception:
                        continue
-            else:
-                # Unix-like systems (Linux/Mac) capture method
+            else: # Unix-like
                self.cap = cv2.VideoCapture(self.device_index)

            if not self.cap or not self.cap.isOpened():
-                raise RuntimeError("Failed to open camera")
+                raise RuntimeError(f"Failed to open camera with device index {self.device_index} using available methods.")

            # Configure format
+            # Note: Setting properties might not always work or might reset after opening.
+            # It's often better to request a format the camera natively supports if known.
            self.cap.set(cv2.CAP_PROP_FRAME_WIDTH, width)
            self.cap.set(cv2.CAP_PROP_FRAME_HEIGHT, height)
            self.cap.set(cv2.CAP_PROP_FPS, fps)

+            # Verify settings if possible (actual values might differ)
+            actual_width = self.cap.get(cv2.CAP_PROP_FRAME_WIDTH)
+            actual_height = self.cap.get(cv2.CAP_PROP_FRAME_HEIGHT)
+            actual_fps = self.cap.get(cv2.CAP_PROP_FPS)
+            print(f"Requested: {width}x{height}@{fps}fps. Actual: {actual_width}x{actual_height}@{actual_fps}fps")
+
+
            self.is_running = True
+            self._capture_thread = threading.Thread(target=self._capture_loop, daemon=True)
+            self._capture_thread.start()
+
+            # Wait briefly for the first frame to be captured, makes initial read() more likely to succeed.
+            # This is optional and can be adjusted or removed.
+            threading.Event().wait(0.5) # Wait up to 0.5 seconds
+
            return True

        except Exception as e:
            print(f"Failed to start capture: {str(e)}")
            if self.cap:
                self.cap.release()
+                self.cap = None
+            self.is_running = False
            return False

    def read(self) -> Tuple[bool, Optional[np.ndarray]]:
-        """Read a frame from the camera"""
-        if not self.is_running or self.cap is None:
+        """Read the latest frame from the camera (non-blocking)."""
+        if not self.is_running:
            return False, None

-        ret, frame = self.cap.read()
-        if ret:
-            self._current_frame = frame
-            if self.frame_callback:
-                self.frame_callback(frame)
-            return True, frame
-        return False, None
+        frame_copy = None
+        with self._frame_lock:
+            if self._latest_frame is not None:
+                frame_copy = self._latest_frame.copy()
+
+        if frame_copy is not None:
+            return True, frame_copy
+        else:
+            # No frame available yet, or thread stopped
+            return False, None

    def release(self) -> None:
-        """Stop capture and release resources"""
-        if self.is_running and self.cap is not None:
+        """Stop capture thread and release resources."""
+        if self.is_running:
+            self.is_running = False # Signal the thread to stop
+            if self._capture_thread is not None:
+                self._capture_thread.join(timeout=1.0) # Wait for thread to finish
+                if self._capture_thread.is_alive():
+                    print("Warning: Capture thread did not terminate cleanly.")
+            self._capture_thread = None
+
+        if self.cap is not None:
            self.cap.release()
-            self.is_running = False
            self.cap = None

-    def set_frame_callback(self, callback: Callable[[np.ndarray], None]) -> None:
-        """Set callback for frame processing"""
-        self.frame_callback = callback
+        with self._frame_lock: # Clear last frame
+            self._latest_frame = None
+        print("Video capture released.")
+
+    # frame_callback is removed as direct polling via read() is now non-blocking and preferred with threaded capture.
+    # If a callback mechanism is still desired, it would need to be integrated carefully with the thread.
Author	SHA1	Message	Date
netmirror-apple9	7874cfe868	Merge `d4905c6bd9` into `9086072b8e`	2025-06-27 17:56:07 -03:00
google-labs-jules[bot]	d4905c6bd9	Fix: Prevent per-frame source image reload in live preview. - Modified `update_webcam_frame_after` in `modules/ui.py` to use the source_image passed from `create_webcam_preview` without attempting to reload it on every frame if it was initially None. - This fixes an FPS drop regression that occurred when starting the live preview with a problematic or non-existent source image.	2025-06-27 20:33:44 +00:00
google-labs-jules[bot]	d00af5a995	Fix: Prevent immediate stop/crash in live preview if source image is invalid. - Modified `create_webcam_preview` in `modules/ui.py` to handle errors during source image loading (e.g., file not readable, no face detected) more gracefully. - Instead of stopping the live preview, it now shows a warning message and starts the live camera feed without face swapping if the source image is unusable. - This addresses the issue where clicking 'Live' after selecting a problematic source image would cause the preview to stop or crash immediately.	2025-06-27 20:25:26 +00:00
google-labs-jules[bot]	eb33df659b	Consolidate all recent enhancements and fixes. This commit includes: - Refactored modules/ui.py: Live webcam preview loop now uses ROOT.after() for better UI responsiveness and potentially smoother external capture. - Refactored modules/video_capture.py: Implemented threaded, non-blocking frame reads for improved camera capture performance and stability. - Feature: Ear preservation for Poisson blending to reduce artifacts (controlled by --preserve-ears and related globals). - Feature: Histogram-based color correction (--color-correction). - Feature: Poisson blending for smoother face integration (--poisson-blending). These changes aim to improve overall swap quality, UI stability, and address reported FPS issues with external capture tools like SplitCam.	2025-06-27 19:25:06 +00:00