Compare commits
	
		
			15 Commits 
		
	
	
		
			d581d05f2b
			...
			82fcd7916a
		
	
	| Author | SHA1 | Date | 
|---|---|---|
|  | 82fcd7916a | |
|  | 2d0c5bc8d0 | |
|  | 5708be40eb | |
|  | f08c81f22a | |
|  | 2faaecbe15 | |
|  | 53c72d6774 | |
|  | 98e7320237 | |
|  | 12d7ca8bad | |
|  | 133b2ac330 | |
|  | 57ac933dff | |
|  | 11c2717a1d | |
|  | 0c5bb269f2 | |
|  | 6a1f87dc69 | |
|  | 81c1a817cc | |
|  | feae2657c9 | 
|  | @ -42,11 +42,4 @@ mask_feather_ratio = 8 | |||
| mask_down_size = 0.50 | ||||
| mask_size = 1 | ||||
| 
 | ||||
| # Enhanced performance settings | ||||
| performance_mode = "balanced"  # "fast", "balanced", "quality" | ||||
| adaptive_quality = True | ||||
| target_live_fps = 30 | ||||
| quality_level = 1.0 | ||||
| face_detection_interval = 0.1 | ||||
| enable_frame_caching = True | ||||
| enable_gpu_acceleration = True | ||||
| # Removed all performance optimization variables | ||||
|  |  | |||
|  | @ -1,221 +0,0 @@ | |||
| """ | ||||
| Enhanced Live Face Swapper with optimized performance and quality | ||||
| """ | ||||
| import cv2 | ||||
| import numpy as np | ||||
| import threading | ||||
| import time | ||||
| from typing import Optional, Callable, Any | ||||
| from collections import deque | ||||
| import modules.globals | ||||
| from modules.face_analyser import get_one_face, get_many_faces | ||||
| from modules.processors.frame.face_swapper import swap_face_enhanced, get_face_swapper | ||||
| from modules.performance_optimizer import performance_optimizer | ||||
| from modules.video_capture import VideoCapturer | ||||
| 
 | ||||
| 
 | ||||
| class LiveFaceSwapper: | ||||
|     def __init__(self): | ||||
|         self.is_running = False | ||||
|         self.source_face = None | ||||
|         self.video_capturer = None | ||||
|         self.processing_thread = None | ||||
|         self.display_callback = None | ||||
|          | ||||
|         # Performance tracking | ||||
|         self.fps_counter = 0 | ||||
|         self.fps_start_time = time.time() | ||||
|         self.current_fps = 0 | ||||
|         self.processed_frames = 0 | ||||
|          | ||||
|         # Frame processing | ||||
|         self.input_queue = deque(maxlen=2)  # Small queue to reduce latency | ||||
|         self.output_queue = deque(maxlen=2) | ||||
|         self.queue_lock = threading.Lock() | ||||
|          | ||||
|         # Quality settings | ||||
|         self.quality_mode = "balanced"  # "fast", "balanced", "quality" | ||||
|         self.adaptive_quality = True | ||||
|          | ||||
|     def set_source_face(self, source_image_path: str) -> bool: | ||||
|         """Set the source face for swapping""" | ||||
|         try: | ||||
|             source_image = cv2.imread(source_image_path) | ||||
|             if source_image is None: | ||||
|                 return False | ||||
|                  | ||||
|             face = get_one_face(source_image) | ||||
|             if face is None: | ||||
|                 return False | ||||
|                  | ||||
|             self.source_face = face | ||||
|             return True | ||||
|         except Exception as e: | ||||
|             print(f"Error setting source face: {e}") | ||||
|             return False | ||||
|      | ||||
|     def start_live_swap(self, camera_index: int, display_callback: Callable[[np.ndarray, float], None]) -> bool: | ||||
|         """Start live face swapping""" | ||||
|         try: | ||||
|             if self.source_face is None: | ||||
|                 print("No source face set") | ||||
|                 return False | ||||
|                  | ||||
|             self.display_callback = display_callback | ||||
|             self.video_capturer = VideoCapturer(camera_index) | ||||
|              | ||||
|             # Start video capture with optimized settings | ||||
|             if not self.video_capturer.start(width=960, height=540, fps=30): | ||||
|                 return False | ||||
|              | ||||
|             self.is_running = True | ||||
|             self.processing_thread = threading.Thread(target=self._processing_loop, daemon=True) | ||||
|             self.processing_thread.start() | ||||
|              | ||||
|             # Start capture loop | ||||
|             self._capture_loop() | ||||
|             return True | ||||
|              | ||||
|         except Exception as e: | ||||
|             print(f"Error starting live swap: {e}") | ||||
|             return False | ||||
|      | ||||
|     def stop_live_swap(self): | ||||
|         """Stop live face swapping""" | ||||
|         self.is_running = False | ||||
|         if self.video_capturer: | ||||
|             self.video_capturer.release() | ||||
|         if self.processing_thread: | ||||
|             self.processing_thread.join(timeout=1.0) | ||||
|      | ||||
|     def _capture_loop(self): | ||||
|         """Main capture loop""" | ||||
|         while self.is_running: | ||||
|             try: | ||||
|                 ret, frame = self.video_capturer.read() | ||||
|                 if ret and frame is not None: | ||||
|                     # Add frame to processing queue | ||||
|                     with self.queue_lock: | ||||
|                         if len(self.input_queue) < self.input_queue.maxlen: | ||||
|                             self.input_queue.append(frame.copy()) | ||||
|                  | ||||
|                 # Small delay to prevent excessive CPU usage | ||||
|                 time.sleep(0.001) | ||||
|                  | ||||
|             except Exception as e: | ||||
|                 print(f"Error in capture loop: {e}") | ||||
|                 break | ||||
|      | ||||
|     def _processing_loop(self): | ||||
|         """Background processing loop for face swapping""" | ||||
|         while self.is_running: | ||||
|             try: | ||||
|                 frame_to_process = None | ||||
|                  | ||||
|                 # Get frame from input queue | ||||
|                 with self.queue_lock: | ||||
|                     if self.input_queue: | ||||
|                         frame_to_process = self.input_queue.popleft() | ||||
|                  | ||||
|                 if frame_to_process is not None: | ||||
|                     # Process the frame | ||||
|                     processed_frame = self._process_frame(frame_to_process) | ||||
|                      | ||||
|                     # Add to output queue | ||||
|                     with self.queue_lock: | ||||
|                         if len(self.output_queue) < self.output_queue.maxlen: | ||||
|                             self.output_queue.append(processed_frame) | ||||
|                      | ||||
|                     # Update FPS and call display callback | ||||
|                     self._update_fps() | ||||
|                     if self.display_callback: | ||||
|                         self.display_callback(processed_frame, self.current_fps) | ||||
|                  | ||||
|                 else: | ||||
|                     # No frame to process, small delay | ||||
|                     time.sleep(0.005) | ||||
|                      | ||||
|             except Exception as e: | ||||
|                 print(f"Error in processing loop: {e}") | ||||
|                 time.sleep(0.01) | ||||
|      | ||||
|     def _process_frame(self, frame: np.ndarray) -> np.ndarray: | ||||
|         """Process a single frame with face swapping""" | ||||
|         try: | ||||
|             start_time = time.time() | ||||
|              | ||||
|             # Apply performance optimizations | ||||
|             original_size = frame.shape[:2][::-1] | ||||
|             processed_frame = performance_optimizer.preprocess_frame(frame) | ||||
|              | ||||
|             # Detect faces based on performance settings | ||||
|             if modules.globals.many_faces: | ||||
|                 if performance_optimizer.should_detect_faces(): | ||||
|                     target_faces = get_many_faces(processed_frame) | ||||
|                     performance_optimizer.face_cache['many_faces'] = target_faces | ||||
|                 else: | ||||
|                     target_faces = performance_optimizer.face_cache.get('many_faces', []) | ||||
|                  | ||||
|                 if target_faces: | ||||
|                     for target_face in target_faces: | ||||
|                         if self.source_face and target_face: | ||||
|                             processed_frame = swap_face_enhanced(self.source_face, target_face, processed_frame) | ||||
|             else: | ||||
|                 if performance_optimizer.should_detect_faces(): | ||||
|                     target_face = get_one_face(processed_frame) | ||||
|                     performance_optimizer.face_cache['single_face'] = target_face | ||||
|                 else: | ||||
|                     target_face = performance_optimizer.face_cache.get('single_face') | ||||
|                  | ||||
|                 if target_face and self.source_face: | ||||
|                     processed_frame = swap_face_enhanced(self.source_face, target_face, processed_frame) | ||||
|              | ||||
|             # Post-process back to original size | ||||
|             final_frame = performance_optimizer.postprocess_frame(processed_frame, original_size) | ||||
|              | ||||
|             # Update performance metrics | ||||
|             processing_time = time.time() - start_time | ||||
|             performance_optimizer.update_fps_stats(processing_time) | ||||
|              | ||||
|             return final_frame | ||||
|              | ||||
|         except Exception as e: | ||||
|             print(f"Error processing frame: {e}") | ||||
|             return frame | ||||
|      | ||||
|     def _update_fps(self): | ||||
|         """Update FPS counter""" | ||||
|         self.fps_counter += 1 | ||||
|         current_time = time.time() | ||||
|          | ||||
|         if current_time - self.fps_start_time >= 1.0: | ||||
|             self.current_fps = self.fps_counter / (current_time - self.fps_start_time) | ||||
|             self.fps_counter = 0 | ||||
|             self.fps_start_time = current_time | ||||
|      | ||||
|     def set_quality_mode(self, mode: str): | ||||
|         """Set quality mode: 'fast', 'balanced', or 'quality'""" | ||||
|         self.quality_mode = mode | ||||
|          | ||||
|         if mode == "fast": | ||||
|             performance_optimizer.quality_level = 0.7 | ||||
|             performance_optimizer.detection_interval = 0.15 | ||||
|         elif mode == "balanced": | ||||
|             performance_optimizer.quality_level = 0.85 | ||||
|             performance_optimizer.detection_interval = 0.1 | ||||
|         elif mode == "quality": | ||||
|             performance_optimizer.quality_level = 1.0 | ||||
|             performance_optimizer.detection_interval = 0.05 | ||||
|      | ||||
|     def get_performance_stats(self) -> dict: | ||||
|         """Get current performance statistics""" | ||||
|         return { | ||||
|             'fps': self.current_fps, | ||||
|             'quality_level': performance_optimizer.quality_level, | ||||
|             'detection_interval': performance_optimizer.detection_interval, | ||||
|             'processed_frames': self.processed_frames | ||||
|         } | ||||
| 
 | ||||
| 
 | ||||
| # Global instance | ||||
| live_face_swapper = LiveFaceSwapper() | ||||
|  | @ -1,151 +0,0 @@ | |||
| """ | ||||
| Performance Manager for Deep-Live-Cam | ||||
| Handles performance mode switching and optimization settings | ||||
| """ | ||||
| import json | ||||
| import os | ||||
| from typing import Dict, Any | ||||
| import modules.globals | ||||
| from modules.performance_optimizer import performance_optimizer | ||||
| 
 | ||||
| 
 | ||||
| class PerformanceManager: | ||||
|     def __init__(self): | ||||
|         self.config_path = "performance_config.json" | ||||
|         self.config = self.load_config() | ||||
|         self.current_mode = "balanced" | ||||
|      | ||||
|     def load_config(self) -> Dict[str, Any]: | ||||
|         """Load performance configuration from file""" | ||||
|         try: | ||||
|             if os.path.exists(self.config_path): | ||||
|                 with open(self.config_path, 'r') as f: | ||||
|                     return json.load(f) | ||||
|             else: | ||||
|                 return self.get_default_config() | ||||
|         except Exception as e: | ||||
|             print(f"Error loading performance config: {e}") | ||||
|             return self.get_default_config() | ||||
|      | ||||
|     def get_default_config(self) -> Dict[str, Any]: | ||||
|         """Get default performance configuration""" | ||||
|         return { | ||||
|             "performance_modes": { | ||||
|                 "fast": { | ||||
|                     "quality_level": 0.6, | ||||
|                     "face_detection_interval": 0.2, | ||||
|                     "target_fps": 30, | ||||
|                     "frame_skip": 2, | ||||
|                     "enable_caching": True, | ||||
|                     "processing_resolution_scale": 0.7 | ||||
|                 }, | ||||
|                 "balanced": { | ||||
|                     "quality_level": 0.85, | ||||
|                     "face_detection_interval": 0.1, | ||||
|                     "target_fps": 25, | ||||
|                     "frame_skip": 1, | ||||
|                     "enable_caching": True, | ||||
|                     "processing_resolution_scale": 0.85 | ||||
|                 }, | ||||
|                 "quality": { | ||||
|                     "quality_level": 1.0, | ||||
|                     "face_detection_interval": 0.05, | ||||
|                     "target_fps": 20, | ||||
|                     "frame_skip": 1, | ||||
|                     "enable_caching": False, | ||||
|                     "processing_resolution_scale": 1.0 | ||||
|                 } | ||||
|             } | ||||
|         } | ||||
|      | ||||
|     def set_performance_mode(self, mode: str) -> bool: | ||||
|         """Set performance mode (fast, balanced, quality)""" | ||||
|         try: | ||||
|             if mode not in self.config["performance_modes"]: | ||||
|                 print(f"Invalid performance mode: {mode}") | ||||
|                 return False | ||||
|              | ||||
|             mode_config = self.config["performance_modes"][mode] | ||||
|             self.current_mode = mode | ||||
|              | ||||
|             # Apply settings to performance optimizer | ||||
|             performance_optimizer.quality_level = mode_config["quality_level"] | ||||
|             performance_optimizer.detection_interval = mode_config["face_detection_interval"] | ||||
|             performance_optimizer.target_fps = mode_config["target_fps"] | ||||
|              | ||||
|             # Apply to globals | ||||
|             modules.globals.performance_mode = mode | ||||
|             modules.globals.quality_level = mode_config["quality_level"] | ||||
|             modules.globals.face_detection_interval = mode_config["face_detection_interval"] | ||||
|             modules.globals.target_live_fps = mode_config["target_fps"] | ||||
|              | ||||
|             print(f"Performance mode set to: {mode}") | ||||
|             return True | ||||
|              | ||||
|         except Exception as e: | ||||
|             print(f"Error setting performance mode: {e}") | ||||
|             return False | ||||
|      | ||||
|     def get_current_mode(self) -> str: | ||||
|         """Get current performance mode""" | ||||
|         return self.current_mode | ||||
|      | ||||
|     def get_mode_info(self, mode: str) -> Dict[str, Any]: | ||||
|         """Get information about a specific performance mode""" | ||||
|         return self.config["performance_modes"].get(mode, {}) | ||||
|      | ||||
|     def get_all_modes(self) -> Dict[str, Any]: | ||||
|         """Get all available performance modes""" | ||||
|         return self.config["performance_modes"] | ||||
|      | ||||
|     def optimize_for_hardware(self) -> str: | ||||
|         """Automatically select optimal performance mode based on hardware""" | ||||
|         try: | ||||
|             import psutil | ||||
|             import torch | ||||
|              | ||||
|             # Check available RAM | ||||
|             ram_gb = psutil.virtual_memory().total / (1024**3) | ||||
|              | ||||
|             # Check GPU availability | ||||
|             has_gpu = torch.cuda.is_available() | ||||
|              | ||||
|             # Check CPU cores | ||||
|             cpu_cores = psutil.cpu_count() | ||||
|              | ||||
|             # Determine optimal mode | ||||
|             if has_gpu and ram_gb >= 8 and cpu_cores >= 8: | ||||
|                 optimal_mode = "quality" | ||||
|             elif has_gpu and ram_gb >= 4: | ||||
|                 optimal_mode = "balanced" | ||||
|             else: | ||||
|                 optimal_mode = "fast" | ||||
|              | ||||
|             self.set_performance_mode(optimal_mode) | ||||
|             print(f"Auto-optimized for hardware: {optimal_mode} mode") | ||||
|             print(f"  RAM: {ram_gb:.1f}GB, GPU: {has_gpu}, CPU Cores: {cpu_cores}") | ||||
|              | ||||
|             return optimal_mode | ||||
|              | ||||
|         except Exception as e: | ||||
|             print(f"Error in hardware optimization: {e}") | ||||
|             self.set_performance_mode("balanced") | ||||
|             return "balanced" | ||||
|      | ||||
|     def get_performance_tips(self) -> list: | ||||
|         """Get performance optimization tips""" | ||||
|         tips = [ | ||||
|             "🚀 Use 'Fast' mode for maximum FPS during live streaming", | ||||
|             "⚖️ Use 'Balanced' mode for good quality with decent performance", | ||||
|             "🎨 Use 'Quality' mode for best results when processing videos", | ||||
|             "💾 Close other applications to free up system resources", | ||||
|             "🖥️ Use GPU acceleration when available (CUDA/DirectML)", | ||||
|             "📹 Lower camera resolution if experiencing lag", | ||||
|             "🔄 Enable frame caching for smoother playback", | ||||
|             "⚡ Ensure good lighting for better face detection" | ||||
|         ] | ||||
|         return tips | ||||
| 
 | ||||
| 
 | ||||
| # Global performance manager instance | ||||
| performance_manager = PerformanceManager() | ||||
|  | @ -1,76 +0,0 @@ | |||
| """ | ||||
| Performance optimization module for Deep-Live-Cam | ||||
| Provides frame caching, adaptive quality, and FPS optimization | ||||
| """ | ||||
| import cv2 | ||||
| import numpy as np | ||||
| import time | ||||
| from typing import Dict, Any, Optional, Tuple | ||||
| import threading | ||||
| from collections import deque | ||||
| import modules.globals | ||||
| 
 | ||||
| class PerformanceOptimizer: | ||||
|     def __init__(self): | ||||
|         self.frame_cache = {} | ||||
|         self.face_cache = {} | ||||
|         self.last_detection_time = 0 | ||||
|         self.detection_interval = 0.1  # Detect faces every 100ms | ||||
|         self.adaptive_quality = True | ||||
|         self.target_fps = 30 | ||||
|         self.frame_times = deque(maxlen=10) | ||||
|         self.current_fps = 0 | ||||
|         self.quality_level = 1.0 | ||||
|         self.min_quality = 0.5 | ||||
|         self.max_quality = 1.0 | ||||
|          | ||||
|     def should_detect_faces(self) -> bool: | ||||
|         """Determine if we should run face detection based on timing""" | ||||
|         current_time = time.time() | ||||
|         if current_time - self.last_detection_time > self.detection_interval: | ||||
|             self.last_detection_time = current_time | ||||
|             return True | ||||
|         return False | ||||
|      | ||||
|     def update_fps_stats(self, frame_time: float): | ||||
|         """Update FPS statistics and adjust quality accordingly""" | ||||
|         self.frame_times.append(frame_time) | ||||
|         if len(self.frame_times) >= 5: | ||||
|             avg_frame_time = sum(self.frame_times) / len(self.frame_times) | ||||
|             self.current_fps = 1.0 / avg_frame_time if avg_frame_time > 0 else 0 | ||||
|              | ||||
|             if self.adaptive_quality: | ||||
|                 self._adjust_quality() | ||||
|      | ||||
|     def _adjust_quality(self): | ||||
|         """Dynamically adjust processing quality based on FPS""" | ||||
|         if self.current_fps < self.target_fps * 0.8:  # Below 80% of target | ||||
|             self.quality_level = max(self.min_quality, self.quality_level - 0.1) | ||||
|             self.detection_interval = min(0.2, self.detection_interval + 0.02) | ||||
|         elif self.current_fps > self.target_fps * 0.95:  # Above 95% of target | ||||
|             self.quality_level = min(self.max_quality, self.quality_level + 0.05) | ||||
|             self.detection_interval = max(0.05, self.detection_interval - 0.01) | ||||
|      | ||||
|     def get_optimal_resolution(self, original_size: Tuple[int, int]) -> Tuple[int, int]: | ||||
|         """Get optimal processing resolution based on current quality level""" | ||||
|         width, height = original_size | ||||
|         scale = self.quality_level | ||||
|         return (int(width * scale), int(height * scale)) | ||||
|      | ||||
|     def preprocess_frame(self, frame: np.ndarray) -> np.ndarray: | ||||
|         """Preprocess frame for optimal performance""" | ||||
|         if self.quality_level < 1.0: | ||||
|             height, width = frame.shape[:2] | ||||
|             new_height = int(height * self.quality_level) | ||||
|             new_width = int(width * self.quality_level) | ||||
|             frame = cv2.resize(frame, (new_width, new_height), interpolation=cv2.INTER_LINEAR) | ||||
|         return frame | ||||
|      | ||||
|     def postprocess_frame(self, frame: np.ndarray, target_size: Tuple[int, int]) -> np.ndarray: | ||||
|         """Postprocess frame to target resolution""" | ||||
|         if frame.shape[:2][::-1] != target_size: | ||||
|             frame = cv2.resize(frame, target_size, interpolation=cv2.INTER_CUBIC) | ||||
|         return frame | ||||
| 
 | ||||
| # Global optimizer instance | ||||
| performance_optimizer = PerformanceOptimizer() | ||||
|  | @ -5,7 +5,6 @@ import threading | |||
| import numpy as np | ||||
| import modules.globals | ||||
| import logging | ||||
| import time | ||||
| import modules.processors.frame.core | ||||
| from modules.core import update_status | ||||
| from modules.face_analyser import get_one_face, get_many_faces, default_source_face | ||||
|  | @ -71,7 +70,7 @@ def get_face_swapper() -> Any: | |||
| def swap_face(source_face: Face, target_face: Face, temp_frame: Frame) -> Frame: | ||||
|     face_swapper = get_face_swapper() | ||||
| 
 | ||||
|     # Apply the face swap with optimized settings for better performance | ||||
|     # Simple face swap - maximum FPS | ||||
|     swapped_frame = face_swapper.get( | ||||
|         temp_frame, target_face, source_face, paste_back=True | ||||
|     ) | ||||
|  | @ -99,18 +98,29 @@ def swap_face(source_face: Face, target_face: Face, temp_frame: Frame) -> Frame: | |||
|     return swapped_frame | ||||
| 
 | ||||
| 
 | ||||
| def swap_face_enhanced(source_face: Face, target_face: Face, temp_frame: Frame) -> Frame: | ||||
|     """Enhanced face swapping with better quality and performance optimizations""" | ||||
| # Simple face position smoothing for stability | ||||
| _last_face_position = None | ||||
| _position_smoothing = 0.7  # Higher = more stable, lower = more responsive | ||||
| 
 | ||||
| def swap_face_stable(source_face: Face, target_face: Face, temp_frame: Frame) -> Frame: | ||||
|     """Ultra-fast face swap - maximum FPS priority""" | ||||
|     # Skip all complex processing for maximum FPS | ||||
|     face_swapper = get_face_swapper() | ||||
|     swapped_frame = face_swapper.get(temp_frame, target_face, source_face, paste_back=True) | ||||
|      | ||||
|     # Apply the face swap | ||||
|     swapped_frame = face_swapper.get( | ||||
|         temp_frame, target_face, source_face, paste_back=True | ||||
|     ) | ||||
|     # Skip all post-processing to maximize FPS | ||||
|     return swapped_frame | ||||
| 
 | ||||
| 
 | ||||
| def swap_face_ultra_fast(source_face: Face, target_face: Face, temp_frame: Frame) -> Frame: | ||||
|     """Fast face swap with mouth mask support and forehead protection""" | ||||
|     face_swapper = get_face_swapper() | ||||
|     swapped_frame = face_swapper.get(temp_frame, target_face, source_face, paste_back=True) | ||||
|      | ||||
|     # Enhanced post-processing for better quality | ||||
|     swapped_frame = enhance_face_swap_quality(swapped_frame, source_face, target_face, temp_frame) | ||||
|     # Fix forehead hair issue - blend forehead area back to original | ||||
|     swapped_frame = fix_forehead_hair_issue(swapped_frame, target_face, temp_frame) | ||||
|      | ||||
|     # Add mouth mask functionality back (only if enabled) | ||||
|     if modules.globals.mouth_mask: | ||||
|         # Create a mask for the target face | ||||
|         face_mask = create_face_mask(target_face, temp_frame) | ||||
|  | @ -130,12 +140,12 @@ def swap_face_enhanced(source_face: Face, target_face: Face, temp_frame: Frame) | |||
|             swapped_frame = draw_mouth_mask_visualization( | ||||
|                 swapped_frame, target_face, mouth_mask_data | ||||
|             ) | ||||
| 
 | ||||
|      | ||||
|     return swapped_frame | ||||
| 
 | ||||
| 
 | ||||
| def enhance_face_swap_quality(swapped_frame: Frame, source_face: Face, target_face: Face, original_frame: Frame) -> Frame: | ||||
|     """Apply quality enhancements to the swapped face""" | ||||
| def fix_forehead_hair_issue(swapped_frame: Frame, target_face: Face, original_frame: Frame) -> Frame: | ||||
|     """Fix hair falling on forehead by blending forehead area back to original""" | ||||
|     try: | ||||
|         # Get face bounding box | ||||
|         bbox = target_face.bbox.astype(int) | ||||
|  | @ -148,124 +158,149 @@ def enhance_face_swap_quality(swapped_frame: Frame, source_face: Face, target_fa | |||
|          | ||||
|         if x2 <= x1 or y2 <= y1: | ||||
|             return swapped_frame | ||||
|          | ||||
|         # Focus on forehead area (upper 35% of face) | ||||
|         forehead_height = int((y2 - y1) * 0.35) | ||||
|         forehead_y2 = y1 + forehead_height | ||||
|          | ||||
|         if forehead_y2 > y1: | ||||
|             # Extract forehead regions | ||||
|             swapped_forehead = swapped_frame[y1:forehead_y2, x1:x2] | ||||
|             original_forehead = original_frame[y1:forehead_y2, x1:x2] | ||||
|              | ||||
|         # Extract face regions | ||||
|         swapped_face = swapped_frame[y1:y2, x1:x2] | ||||
|         original_face = original_frame[y1:y2, x1:x2] | ||||
|          | ||||
|         # Apply color matching | ||||
|         color_matched = apply_advanced_color_matching(swapped_face, original_face) | ||||
|          | ||||
|         # Apply edge smoothing | ||||
|         smoothed = apply_edge_smoothing(color_matched, original_face) | ||||
|          | ||||
|         # Blend back into frame | ||||
|         swapped_frame[y1:y2, x1:x2] = smoothed | ||||
|             # Create a soft blend mask for forehead area | ||||
|             mask = np.ones(swapped_forehead.shape[:2], dtype=np.float32) | ||||
|              | ||||
|             # Apply strong Gaussian blur for very soft blending | ||||
|             mask = cv2.GaussianBlur(mask, (31, 31), 10) | ||||
|             mask = mask[:, :, np.newaxis] | ||||
|              | ||||
|             # Blend forehead areas (keep much more of original to preserve hair) | ||||
|             blended_forehead = (swapped_forehead * 0.3 + original_forehead * 0.7).astype(np.uint8) | ||||
|              | ||||
|             # Apply the blended forehead back | ||||
|             swapped_frame[y1:forehead_y2, x1:x2] = blended_forehead | ||||
|          | ||||
|         return swapped_frame | ||||
|          | ||||
|     except Exception: | ||||
|         return swapped_frame | ||||
| 
 | ||||
| 
 | ||||
| def improve_forehead_matching(swapped_frame: Frame, source_face: Face, target_face: Face, original_frame: Frame) -> Frame: | ||||
|     """Create precise face mask - only swap core facial features (eyes, nose, cheeks, chin)""" | ||||
|     try: | ||||
|         # Get face landmarks for precise masking | ||||
|         if hasattr(target_face, 'landmark_2d_106') and target_face.landmark_2d_106 is not None: | ||||
|             landmarks = target_face.landmark_2d_106.astype(np.int32) | ||||
|              | ||||
|             # Create precise face mask excluding forehead and hair | ||||
|             mask = create_precise_face_mask(landmarks, swapped_frame.shape[:2]) | ||||
|              | ||||
|             if mask is not None: | ||||
|                 # Apply the precise mask | ||||
|                 mask_3d = mask[:, :, np.newaxis] / 255.0 | ||||
|                  | ||||
|                 # Blend only the core facial features | ||||
|                 result = (swapped_frame * mask_3d + original_frame * (1 - mask_3d)).astype(np.uint8) | ||||
|                 return result | ||||
|          | ||||
|         # Fallback: use bounding box method but exclude forehead | ||||
|         bbox = target_face.bbox.astype(int) | ||||
|         x1, y1, x2, y2 = bbox | ||||
|          | ||||
|         # Ensure coordinates are within frame bounds | ||||
|         h, w = swapped_frame.shape[:2] | ||||
|         x1, y1 = max(0, x1), max(0, y1) | ||||
|         x2, y2 = min(w, x2), min(h, y2) | ||||
|          | ||||
|         if x2 <= x1 or y2 <= y1: | ||||
|             return swapped_frame | ||||
|          | ||||
|         # Exclude forehead area (upper 25% of face) to avoid hair swapping | ||||
|         forehead_height = int((y2 - y1) * 0.25) | ||||
|         face_start_y = y1 + forehead_height | ||||
|          | ||||
|         if face_start_y < y2: | ||||
|             # Only blend the lower face area (eyes, nose, cheeks, chin) | ||||
|             swapped_face_area = swapped_frame[face_start_y:y2, x1:x2] | ||||
|             original_face_area = original_frame[face_start_y:y2, x1:x2] | ||||
|              | ||||
|             # Create soft mask for the face area only | ||||
|             mask = np.ones(swapped_face_area.shape[:2], dtype=np.float32) | ||||
|             mask = cv2.GaussianBlur(mask, (15, 15), 5) | ||||
|             mask = mask[:, :, np.newaxis] | ||||
|              | ||||
|             # Apply the face area back (keep original forehead/hair) | ||||
|             swapped_frame[face_start_y:y2, x1:x2] = swapped_face_area | ||||
|          | ||||
|         return swapped_frame | ||||
|          | ||||
|     except Exception: | ||||
|         return swapped_frame | ||||
| 
 | ||||
| 
 | ||||
| def create_precise_face_mask(landmarks: np.ndarray, frame_shape: tuple) -> np.ndarray: | ||||
|     """Create precise mask for core facial features only (exclude forehead and hair)""" | ||||
|     try: | ||||
|         mask = np.zeros(frame_shape, dtype=np.uint8) | ||||
|          | ||||
|         # For 106-point landmarks, use correct indices | ||||
|         # Face contour (jawline) - points 0-32 | ||||
|         jaw_line = landmarks[0:33] | ||||
|          | ||||
|         # Eyes area - approximate indices for 106-point model | ||||
|         left_eye_area = landmarks[33:42]   # Left eye region | ||||
|         right_eye_area = landmarks[87:96]  # Right eye region | ||||
|          | ||||
|         # Eyebrows (start from eyebrow level, not forehead) | ||||
|         left_eyebrow = landmarks[43:51]    # Left eyebrow | ||||
|         right_eyebrow = landmarks[97:105]  # Right eyebrow | ||||
|          | ||||
|         # Create face contour that excludes forehead | ||||
|         # Start from eyebrow level and go around the face | ||||
|         face_contour_points = [] | ||||
|          | ||||
|         # Add eyebrow points (this will be our "top" instead of forehead) | ||||
|         face_contour_points.extend(left_eyebrow) | ||||
|         face_contour_points.extend(right_eyebrow) | ||||
|          | ||||
|         # Add jawline points (bottom and sides of face) | ||||
|         face_contour_points.extend(jaw_line) | ||||
|          | ||||
|         # Convert to numpy array | ||||
|         face_contour_points = np.array(face_contour_points) | ||||
|          | ||||
|         # Create convex hull for the core face area (excluding forehead) | ||||
|         hull = cv2.convexHull(face_contour_points) | ||||
|         cv2.fillConvexPoly(mask, hull, 255) | ||||
|          | ||||
|         # Apply Gaussian blur for soft edges | ||||
|         mask = cv2.GaussianBlur(mask, (21, 21), 7) | ||||
|          | ||||
|         return mask | ||||
|          | ||||
|     except Exception as e: | ||||
|         # Return original swapped frame if enhancement fails | ||||
|         return swapped_frame | ||||
| 
 | ||||
| 
 | ||||
| def apply_advanced_color_matching(swapped_face: np.ndarray, target_face: np.ndarray) -> np.ndarray: | ||||
|     """Apply advanced color matching between swapped and target faces""" | ||||
|     try: | ||||
|         # Convert to LAB color space for better color matching | ||||
|         swapped_lab = cv2.cvtColor(swapped_face, cv2.COLOR_BGR2LAB).astype(np.float32) | ||||
|         target_lab = cv2.cvtColor(target_face, cv2.COLOR_BGR2LAB).astype(np.float32) | ||||
|          | ||||
|         # Calculate statistics for each channel | ||||
|         swapped_mean = np.mean(swapped_lab, axis=(0, 1)) | ||||
|         swapped_std = np.std(swapped_lab, axis=(0, 1)) | ||||
|         target_mean = np.mean(target_lab, axis=(0, 1)) | ||||
|         target_std = np.std(target_lab, axis=(0, 1)) | ||||
|          | ||||
|         # Apply color transfer | ||||
|         for i in range(3): | ||||
|             if swapped_std[i] > 0: | ||||
|                 swapped_lab[:, :, i] = (swapped_lab[:, :, i] - swapped_mean[i]) * (target_std[i] / swapped_std[i]) + target_mean[i] | ||||
|          | ||||
|         # Convert back to BGR | ||||
|         result = cv2.cvtColor(np.clip(swapped_lab, 0, 255).astype(np.uint8), cv2.COLOR_LAB2BGR) | ||||
|         return result | ||||
|          | ||||
|     except Exception: | ||||
|         return swapped_face | ||||
| 
 | ||||
| 
 | ||||
| def apply_edge_smoothing(face: np.ndarray, reference: np.ndarray) -> np.ndarray: | ||||
|     """Apply edge smoothing to reduce artifacts""" | ||||
|     try: | ||||
|         # Create a soft mask for blending edges | ||||
|         mask = np.ones(face.shape[:2], dtype=np.float32) | ||||
|          | ||||
|         # Apply Gaussian blur to create soft edges | ||||
|         kernel_size = max(5, min(face.shape[0], face.shape[1]) // 20) | ||||
|         if kernel_size % 2 == 0: | ||||
|             kernel_size += 1 | ||||
|              | ||||
|         mask = cv2.GaussianBlur(mask, (kernel_size, kernel_size), 0) | ||||
|         mask = mask[:, :, np.newaxis] | ||||
|          | ||||
|         # Blend with reference for smoother edges | ||||
|         blended = face * mask + reference * (1 - mask) | ||||
|         return blended.astype(np.uint8) | ||||
|          | ||||
|     except Exception: | ||||
|         return face | ||||
|         print(f"Error creating precise face mask: {e}") | ||||
|         return None | ||||
| 
 | ||||
| 
 | ||||
| def process_frame(source_face: Face, temp_frame: Frame) -> Frame: | ||||
|     from modules.performance_optimizer import performance_optimizer | ||||
|      | ||||
|     start_time = time.time() | ||||
|     original_size = temp_frame.shape[:2][::-1]  # (width, height) | ||||
|      | ||||
|     # Apply color correction if enabled | ||||
|     if modules.globals.color_correction: | ||||
|         temp_frame = cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB) | ||||
|      | ||||
|     # Preprocess frame for performance | ||||
|     processed_frame = performance_optimizer.preprocess_frame(temp_frame) | ||||
|      | ||||
|     # Skip color correction for maximum FPS | ||||
|     # if modules.globals.color_correction: | ||||
|     #     temp_frame = cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB) | ||||
| 
 | ||||
|     if modules.globals.many_faces: | ||||
|         # Only detect faces if enough time has passed or cache is empty | ||||
|         if performance_optimizer.should_detect_faces(): | ||||
|             many_faces = get_many_faces(processed_frame) | ||||
|             performance_optimizer.face_cache['many_faces'] = many_faces | ||||
|         else: | ||||
|             many_faces = performance_optimizer.face_cache.get('many_faces', []) | ||||
|              | ||||
|         many_faces = get_many_faces(temp_frame) | ||||
|         if many_faces: | ||||
|             for target_face in many_faces: | ||||
|                 if source_face and target_face: | ||||
|                     processed_frame = swap_face_enhanced(source_face, target_face, processed_frame) | ||||
|                 else: | ||||
|                     print("Face detection failed for target/source.") | ||||
|                     temp_frame = swap_face_ultra_fast(source_face, target_face, temp_frame) | ||||
|     else: | ||||
|         # Use cached face detection for better performance | ||||
|         if performance_optimizer.should_detect_faces(): | ||||
|             target_face = get_one_face(processed_frame) | ||||
|             performance_optimizer.face_cache['single_face'] = target_face | ||||
|         else: | ||||
|             target_face = performance_optimizer.face_cache.get('single_face') | ||||
|              | ||||
|         target_face = get_one_face(temp_frame) | ||||
|         if target_face and source_face: | ||||
|             processed_frame = swap_face_enhanced(source_face, target_face, processed_frame) | ||||
|         else: | ||||
|             logging.error("Face detection failed for target or source.") | ||||
|      | ||||
|     # Postprocess frame back to original size | ||||
|     final_frame = performance_optimizer.postprocess_frame(processed_frame, original_size) | ||||
|      | ||||
|     # Update performance stats | ||||
|     frame_time = time.time() - start_time | ||||
|     performance_optimizer.update_fps_stats(frame_time) | ||||
|      | ||||
|     return final_frame | ||||
| 
 | ||||
|             temp_frame = swap_face_ultra_fast(source_face, target_face, temp_frame) | ||||
|     return temp_frame | ||||
| 
 | ||||
| 
 | ||||
| def process_frame_v2(temp_frame: Frame, temp_frame_path: str = "") -> Frame: | ||||
|  | @ -419,7 +454,6 @@ def create_lower_mouth_mask( | |||
|     mouth_cutout = None | ||||
|     landmarks = face.landmark_2d_106 | ||||
|     if landmarks is not None: | ||||
|         #                  0  1  2  3  4  5  6  7  8  9  10 11 12 13 14 15 16 17 18 19 20 | ||||
|         lower_lip_order = [ | ||||
|             65, | ||||
|             66, | ||||
|  | @ -443,192 +477,74 @@ def create_lower_mouth_mask( | |||
|             2, | ||||
|             65, | ||||
|         ] | ||||
|         lower_lip_landmarks = landmarks[lower_lip_order].astype( | ||||
|             np.float32 | ||||
|         )  # Use float for precise calculations | ||||
|         lower_lip_landmarks = landmarks[lower_lip_order].astype(np.float32) | ||||
| 
 | ||||
|         # Calculate the center of the landmarks | ||||
|         center = np.mean(lower_lip_landmarks, axis=0) | ||||
| 
 | ||||
|         # Expand the landmarks outward | ||||
|         expansion_factor = ( | ||||
|             1 + modules.globals.mask_down_size | ||||
|         )  # Adjust this for more or less expansion | ||||
|         expansion_factor = 1 + modules.globals.mask_down_size | ||||
|         expanded_landmarks = (lower_lip_landmarks - center) * expansion_factor + center | ||||
| 
 | ||||
|         # Extend the top lip part | ||||
|         toplip_indices = [ | ||||
|             20, | ||||
|             0, | ||||
|             1, | ||||
|             2, | ||||
|             3, | ||||
|             4, | ||||
|             5, | ||||
|         ]  # Indices for landmarks 2, 65, 66, 62, 70, 69, 18 | ||||
|         toplip_extension = ( | ||||
|             modules.globals.mask_size * 0.5 | ||||
|         )  # Adjust this factor to control the extension | ||||
|         toplip_indices = [20, 0, 1, 2, 3, 4, 5] | ||||
|         toplip_extension = modules.globals.mask_size * 0.5 | ||||
|         for idx in toplip_indices: | ||||
|             direction = expanded_landmarks[idx] - center | ||||
|             direction = direction / np.linalg.norm(direction) | ||||
|             expanded_landmarks[idx] += direction * toplip_extension | ||||
| 
 | ||||
|         # Extend the bottom part (chin area) | ||||
|         chin_indices = [ | ||||
|             11, | ||||
|             12, | ||||
|             13, | ||||
|             14, | ||||
|             15, | ||||
|             16, | ||||
|         ]  # Indices for landmarks 21, 22, 23, 24, 0, 8 | ||||
|         chin_extension = 2 * 0.2  # Adjust this factor to control the extension | ||||
|         chin_indices = [11, 12, 13, 14, 15, 16] | ||||
|         chin_extension = 2 * 0.2 | ||||
|         for idx in chin_indices: | ||||
|             expanded_landmarks[idx][1] += ( | ||||
|                 expanded_landmarks[idx][1] - center[1] | ||||
|             ) * chin_extension | ||||
| 
 | ||||
|         # Convert back to integer coordinates | ||||
|         expanded_landmarks = expanded_landmarks.astype(np.int32) | ||||
| 
 | ||||
|         # Calculate bounding box for the expanded lower mouth | ||||
|         min_x, min_y = np.min(expanded_landmarks, axis=0) | ||||
|         max_x, max_y = np.max(expanded_landmarks, axis=0) | ||||
| 
 | ||||
|         # Add some padding to the bounding box | ||||
|         padding = int((max_x - min_x) * 0.1)  # 10% padding | ||||
|         padding = int((max_x - min_x) * 0.1) | ||||
|         min_x = max(0, min_x - padding) | ||||
|         min_y = max(0, min_y - padding) | ||||
|         max_x = min(frame.shape[1], max_x + padding) | ||||
|         max_y = min(frame.shape[0], max_y + padding) | ||||
| 
 | ||||
|         # Ensure the bounding box dimensions are valid | ||||
|         if max_x <= min_x or max_y <= min_y: | ||||
|             if (max_x - min_x) <= 1: | ||||
|                 max_x = min_x + 1 | ||||
|             if (max_y - min_y) <= 1: | ||||
|                 max_y = min_y + 1 | ||||
| 
 | ||||
|         # Create the mask | ||||
|         mask_roi = np.zeros((max_y - min_y, max_x - min_x), dtype=np.uint8) | ||||
|         cv2.fillPoly(mask_roi, [expanded_landmarks - [min_x, min_y]], 255) | ||||
| 
 | ||||
|         # Apply Gaussian blur to soften the mask edges | ||||
|         mask_roi = cv2.GaussianBlur(mask_roi, (15, 15), 5) | ||||
| 
 | ||||
|         # Place the mask ROI in the full-sized mask | ||||
|         # Improved smoothing for mouth mask | ||||
|         mask_roi = cv2.GaussianBlur(mask_roi, (25, 25), 8) | ||||
|         mask[min_y:max_y, min_x:max_x] = mask_roi | ||||
| 
 | ||||
|         # Extract the masked area from the frame | ||||
|         mouth_cutout = frame[min_y:max_y, min_x:max_x].copy() | ||||
| 
 | ||||
|         # Return the expanded lower lip polygon in original frame coordinates | ||||
|         lower_lip_polygon = expanded_landmarks | ||||
| 
 | ||||
|     return mask, mouth_cutout, (min_x, min_y, max_x, max_y), lower_lip_polygon | ||||
| 
 | ||||
| 
 | ||||
| def draw_mouth_mask_visualization( | ||||
|     frame: Frame, face: Face, mouth_mask_data: tuple | ||||
| ) -> Frame: | ||||
| def draw_mouth_mask_visualization(frame: Frame, face: Face, mouth_mask_data: tuple) -> Frame: | ||||
|     landmarks = face.landmark_2d_106 | ||||
|     if landmarks is not None and mouth_mask_data is not None: | ||||
|         mask, mouth_cutout, (min_x, min_y, max_x, max_y), lower_lip_polygon = ( | ||||
|             mouth_mask_data | ||||
|         ) | ||||
| 
 | ||||
|         mask, mouth_cutout, (min_x, min_y, max_x, max_y), lower_lip_polygon = mouth_mask_data | ||||
|         vis_frame = frame.copy() | ||||
| 
 | ||||
|         # Ensure coordinates are within frame bounds | ||||
|         height, width = vis_frame.shape[:2] | ||||
|         min_x, min_y = max(0, min_x), max(0, min_y) | ||||
|         max_x, max_y = min(width, max_x), min(height, max_y) | ||||
| 
 | ||||
|         # Adjust mask to match the region size | ||||
|         mask_region = mask[0 : max_y - min_y, 0 : max_x - min_x] | ||||
| 
 | ||||
|         # Remove the color mask overlay | ||||
|         # color_mask = cv2.applyColorMap((mask_region * 255).astype(np.uint8), cv2.COLORMAP_JET) | ||||
| 
 | ||||
|         # Ensure shapes match before blending | ||||
|         vis_region = vis_frame[min_y:max_y, min_x:max_x] | ||||
|         # Remove blending with color_mask | ||||
|         # if vis_region.shape[:2] == color_mask.shape[:2]: | ||||
|         #     blended = cv2.addWeighted(vis_region, 0.7, color_mask, 0.3, 0) | ||||
|         #     vis_frame[min_y:max_y, min_x:max_x] = blended | ||||
| 
 | ||||
|         # Draw the lower lip polygon | ||||
|         cv2.polylines(vis_frame, [lower_lip_polygon], True, (0, 255, 0), 2) | ||||
| 
 | ||||
|         # Remove the red box | ||||
|         # cv2.rectangle(vis_frame, (min_x, min_y), (max_x, max_y), (0, 0, 255), 2) | ||||
| 
 | ||||
|         # Visualize the feathered mask | ||||
|         feather_amount = max( | ||||
|             1, | ||||
|             min( | ||||
|                 30, | ||||
|                 (max_x - min_x) // modules.globals.mask_feather_ratio, | ||||
|                 (max_y - min_y) // modules.globals.mask_feather_ratio, | ||||
|             ), | ||||
|         ) | ||||
|         # Ensure kernel size is odd | ||||
|         kernel_size = 2 * feather_amount + 1 | ||||
|         feathered_mask = cv2.GaussianBlur( | ||||
|             mask_region.astype(float), (kernel_size, kernel_size), 0 | ||||
|         ) | ||||
|         feathered_mask = (feathered_mask / feathered_mask.max() * 255).astype(np.uint8) | ||||
|         # Remove the feathered mask color overlay | ||||
|         # color_feathered_mask = cv2.applyColorMap(feathered_mask, cv2.COLORMAP_VIRIDIS) | ||||
| 
 | ||||
|         # Ensure shapes match before blending feathered mask | ||||
|         # if vis_region.shape == color_feathered_mask.shape: | ||||
|         #     blended_feathered = cv2.addWeighted(vis_region, 0.7, color_feathered_mask, 0.3, 0) | ||||
|         #     vis_frame[min_y:max_y, min_x:max_x] = blended_feathered | ||||
| 
 | ||||
|         # Add labels | ||||
|         cv2.putText( | ||||
|             vis_frame, | ||||
|             "Lower Mouth Mask", | ||||
|             (min_x, min_y - 10), | ||||
|             cv2.FONT_HERSHEY_SIMPLEX, | ||||
|             0.5, | ||||
|             (255, 255, 255), | ||||
|             1, | ||||
|         ) | ||||
|         cv2.putText( | ||||
|             vis_frame, | ||||
|             "Feathered Mask", | ||||
|             (min_x, max_y + 20), | ||||
|             cv2.FONT_HERSHEY_SIMPLEX, | ||||
|             0.5, | ||||
|             (255, 255, 255), | ||||
|             1, | ||||
|         ) | ||||
| 
 | ||||
|         cv2.putText(vis_frame, "Lower Mouth Mask", (min_x, min_y - 10), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 255, 255), 1) | ||||
|         return vis_frame | ||||
|     return frame | ||||
| 
 | ||||
| 
 | ||||
| def apply_mouth_area( | ||||
|     frame: np.ndarray, | ||||
|     mouth_cutout: np.ndarray, | ||||
|     mouth_box: tuple, | ||||
|     face_mask: np.ndarray, | ||||
|     mouth_polygon: np.ndarray, | ||||
| ) -> np.ndarray: | ||||
| def apply_mouth_area(frame: np.ndarray, mouth_cutout: np.ndarray, mouth_box: tuple, face_mask: np.ndarray, mouth_polygon: np.ndarray) -> np.ndarray: | ||||
|     min_x, min_y, max_x, max_y = mouth_box | ||||
|     box_width = max_x - min_x | ||||
|     box_height = max_y - min_y | ||||
| 
 | ||||
|     if ( | ||||
|         mouth_cutout is None | ||||
|         or box_width is None | ||||
|         or box_height is None | ||||
|         or face_mask is None | ||||
|         or mouth_polygon is None | ||||
|     ): | ||||
|     if mouth_cutout is None or box_width is None or box_height is None or face_mask is None or mouth_polygon is None: | ||||
|         return frame | ||||
| 
 | ||||
|     try: | ||||
|  | @ -636,44 +552,33 @@ def apply_mouth_area( | |||
|         roi = frame[min_y:max_y, min_x:max_x] | ||||
| 
 | ||||
|         if roi.shape != resized_mouth_cutout.shape: | ||||
|             resized_mouth_cutout = cv2.resize( | ||||
|                 resized_mouth_cutout, (roi.shape[1], roi.shape[0]) | ||||
|             ) | ||||
|             resized_mouth_cutout = cv2.resize(resized_mouth_cutout, (roi.shape[1], roi.shape[0])) | ||||
| 
 | ||||
|         color_corrected_mouth = apply_color_transfer(resized_mouth_cutout, roi) | ||||
| 
 | ||||
|         # Use the provided mouth polygon to create the mask | ||||
|         polygon_mask = np.zeros(roi.shape[:2], dtype=np.uint8) | ||||
|         adjusted_polygon = mouth_polygon - [min_x, min_y] | ||||
|         cv2.fillPoly(polygon_mask, [adjusted_polygon], 255) | ||||
| 
 | ||||
|         # Apply feathering to the polygon mask | ||||
|         feather_amount = min( | ||||
|             30, | ||||
|             box_width // modules.globals.mask_feather_ratio, | ||||
|             box_height // modules.globals.mask_feather_ratio, | ||||
|         ) | ||||
|         feathered_mask = cv2.GaussianBlur( | ||||
|             polygon_mask.astype(float), (0, 0), feather_amount | ||||
|         ) | ||||
|         # Improved feathering for smoother mouth mask | ||||
|         feather_amount = min(35, box_width // modules.globals.mask_feather_ratio, box_height // modules.globals.mask_feather_ratio) | ||||
|         feathered_mask = cv2.GaussianBlur(polygon_mask.astype(float), (0, 0), feather_amount * 1.2) | ||||
|         feathered_mask = feathered_mask / feathered_mask.max() | ||||
|          | ||||
|         # Additional smoothing pass for extra softness | ||||
|         feathered_mask = cv2.GaussianBlur(feathered_mask, (7, 7), 2) | ||||
|          | ||||
|         # Fix black line artifacts by ensuring smooth mask transitions | ||||
|         feathered_mask = np.clip(feathered_mask, 0.1, 0.9)  # Avoid pure 0 and 1 values | ||||
| 
 | ||||
|         face_mask_roi = face_mask[min_y:max_y, min_x:max_x] | ||||
|         combined_mask = feathered_mask * (face_mask_roi / 255.0) | ||||
| 
 | ||||
|         combined_mask = combined_mask[:, :, np.newaxis] | ||||
|         blended = ( | ||||
|             color_corrected_mouth * combined_mask + roi * (1 - combined_mask) | ||||
|         ).astype(np.uint8) | ||||
|         blended = (color_corrected_mouth * combined_mask + roi * (1 - combined_mask)).astype(np.uint8) | ||||
| 
 | ||||
|         # Apply face mask to blended result | ||||
|         face_mask_3channel = ( | ||||
|             np.repeat(face_mask_roi[:, :, np.newaxis], 3, axis=2) / 255.0 | ||||
|         ) | ||||
|         face_mask_3channel = np.repeat(face_mask_roi[:, :, np.newaxis], 3, axis=2) / 255.0 | ||||
|         final_blend = blended * face_mask_3channel + roi * (1 - face_mask_3channel) | ||||
| 
 | ||||
|         frame[min_y:max_y, min_x:max_x] = final_blend.astype(np.uint8) | ||||
|     except Exception as e: | ||||
|     except Exception: | ||||
|         pass | ||||
| 
 | ||||
|     return frame | ||||
|  | @ -683,10 +588,7 @@ def create_face_mask(face: Face, frame: Frame) -> np.ndarray: | |||
|     mask = np.zeros(frame.shape[:2], dtype=np.uint8) | ||||
|     landmarks = face.landmark_2d_106 | ||||
|     if landmarks is not None: | ||||
|         # Convert landmarks to int32 | ||||
|         landmarks = landmarks.astype(np.int32) | ||||
| 
 | ||||
|         # Extract facial features | ||||
|         right_side_face = landmarks[0:16] | ||||
|         left_side_face = landmarks[17:32] | ||||
|         right_eye = landmarks[33:42] | ||||
|  | @ -694,39 +596,22 @@ def create_face_mask(face: Face, frame: Frame) -> np.ndarray: | |||
|         left_eye = landmarks[87:96] | ||||
|         left_eye_brow = landmarks[97:105] | ||||
| 
 | ||||
|         # Calculate forehead extension | ||||
|         right_eyebrow_top = np.min(right_eye_brow[:, 1]) | ||||
|         left_eyebrow_top = np.min(left_eye_brow[:, 1]) | ||||
|         eyebrow_top = min(right_eyebrow_top, left_eyebrow_top) | ||||
| 
 | ||||
|         face_top = np.min([right_side_face[0, 1], left_side_face[-1, 1]]) | ||||
|         forehead_height = face_top - eyebrow_top | ||||
|         extended_forehead_height = int(forehead_height * 5.0)  # Extend by 50% | ||||
|         extended_forehead_height = int(forehead_height * 5.0) | ||||
| 
 | ||||
|         # Create forehead points | ||||
|         forehead_left = right_side_face[0].copy() | ||||
|         forehead_right = left_side_face[-1].copy() | ||||
|         forehead_left[1] -= extended_forehead_height | ||||
|         forehead_right[1] -= extended_forehead_height | ||||
| 
 | ||||
|         # Combine all points to create the face outline | ||||
|         face_outline = np.vstack( | ||||
|             [ | ||||
|                 [forehead_left], | ||||
|                 right_side_face, | ||||
|                 left_side_face[ | ||||
|                     ::-1 | ||||
|                 ],  # Reverse left side to create a continuous outline | ||||
|                 [forehead_right], | ||||
|             ] | ||||
|         ) | ||||
|         face_outline = np.vstack([[forehead_left], right_side_face, left_side_face[::-1], [forehead_right]]) | ||||
|         padding = int(np.linalg.norm(right_side_face[0] - left_side_face[-1]) * 0.05) | ||||
| 
 | ||||
|         # Calculate padding | ||||
|         padding = int( | ||||
|             np.linalg.norm(right_side_face[0] - left_side_face[-1]) * 0.05 | ||||
|         )  # 5% of face width | ||||
| 
 | ||||
|         # Create a slightly larger convex hull for padding | ||||
|         hull = cv2.convexHull(face_outline) | ||||
|         hull_padded = [] | ||||
|         for point in hull: | ||||
|  | @ -738,33 +623,23 @@ def create_face_mask(face: Face, frame: Frame) -> np.ndarray: | |||
|             hull_padded.append(padded_point) | ||||
| 
 | ||||
|         hull_padded = np.array(hull_padded, dtype=np.int32) | ||||
| 
 | ||||
|         # Fill the padded convex hull | ||||
|         cv2.fillConvexPoly(mask, hull_padded, 255) | ||||
| 
 | ||||
|         # Smooth the mask edges | ||||
|         mask = cv2.GaussianBlur(mask, (5, 5), 3) | ||||
| 
 | ||||
|     return mask | ||||
| 
 | ||||
| 
 | ||||
| def apply_color_transfer(source, target): | ||||
|     """ | ||||
|     Apply color transfer from target to source image | ||||
|     """ | ||||
|     source = cv2.cvtColor(source, cv2.COLOR_BGR2LAB).astype("float32") | ||||
|     target = cv2.cvtColor(target, cv2.COLOR_BGR2LAB).astype("float32") | ||||
| 
 | ||||
|     source_mean, source_std = cv2.meanStdDev(source) | ||||
|     target_mean, target_std = cv2.meanStdDev(target) | ||||
| 
 | ||||
|     # Reshape mean and std to be broadcastable | ||||
|     source_mean = source_mean.reshape(1, 1, 3) | ||||
|     source_std = source_std.reshape(1, 1, 3) | ||||
|     target_mean = target_mean.reshape(1, 1, 3) | ||||
|     target_std = target_std.reshape(1, 1, 3) | ||||
| 
 | ||||
|     # Perform the color transfer | ||||
|     source = (source - source_mean) * (target_std / source_std) + target_mean | ||||
| 
 | ||||
|     return cv2.cvtColor(np.clip(source, 0, 255).astype("uint8"), cv2.COLOR_LAB2BGR) | ||||
|     return cv2.cvtColor(np.clip(source, 0, 255).astype("uint8"), cv2.COLOR_LAB2BGR) | ||||
|  | @ -3,8 +3,6 @@ import numpy as np | |||
| from typing import Optional, Tuple, Callable | ||||
| import platform | ||||
| import threading | ||||
| import time | ||||
| from collections import deque | ||||
| 
 | ||||
| # Only import Windows-specific library if on Windows | ||||
| if platform.system() == "Windows": | ||||
|  | @ -19,17 +17,6 @@ class VideoCapturer: | |||
|         self._frame_ready = threading.Event() | ||||
|         self.is_running = False | ||||
|         self.cap = None | ||||
|          | ||||
|         # Performance tracking | ||||
|         self.frame_times = deque(maxlen=30) | ||||
|         self.current_fps = 0 | ||||
|         self.target_fps = 30 | ||||
|         self.frame_skip = 1 | ||||
|         self.frame_counter = 0 | ||||
|          | ||||
|         # Buffer management | ||||
|         self.frame_buffer = deque(maxlen=3) | ||||
|         self.buffer_lock = threading.Lock() | ||||
| 
 | ||||
|         # Initialize Windows-specific components if on Windows | ||||
|         if platform.system() == "Windows": | ||||
|  | @ -42,10 +29,8 @@ class VideoCapturer: | |||
|                 ) | ||||
| 
 | ||||
|     def start(self, width: int = 960, height: int = 540, fps: int = 60) -> bool: | ||||
|         """Initialize and start video capture with performance optimizations""" | ||||
|         """Initialize and start video capture""" | ||||
|         try: | ||||
|             self.target_fps = fps | ||||
|              | ||||
|             if platform.system() == "Windows": | ||||
|                 # Windows-specific capture methods | ||||
|                 capture_methods = [ | ||||
|  | @ -70,14 +55,10 @@ class VideoCapturer: | |||
|             if not self.cap or not self.cap.isOpened(): | ||||
|                 raise RuntimeError("Failed to open camera") | ||||
| 
 | ||||
|             # Configure format with performance optimizations | ||||
|             # Configure format | ||||
|             self.cap.set(cv2.CAP_PROP_FRAME_WIDTH, width) | ||||
|             self.cap.set(cv2.CAP_PROP_FRAME_HEIGHT, height) | ||||
|             self.cap.set(cv2.CAP_PROP_FPS, fps) | ||||
|              | ||||
|             # Additional performance settings | ||||
|             self.cap.set(cv2.CAP_PROP_BUFFERSIZE, 1)  # Reduce buffer to minimize latency | ||||
|             self.cap.set(cv2.CAP_PROP_FOURCC, cv2.VideoWriter_fourcc('M', 'J', 'P', 'G'))  # Use MJPEG for better performance | ||||
| 
 | ||||
|             self.is_running = True | ||||
|             return True | ||||
|  | @ -89,57 +70,17 @@ class VideoCapturer: | |||
|             return False | ||||
| 
 | ||||
|     def read(self) -> Tuple[bool, Optional[np.ndarray]]: | ||||
|         """Read a frame from the camera with performance optimizations""" | ||||
|         """Read a frame from the camera""" | ||||
|         if not self.is_running or self.cap is None: | ||||
|             return False, None | ||||
| 
 | ||||
|         start_time = time.time() | ||||
|          | ||||
|         # Implement frame skipping for performance | ||||
|         self.frame_counter += 1 | ||||
|         if self.frame_counter % self.frame_skip != 0: | ||||
|             # Skip this frame but still read to clear buffer | ||||
|             ret, _ = self.cap.read() | ||||
|             return ret, self._current_frame if ret else None | ||||
| 
 | ||||
|         ret, frame = self.cap.read() | ||||
|         if ret: | ||||
|             self._current_frame = frame | ||||
|              | ||||
|             # Update performance metrics | ||||
|             frame_time = time.time() - start_time | ||||
|             self.frame_times.append(frame_time) | ||||
|             self._update_performance_metrics() | ||||
|              | ||||
|             # Add to buffer for processing | ||||
|             with self.buffer_lock: | ||||
|                 self.frame_buffer.append(frame.copy()) | ||||
|              | ||||
|             if self.frame_callback: | ||||
|                 self.frame_callback(frame) | ||||
|             return True, frame | ||||
|         return False, None | ||||
|      | ||||
|     def _update_performance_metrics(self): | ||||
|         """Update FPS and adjust frame skipping based on performance""" | ||||
|         if len(self.frame_times) >= 10: | ||||
|             avg_frame_time = sum(list(self.frame_times)[-10:]) / 10 | ||||
|             self.current_fps = 1.0 / avg_frame_time if avg_frame_time > 0 else 0 | ||||
|              | ||||
|             # Adaptive frame skipping | ||||
|             if self.current_fps < self.target_fps * 0.8: | ||||
|                 self.frame_skip = min(3, self.frame_skip + 1) | ||||
|             elif self.current_fps > self.target_fps * 0.95: | ||||
|                 self.frame_skip = max(1, self.frame_skip - 1) | ||||
|      | ||||
|     def get_buffered_frame(self) -> Optional[np.ndarray]: | ||||
|         """Get the latest frame from buffer""" | ||||
|         with self.buffer_lock: | ||||
|             return self.frame_buffer[-1] if self.frame_buffer else None | ||||
|      | ||||
|     def get_fps(self) -> float: | ||||
|         """Get current FPS""" | ||||
|         return self.current_fps | ||||
| 
 | ||||
|     def release(self) -> None: | ||||
|         """Stop capture and release resources""" | ||||
|  |  | |||
|  | @ -1,46 +0,0 @@ | |||
| { | ||||
|   "performance_modes": { | ||||
|     "fast": { | ||||
|       "quality_level": 0.6, | ||||
|       "face_detection_interval": 0.2, | ||||
|       "target_fps": 30, | ||||
|       "frame_skip": 2, | ||||
|       "enable_caching": true, | ||||
|       "processing_resolution_scale": 0.7, | ||||
|       "description": "Optimized for maximum FPS with acceptable quality" | ||||
|     }, | ||||
|     "balanced": { | ||||
|       "quality_level": 0.85, | ||||
|       "face_detection_interval": 0.1, | ||||
|       "target_fps": 25, | ||||
|       "frame_skip": 1, | ||||
|       "enable_caching": true, | ||||
|       "processing_resolution_scale": 0.85, | ||||
|       "description": "Balance between quality and performance" | ||||
|     }, | ||||
|     "quality": { | ||||
|       "quality_level": 1.0, | ||||
|       "face_detection_interval": 0.05, | ||||
|       "target_fps": 20, | ||||
|       "frame_skip": 1, | ||||
|       "enable_caching": false, | ||||
|       "processing_resolution_scale": 1.0, | ||||
|       "description": "Maximum quality with slower processing" | ||||
|     } | ||||
|   }, | ||||
|   "advanced_settings": { | ||||
|     "color_matching_strength": 0.7, | ||||
|     "edge_smoothing_enabled": true, | ||||
|     "adaptive_quality_enabled": true, | ||||
|     "gpu_memory_optimization": true, | ||||
|     "face_cache_size": 10, | ||||
|     "frame_buffer_size": 3 | ||||
|   }, | ||||
|   "quality_enhancements": { | ||||
|     "enable_color_correction": true, | ||||
|     "enable_edge_smoothing": true, | ||||
|     "enable_advanced_blending": true, | ||||
|     "skin_tone_matching": true, | ||||
|     "lighting_adaptation": true | ||||
|   } | ||||
| } | ||||
|  | @ -14,8 +14,8 @@ torch; sys_platform != 'darwin' | |||
| torch==2.5.1; sys_platform == 'darwin' | ||||
| torchvision; sys_platform != 'darwin' | ||||
| torchvision==0.20.1; sys_platform == 'darwin' | ||||
| onnxruntime-silicon==1.16.3; sys_platform == 'darwin' and platform_machine == 'arm64' | ||||
| onnxruntime-gpu==1.22.0; sys_platform != 'darwin' | ||||
| tensorflow; sys_platform != 'darwin' | ||||
| opennsfw2==0.10.2 | ||||
| protobuf==4.25.1 | ||||
| pygrabber | ||||
|  | @ -1,120 +0,0 @@ | |||
| #!/usr/bin/env python3 | ||||
| """ | ||||
| Deep-Live-Cam Performance Setup Script | ||||
| Easy configuration for optimal performance based on your hardware | ||||
| """ | ||||
| 
 | ||||
| import sys | ||||
| import os | ||||
| sys.path.append(os.path.dirname(os.path.abspath(__file__))) | ||||
| 
 | ||||
| from modules.performance_manager import performance_manager | ||||
| import psutil | ||||
| import platform | ||||
| 
 | ||||
| def print_header(): | ||||
|     print("=" * 60) | ||||
|     print("🎭 Deep-Live-Cam Performance Optimizer") | ||||
|     print("=" * 60) | ||||
|     print() | ||||
| 
 | ||||
| def analyze_system(): | ||||
|     """Analyze system specifications""" | ||||
|     print("📊 Analyzing your system...") | ||||
|     print("-" * 40) | ||||
|      | ||||
|     # System info | ||||
|     print(f"OS: {platform.system()} {platform.release()}") | ||||
|     print(f"CPU: {platform.processor()}") | ||||
|     print(f"CPU Cores: {psutil.cpu_count()}") | ||||
|     print(f"RAM: {psutil.virtual_memory().total / (1024**3):.1f} GB") | ||||
|      | ||||
|     # GPU info | ||||
|     try: | ||||
|         import torch | ||||
|         if torch.cuda.is_available(): | ||||
|             gpu_name = torch.cuda.get_device_name(0) | ||||
|             gpu_memory = torch.cuda.get_device_properties(0).total_memory / (1024**3) | ||||
|             print(f"GPU: {gpu_name} ({gpu_memory:.1f} GB)") | ||||
|         else: | ||||
|             print("GPU: Not available or not CUDA-compatible") | ||||
|     except ImportError: | ||||
|         print("GPU: PyTorch not available") | ||||
|      | ||||
|     print() | ||||
| 
 | ||||
| def show_performance_modes(): | ||||
|     """Display available performance modes""" | ||||
|     print("🎯 Available Performance Modes:") | ||||
|     print("-" * 40) | ||||
|      | ||||
|     modes = performance_manager.get_all_modes() | ||||
|     for mode_name, mode_config in modes.items(): | ||||
|         print(f"\n{mode_name.upper()}:") | ||||
|         print(f"  Quality Level: {mode_config['quality_level']}") | ||||
|         print(f"  Target FPS: {mode_config['target_fps']}") | ||||
|         print(f"  Detection Interval: {mode_config['face_detection_interval']}s") | ||||
|         if 'description' in mode_config: | ||||
|             print(f"  Description: {mode_config['description']}") | ||||
| 
 | ||||
| def interactive_setup(): | ||||
|     """Interactive performance setup""" | ||||
|     print("🛠️ Interactive Setup:") | ||||
|     print("-" * 40) | ||||
|      | ||||
|     print("\nChoose your priority:") | ||||
|     print("1. Maximum FPS (for live streaming)") | ||||
|     print("2. Balanced performance and quality") | ||||
|     print("3. Best quality (for video processing)") | ||||
|     print("4. Auto-optimize based on hardware") | ||||
|      | ||||
|     while True: | ||||
|         try: | ||||
|             choice = input("\nEnter your choice (1-4): ").strip() | ||||
|              | ||||
|             if choice == "1": | ||||
|                 performance_manager.set_performance_mode("fast") | ||||
|                 print("✅ Set to FAST mode - Maximum FPS") | ||||
|                 break | ||||
|             elif choice == "2": | ||||
|                 performance_manager.set_performance_mode("balanced") | ||||
|                 print("✅ Set to BALANCED mode - Good balance") | ||||
|                 break | ||||
|             elif choice == "3": | ||||
|                 performance_manager.set_performance_mode("quality") | ||||
|                 print("✅ Set to QUALITY mode - Best results") | ||||
|                 break | ||||
|             elif choice == "4": | ||||
|                 optimal_mode = performance_manager.optimize_for_hardware() | ||||
|                 print(f"✅ Auto-optimized to {optimal_mode.upper()} mode") | ||||
|                 break | ||||
|             else: | ||||
|                 print("❌ Invalid choice. Please enter 1, 2, 3, or 4.") | ||||
|                  | ||||
|         except KeyboardInterrupt: | ||||
|             print("\n\n👋 Setup cancelled.") | ||||
|             return | ||||
| 
 | ||||
| def show_tips(): | ||||
|     """Show performance tips""" | ||||
|     print("\n💡 Performance Tips:") | ||||
|     print("-" * 40) | ||||
|      | ||||
|     tips = performance_manager.get_performance_tips() | ||||
|     for tip in tips: | ||||
|         print(f"  {tip}") | ||||
| 
 | ||||
| def main(): | ||||
|     print_header() | ||||
|     analyze_system() | ||||
|     show_performance_modes() | ||||
|     interactive_setup() | ||||
|     show_tips() | ||||
|      | ||||
|     print("\n" + "=" * 60) | ||||
|     print("🎉 Setup complete! You can change these settings anytime by running this script again.") | ||||
|     print("💻 Start Deep-Live-Cam with: python run.py") | ||||
|     print("=" * 60) | ||||
| 
 | ||||
| if __name__ == "__main__": | ||||
|     main() | ||||
		Loading…
	
		Reference in New Issue