import os import platform import webbrowser import customtkinter as ctk from typing import Callable, Tuple, List, Any from types import ModuleType import cv2 from PIL import Image, ImageOps import pyvirtualcam # Import OS-specific modules only when necessary if platform.system() == 'Darwin': # macOS import AVFoundation # Import Windows specific modules only when on windows platform if platform.system() == 'Windows' or platform.system() == 'Linux': # Windows or Linux from pygrabber.dshow_graph import FilterGraph import modules.globals import modules.metadata from modules.face_analyser import get_one_face from modules.capturer import get_video_frame, get_video_frame_total from modules.processors.frame.core import get_frame_processors_modules from modules.utilities import is_image, is_video, resolve_relative_path ROOT = None ROOT_HEIGHT = 800 ROOT_WIDTH = 600 PREVIEW = None PREVIEW_MAX_HEIGHT = 700 PREVIEW_MAX_WIDTH = 1200 PREVIEW_DEFAULT_WIDTH = 960 PREVIEW_DEFAULT_HEIGHT = 540 RECENT_DIRECTORY_SOURCE = None RECENT_DIRECTORY_TARGET = None RECENT_DIRECTORY_OUTPUT = None preview_label = None preview_slider = None source_label = None target_label = None status_label = None img_ft, vid_ft = modules.globals.file_types camera = None def check_camera_permissions(): """Check and request camera access permission on macOS.""" if platform.system() == 'Darwin': # macOS-specific auth_status = AVFoundation.AVCaptureDevice.authorizationStatusForMediaType_(AVFoundation.AVMediaTypeVideo) if auth_status == AVFoundation.AVAuthorizationStatusNotDetermined: # Request access to the camera def completion_handler(granted): if granted: print("Access granted to the camera.") else: print("Access denied to the camera.") AVFoundation.AVCaptureDevice.requestAccessForMediaType_completionHandler_(AVFoundation.AVMediaTypeVideo, completion_handler) elif auth_status == AVFoundation.AVAuthorizationStatusAuthorized: print("Camera access already authorized.") elif auth_status == AVFoundation.AVAuthorizationStatusDenied: print("Camera access denied. Please enable it in System Preferences.") elif auth_status == AVFoundation.AVAuthorizationStatusRestricted: print("Camera access restricted. The app is not allowed to use the camera.") def select_camera(camera_name: str): """Select the appropriate camera based on its name (cross-platform).""" if platform.system() == 'Darwin': # macOS-specific devices = AVFoundation.AVCaptureDevice.devicesWithMediaType_(AVFoundation.AVMediaTypeVideo) for device in devices: if device.localizedName() == camera_name: return device elif platform.system() == 'Windows' or platform.system() == 'Linux': # On Windows/Linux, simply return the camera name as OpenCV can handle it by index return camera_name return None def init(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.CTk: global ROOT, PREVIEW if platform.system() == 'Darwin': # macOS-specific check_camera_permissions() # Check camera permissions before initializing the UI ROOT = create_root(start, destroy) PREVIEW = create_preview(ROOT) return ROOT def create_root(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.CTk: global source_label, target_label, status_label ctk.deactivate_automatic_dpi_awareness() ctk.set_appearance_mode('system') ctk.set_default_color_theme(resolve_relative_path('ui.json')) print("Creating root window...") root = ctk.CTk() root.minsize(ROOT_WIDTH, ROOT_HEIGHT) root.title(f'{modules.metadata.name} {modules.metadata.version} {modules.metadata.edition}') root.protocol('WM_DELETE_WINDOW', lambda: destroy()) source_label = ctk.CTkLabel(root, text=None) source_label.place(relx=0.1, rely=0.0875, relwidth=0.3, relheight=0.25) target_label = ctk.CTkLabel(root, text=None) target_label.place(relx=0.6, rely=0.0875, relwidth=0.3, relheight=0.25) source_button = ctk.CTkButton(root, text='Select a face', cursor='hand2', command=select_source_path) source_button.place(relx=0.1, rely=0.35, relwidth=0.3, relheight=0.1) swap_faces_button = ctk.CTkButton(root, text='↔', cursor='hand2', command=lambda: swap_faces_paths()) swap_faces_button.place(relx=0.45, rely=0.4, relwidth=0.1, relheight=0.1) target_button = ctk.CTkButton(root, text='Select a target', cursor='hand2', command=select_target_path) target_button.place(relx=0.6, rely=0.35, relwidth=0.3, relheight=0.1) keep_fps_value = ctk.BooleanVar(value=modules.globals.keep_fps) keep_fps_checkbox = ctk.CTkSwitch(root, text='Keep fps', variable=keep_fps_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_fps', not modules.globals.keep_fps)) keep_fps_checkbox.place(relx=0.1, rely=0.525) keep_frames_value = ctk.BooleanVar(value=modules.globals.keep_frames) keep_frames_switch = ctk.CTkSwitch(root, text='Keep frames', variable=keep_frames_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_frames', keep_frames_value.get())) keep_frames_switch.place(relx=0.1, rely=0.56875) enhancer_value = ctk.BooleanVar(value=modules.globals.fp_ui['face_enhancer']) enhancer_switch = ctk.CTkSwitch(root, text='Face Enhancer', variable=enhancer_value, cursor='hand2', command=lambda: update_tumbler('face_enhancer', enhancer_value.get())) enhancer_switch.place(relx=0.1, rely=0.6125) keep_audio_value = ctk.BooleanVar(value=modules.globals.keep_audio) keep_audio_switch = ctk.CTkSwitch(root, text='Keep audio', variable=keep_audio_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_audio', keep_audio_value.get())) keep_audio_switch.place(relx=0.6, rely=0.525) many_faces_value = ctk.BooleanVar(value=modules.globals.many_faces) many_faces_switch = ctk.CTkSwitch(root, text='Many faces', variable=many_faces_value, cursor='hand2', command=lambda: setattr(modules.globals, 'many_faces', many_faces_value.get())) many_faces_switch.place(relx=0.6, rely=0.56875) nsfw_value = ctk.BooleanVar(value=modules.globals.nsfw) nsfw_switch = ctk.CTkSwitch(root, text='NSFW', variable=nsfw_value, cursor='hand2', command=lambda: setattr(modules.globals, 'nsfw', nsfw_value.get())) nsfw_switch.place(relx=0.6, rely=0.6125) start_button = ctk.CTkButton(root, text='Start', cursor='hand2', command=lambda: select_output_path(start)) start_button.place(relx=0.15, rely=0.7, relwidth=0.2, relheight=0.05) stop_button = ctk.CTkButton(root, text='Destroy', cursor='hand2', command=destroy) stop_button.place(relx=0.4, rely=0.7, relwidth=0.2, relheight=0.05) preview_button = ctk.CTkButton(root, text='Preview', cursor='hand2', command=toggle_preview) preview_button.place(relx=0.65, rely=0.7, relwidth=0.2, relheight=0.05) camera_label = ctk.CTkLabel(root, text="Select Camera:") camera_label.place(relx=0.4, rely=0.7525, relwidth=0.2, relheight=0.05) available_cameras = get_available_cameras() available_camera_strings = [str(cam) for cam in available_cameras] camera_variable = ctk.StringVar(value=available_camera_strings[0] if available_camera_strings else "No cameras found") camera_optionmenu = ctk.CTkOptionMenu(root, variable=camera_variable, values=available_camera_strings) camera_optionmenu.place(relx=0.65, rely=0.7525, relwidth=0.2, relheight=0.05) virtual_cam_out_value = ctk.BooleanVar(value=False) virtual_cam_out_switch = ctk.CTkSwitch(root, text='Virtual Cam Output (OBS)', variable=virtual_cam_out_value, cursor='hand2') virtual_cam_out_switch.place(relx=0.4, rely=0.805) live_button = ctk.CTkButton(root, text='Live', cursor='hand2', command=lambda: webcam_preview(camera_variable.get(), virtual_cam_out_value.get())) live_button.place(relx=0.15, rely=0.7525, relwidth=0.2, relheight=0.05) status_label = ctk.CTkLabel(root, text=None, justify='center') status_label.place(relx=0.1, relwidth=0.8, rely=0.875) donate_label = ctk.CTkLabel(root, text='Deep Live Cam', justify='center', cursor='hand2') donate_label.place(relx=0.1, rely=0.95, relwidth=0.8) donate_label.configure(text_color=ctk.ThemeManager.theme.get('URL').get('text_color')) donate_label.bind('', lambda event: webbrowser.open('https://paypal.me/hacksider')) return root def create_preview(parent: ctk.CTk) -> ctk.CTkToplevel: global preview_label, preview_slider preview = ctk.CTkToplevel(parent) preview.withdraw() preview.title('Preview') preview.protocol('WM_DELETE_WINDOW', toggle_preview) preview.resizable(width=True, height=True) preview_label = ctk.CTkLabel(preview, text=None) preview_label.pack(fill='both', expand=True) preview_slider = ctk.CTkSlider(preview, from_=0, to=0, command=update_preview) return preview def update_status(text: str) -> None: status_label.configure(text=text) ROOT.update() def update_tumbler(var: str, value: bool) -> None: modules.globals.fp_ui[var] = value def select_source_path() -> None: global RECENT_DIRECTORY_SOURCE PREVIEW.withdraw() source_path = ctk.filedialog.askopenfilename(title='Select a source image', initialdir=RECENT_DIRECTORY_SOURCE, filetypes=[img_ft]) if is_image(source_path): modules.globals.source_path = source_path RECENT_DIRECTORY_SOURCE = os.path.dirname(modules.globals.source_path) image = render_image_preview(modules.globals.source_path, (200, 200)) source_label.configure(image=image) else: modules.globals.source_path = None source_label.configure(image=None) def swap_faces_paths() -> None: global RECENT_DIRECTORY_SOURCE, RECENT_DIRECTORY_TARGET source_path = modules.globals.source_path target_path = modules.globals.target_path if not is_image(source_path) or not is_image(target_path): return modules.globals.source_path = target_path modules.globals.target_path = source_path RECENT_DIRECTORY_SOURCE = os.path.dirname(modules.globals.source_path) RECENT_DIRECTORY_TARGET = os.path.dirname(modules.globals.target_path) PREVIEW.withdraw() source_image = render_image_preview(modules.globals.source_path, (200, 200)) source_label.configure(image=source_image) target_image = render_image_preview(modules.globals.target_path, (200, 200)) target_label.configure(image=target_image) def select_target_path() -> None: global RECENT_DIRECTORY_TARGET PREVIEW.withdraw() target_path = ctk.filedialog.askopenfilename(title='Select a target image or video', initialdir=RECENT_DIRECTORY_TARGET, filetypes=[img_ft, vid_ft]) if is_image(target_path): modules.globals.target_path = target_path RECENT_DIRECTORY_TARGET = os.path.dirname(modules.globals.target_path) image = render_image_preview(modules.globals.target_path, (200, 200)) target_label.configure(image=image) elif is_video(target_path): modules.globals.target_path = target_path RECENT_DIRECTORY_TARGET = os.path.dirname(modules.globals.target_path) video_frame = render_video_preview(target_path, (200, 200)) target_label.configure(image=video_frame) else: modules.globals.target_path = None target_label.configure(image=None) def select_output_path(start: Callable[[], None]) -> None: global RECENT_DIRECTORY_OUTPUT if is_image(modules.globals.target_path): output_path = ctk.filedialog.asksaveasfilename(title='Save image output file', filetypes=[img_ft], defaultextension='.png', initialfile='output.png', initialdir=RECENT_DIRECTORY_OUTPUT) elif is_video(modules.globals.target_path): output_path = ctk.filedialog.asksaveasfilename(title='Save video output file', filetypes=[vid_ft], defaultextension='.mp4', initialfile='output.mp4', initialdir=RECENT_DIRECTORY_OUTPUT) else: output_path = None if output_path: modules.globals.output_path = output_path RECENT_DIRECTORY_OUTPUT = os.path.dirname(modules.globals.output_path) start() def render_image_preview(image_path: str, size: Tuple[int, int]) -> ctk.CTkImage: image = Image.open(image_path) if size: image = ImageOps.fit(image, size, Image.LANCZOS) return ctk.CTkImage(image, size=image.size) def render_video_preview(video_path: str, size: Tuple[int, int], frame_number: int = 0) -> ctk.CTkImage: capture = cv2.VideoCapture(video_path) if frame_number: capture.set(cv2.CAP_PROP_POS_FRAMES, frame_number) has_frame, frame = capture.read() capture.release() if has_frame: image = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)) if size: image = ImageOps.fit(image, size, Image.LANCZOS) return ctk.CTkImage(image, size=image.size) return None def toggle_preview() -> None: if PREVIEW.state() == 'normal': PREVIEW.withdraw() elif modules.globals.source_path and modules.globals.target_path: init_preview() update_preview() PREVIEW.deiconify() global camera if PREVIEW.state() == 'withdrawn': if camera and camera.isOpened(): camera.release() camera = None def init_preview() -> None: if is_image(modules.globals.target_path): preview_slider.pack_forget() elif is_video(modules.globals.target_path): video_frame_total = get_video_frame_total(modules.globals.target_path) preview_slider.configure(to=video_frame_total) preview_slider.pack(fill='x') preview_slider.set(0) def update_preview(frame_number: int = 0) -> None: if modules.globals.source_path and modules.globals.target_path: temp_frame = get_video_frame(modules.globals.target_path, frame_number) if not modules.globals.nsfw: from modules.predicter import predict_frame if predict_frame(temp_frame): quit() for frame_processor in get_frame_processors_modules(modules.globals.frame_processors): temp_frame = frame_processor.process_frame( get_one_face(cv2.imread(modules.globals.source_path)), temp_frame ) image = Image.fromarray(cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB)) image = ImageOps.contain(image, (PREVIEW_MAX_WIDTH, PREVIEW_MAX_HEIGHT), Image.LANCZOS) image = ctk.CTkImage(image, size=image.size) preview_label.configure(image=image) def webcam_preview_loop(camera: cv2.VideoCapture, source_image: Any, frame_processors: List[ModuleType], virtual_cam: pyvirtualcam.Camera = None) -> bool: global preview_label, PREVIEW ret, frame = camera.read() if not ret: update_status(f"Error: Frame not received from camera.") return False temp_frame = frame.copy() if modules.globals.live_mirror: temp_frame = cv2.flip(temp_frame, 1) # horizontal flipping if modules.globals.live_resizable: temp_frame = fit_image_to_size(temp_frame, PREVIEW.winfo_width(), PREVIEW.winfo_height()) for frame_processor in frame_processors: temp_frame = frame_processor.process_frame(source_image, temp_frame) image = Image.fromarray(cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB)) image = ImageOps.contain(image, (temp_frame.shape[1], temp_frame.shape[0]), Image.LANCZOS) image = ctk.CTkImage(image, size=image.size) preview_label.configure(image=image) if virtual_cam: virtual_cam.send(temp_frame) virtual_cam.sleep_until_next_frame() ROOT.update() if PREVIEW.state() == 'withdrawn': return False return True def fit_image_to_size(image, width: int, height: int): if width is None and height is None: return image h, w, _ = image.shape ratio_h = 0.0 ratio_w = 0.0 if width > height: ratio_h = height / h else: ratio_w = width / w ratio = max(ratio_w, ratio_h) new_size = (int(ratio * w), int(ratio * h)) return cv2.resize(image, dsize=new_size) def webcam_preview(camera_name: str, virtual_cam_output: bool): if modules.globals.source_path is None: return global preview_label, PREVIEW WIDTH = 960 HEIGHT = 540 FPS = 60 # Select the camera by its name selected_camera = select_camera(camera_name) if selected_camera is None: update_status(f"No suitable camera found.") return # Use OpenCV's camera index for cross-platform compatibility camera_index = get_camera_index_by_name(camera_name) global camera camera = cv2.VideoCapture(camera_index) if not camera.isOpened(): update_status(f"Error: Could not open camera {camera_name}") return camera.set(cv2.CAP_PROP_FRAME_WIDTH, WIDTH) camera.set(cv2.CAP_PROP_FRAME_HEIGHT, HEIGHT) camera.set(cv2.CAP_PROP_FPS, FPS) PREVIEW_MAX_WIDTH = WIDTH PREVIEW_MAX_HEIGHT = HEIGHT preview_label.configure(width=PREVIEW_DEFAULT_WIDTH, height=PREVIEW_DEFAULT_HEIGHT) PREVIEW.deiconify() frame_processors = get_frame_processors_modules(modules.globals.frame_processors) source_image = get_one_face(cv2.imread(modules.globals.source_path)) preview_running = True if virtual_cam_output: with pyvirtualcam.Camera(width=WIDTH, height=HEIGHT, fps=FPS, fmt=pyvirtualcam.PixelFormat.BGR) as virtual_cam: while preview_running: preview_running = webcam_preview_loop(camera, source_image, frame_processors, virtual_cam) while preview_running: preview_running = webcam_preview_loop(camera, source_image, frame_processors) if camera: camera.release() PREVIEW.withdraw() def get_camera_index_by_name(camera_name: str) -> int: """Map camera name to index for OpenCV.""" if platform.system() == 'Darwin': # macOS-specific if "FaceTime" in camera_name: return 0 # Assuming FaceTime is at index 0 elif "iPhone" in camera_name: return 1 # Assuming iPhone camera is at index 1 elif platform.system() == 'Windows' or platform.system() == 'Linux': # Map camera name to index dynamically (OpenCV on these platforms usually starts with 0) return get_available_cameras().index(camera_name) return -1 def get_available_cameras(): """Get available camera names (cross-platform).""" available_cameras = [] if platform.system() == 'Darwin': # macOS-specific devices = AVFoundation.AVCaptureDevice.devicesWithMediaType_(AVFoundation.AVMediaTypeVideo) for device in devices: if device.deviceType() == AVFoundation.AVCaptureDeviceTypeBuiltInWideAngleCamera: print(f"Found Built-In Camera: {device.localizedName()}") available_cameras.append(device.localizedName()) elif device.deviceType() == "AVCaptureDeviceTypeExternal": print(f"Found External Camera: {device.localizedName()}") available_cameras.append(device.localizedName()) elif device.deviceType() == "AVCaptureDeviceTypeContinuityCamera": print(f"Skipping Continuity Camera: {device.localizedName()}") elif platform.system() == 'Windows' or platform.system() == 'Linux': try: devices = FilterGraph().get_input_devices() except Exception as e: # Use OpenCV to detect camera indexes index = 0 devices = [] while True: cap = cv2.VideoCapture(index) if not cap.isOpened(): break devices.append(f"Camera {index}") cap.release() index += 1 available_cameras = devices return available_cameras