update some instruction
							parent
							
								
									2b2aa74644
								
							
						
					
					
						commit
						2293c54523
					
				
								
									
									
										
											31
										
									
									README.md
									
									
									
									
								
								
							
							
										
											31
										
									
									README.md
									
									
									
									
								|  | @ -1,9 +1,3 @@ | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| Take a video and replace the face in it with a face of your choice. You only need one image of the desired face. No dataset, no training. |  | ||||||
| 
 |  | ||||||
| You can watch some demos [here](https://drive.google.com/drive/folders/1KHv8n_rd3Lcr2v7jBq1yPSTWM554Gq8e?usp=sharing). A StableDiffusion extension is also available, [here](https://github.com/s0md3v/sd-webui-roop). |  | ||||||
| 
 |  | ||||||
|  |  | ||||||
| 
 | 
 | ||||||
| ## Disclaimer | ## Disclaimer | ||||||
|  | @ -15,29 +9,22 @@ Users of this software are expected to use this software responsibly while abidi | ||||||
| 
 | 
 | ||||||
| ## How do I install it? | ## How do I install it? | ||||||
| 
 | 
 | ||||||
| ### Single command install |  | ||||||
| 
 |  | ||||||
| For Windows, [download this file](https://github.com/hacksider/roop-cam/files/12358726/1_click_install.zip), extract it to a folder whose path contains no spaces, then run (double-click) |  | ||||||
| ``` |  | ||||||
| windows_run.bat |  | ||||||
| ``` |  | ||||||
| 
 |  | ||||||
| Then go to the roop-cam folder and double-click |  | ||||||
| ``` |  | ||||||
| run-cuda-windows.bat |  | ||||||
| ``` |  | ||||||
| 
 | 
 | ||||||
| ### Basic: It is more likely to work on your computer but it will also be very slow. You can follow instructions for the basic install (This usually runs via **CPU**) | ### Basic: It is more likely to work on your computer but it will also be very slow. You can follow instructions for the basic install (This usually runs via **CPU**) | ||||||
| #### 1.Setup your platform | #### 1.Setup your platform | ||||||
| -   python (3.10 recommended) | -   python (3.10 recommended) | ||||||
| -   pip | -   pip | ||||||
| -   git | -   git | ||||||
| -   ffmpeg | -   [ffmpeg](https://www.youtube.com/watch?v=OlNWCpFdVMA)  | ||||||
| -   visual studio 2022 runtimes (windows) | -   [visual studio 2022 runtimes (windows)](https://learn.microsoft.com/en-us/visualstudio/releases/2022/redistribution#vs2022-download) | ||||||
| #### 2. Clone Repository | #### 2. Clone Repository | ||||||
|     https://github.com/hacksider/roop-cam.git |     https://github.com/hacksider/Deep-Live-Cam.git | ||||||
| 
 | 
 | ||||||
| #### 3. Install dependency | #### 3. Download Models | ||||||
|  | [GFPGANv1.4](https://huggingface.co/hacksider/deep-live-cam/resolve/main/GFPGANv1.4.pth) | ||||||
|  | [inswapper_128.onnx](https://huggingface.co/hacksider/deep-live-cam/resolve/main/inswapper_128.onnx) | ||||||
|  | 
 | ||||||
|  | #### 4. Install dependency | ||||||
| We highly recommend working in a `venv` to avoid issues. | We highly recommend working in a `venv` to avoid issues. | ||||||
| ``` | ``` | ||||||
| pip install -r requirements.txt | pip install -r requirements.txt | ||||||
|  | @ -146,7 +133,7 @@ Just follow the clicks on the screenshot | ||||||
| 2. Click live | 2. Click live | ||||||
| 3. Wait for a few seconds (it can take a while, usually 10 to 30 seconds, before the preview shows up) | 3. Wait for a few seconds (it can take a while, usually 10 to 30 seconds, before the preview shows up) | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
| 
 | 
 | ||||||
| Just use your favorite screen-capture tool, such as OBS, to stream | Just use your favorite screen-capture tool, such as OBS, to stream | ||||||
| > Note: In case you want to change your face, just select another picture; the preview mode will then restart (so just wait a bit). | > Note: In case you want to change your face, just select another picture; the preview mode will then restart (so just wait a bit). | ||||||
|  |  | ||||||
								
									
									
										
											
												BIN
											
										
									
									demo.gif
									
									
									
									
								
								
							
							
										
											
												BIN
											
										
									
									demo.gif
									
									
									
									
								
											
												Binary file not shown.
											
										
									
								| Before Width: | Height: | Size: 6.2 MiB After Width: | Height: | Size: 1.1 MiB | 
|  | @ -1,283 +0,0 @@ | ||||||
| import os |  | ||||||
| import webbrowser |  | ||||||
| import customtkinter as ctk |  | ||||||
| from typing import Callable, Tuple |  | ||||||
| import cv2 |  | ||||||
| from PIL import Image, ImageOps |  | ||||||
| 
 |  | ||||||
| import roop.globals |  | ||||||
| import roop.metadata |  | ||||||
| from roop.face_analyser import get_one_face |  | ||||||
| from roop.capturer import get_video_frame, get_video_frame_total |  | ||||||
| from roop.predicter import predict_frame |  | ||||||
| from roop.processors.frame.core import get_frame_processors_modules |  | ||||||
| from roop.utilities import is_image, is_video, resolve_relative_path |  | ||||||
| 
 |  | ||||||
| import cv2 |  | ||||||
| 
 |  | ||||||
| ROOT = None |  | ||||||
| ROOT_HEIGHT = 700 |  | ||||||
| ROOT_WIDTH = 600 |  | ||||||
| 
 |  | ||||||
| PREVIEW = None |  | ||||||
| PREVIEW_MAX_HEIGHT = 700 |  | ||||||
| PREVIEW_MAX_WIDTH = 1200 |  | ||||||
| 
 |  | ||||||
| RECENT_DIRECTORY_SOURCE = None |  | ||||||
| RECENT_DIRECTORY_TARGET = None |  | ||||||
| RECENT_DIRECTORY_OUTPUT = None |  | ||||||
| 
 |  | ||||||
| preview_label = None |  | ||||||
| preview_slider = None |  | ||||||
| source_label = None |  | ||||||
| target_label = None |  | ||||||
| status_label = None |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def init(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.CTk: |  | ||||||
|     global ROOT, PREVIEW |  | ||||||
| 
 |  | ||||||
|     ROOT = create_root(start, destroy) |  | ||||||
|     PREVIEW = create_preview(ROOT) |  | ||||||
| 
 |  | ||||||
|     return ROOT |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def create_root(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.CTk: |  | ||||||
|     global source_label, target_label, status_label |  | ||||||
| 
 |  | ||||||
|     ctk.deactivate_automatic_dpi_awareness() |  | ||||||
|     ctk.set_appearance_mode('system') |  | ||||||
|     ctk.set_default_color_theme(resolve_relative_path('ui.json')) |  | ||||||
| 
 |  | ||||||
|     root = ctk.CTk() |  | ||||||
|     root.minsize(ROOT_WIDTH, ROOT_HEIGHT) |  | ||||||
|     root.title(f'{roop.metadata.name} {roop.metadata.version}') |  | ||||||
|     root.configure() |  | ||||||
|     root.protocol('WM_DELETE_WINDOW', lambda: destroy()) |  | ||||||
| 
 |  | ||||||
|     source_label = ctk.CTkLabel(root, text=None) |  | ||||||
|     source_label.place(relx=0.1, rely=0.1, relwidth=0.3, relheight=0.25) |  | ||||||
| 
 |  | ||||||
|     target_label = ctk.CTkLabel(root, text=None) |  | ||||||
|     target_label.place(relx=0.6, rely=0.1, relwidth=0.3, relheight=0.25) |  | ||||||
| 
 |  | ||||||
|     source_button = ctk.CTkButton(root, text='Select a face', cursor='hand2', command=lambda: select_source_path()) |  | ||||||
|     source_button.place(relx=0.1, rely=0.4, relwidth=0.3, relheight=0.1) |  | ||||||
| 
 |  | ||||||
|     target_button = ctk.CTkButton(root, text='Select a target', cursor='hand2', command=lambda: select_target_path()) |  | ||||||
|     target_button.place(relx=0.6, rely=0.4, relwidth=0.3, relheight=0.1) |  | ||||||
| 
 |  | ||||||
|     keep_fps_value = ctk.BooleanVar(value=roop.globals.keep_fps) |  | ||||||
|     keep_fps_checkbox = ctk.CTkSwitch(root, text='Keep fps', variable=keep_fps_value, cursor='hand2', command=lambda: setattr(roop.globals, 'keep_fps', not roop.globals.keep_fps)) |  | ||||||
|     keep_fps_checkbox.place(relx=0.1, rely=0.6) |  | ||||||
| 
 |  | ||||||
|     keep_frames_value = ctk.BooleanVar(value=roop.globals.keep_frames) |  | ||||||
|     keep_frames_switch = ctk.CTkSwitch(root, text='Keep frames', variable=keep_frames_value, cursor='hand2', command=lambda: setattr(roop.globals, 'keep_frames', keep_frames_value.get())) |  | ||||||
|     keep_frames_switch.place(relx=0.1, rely=0.65) |  | ||||||
| 
 |  | ||||||
|     keep_audio_value = ctk.BooleanVar(value=roop.globals.keep_audio) |  | ||||||
|     keep_audio_switch = ctk.CTkSwitch(root, text='Keep audio', variable=keep_audio_value, cursor='hand2', command=lambda: setattr(roop.globals, 'keep_audio', keep_audio_value.get())) |  | ||||||
|     keep_audio_switch.place(relx=0.6, rely=0.6) |  | ||||||
| 
 |  | ||||||
|     many_faces_value = ctk.BooleanVar(value=roop.globals.many_faces) |  | ||||||
|     many_faces_switch = ctk.CTkSwitch(root, text='Many faces', variable=many_faces_value, cursor='hand2', command=lambda: setattr(roop.globals, 'many_faces', many_faces_value.get())) |  | ||||||
|     many_faces_switch.place(relx=0.6, rely=0.65) |  | ||||||
| 
 |  | ||||||
|     start_button = ctk.CTkButton(root, text='Start', cursor='hand2', command=lambda: select_output_path(start)) |  | ||||||
|     start_button.place(relx=0.15, rely=0.75, relwidth=0.2, relheight=0.05) |  | ||||||
| 
 |  | ||||||
|     stop_button = ctk.CTkButton(root, text='Destroy', cursor='hand2', command=lambda: destroy()) |  | ||||||
|     stop_button.place(relx=0.4, rely=0.75, relwidth=0.2, relheight=0.05) |  | ||||||
| 
 |  | ||||||
|     preview_button = ctk.CTkButton(root, text='Preview', cursor='hand2', command=lambda: toggle_preview()) |  | ||||||
|     preview_button.place(relx=0.65, rely=0.75, relwidth=0.2, relheight=0.05) |  | ||||||
|      |  | ||||||
|     live_button = ctk.CTkButton(root, text='Live', cursor='hand2', command=lambda: webcam_preview()) |  | ||||||
|     live_button.place(relx=0.40, rely=0.83, relwidth=0.2, relheight=0.05) |  | ||||||
| 
 |  | ||||||
|     status_label = ctk.CTkLabel(root, text=None, justify='center') |  | ||||||
|     status_label.place(relx=0.1, rely=0.9, relwidth=0.8) |  | ||||||
| 
 |  | ||||||
|     donate_label = ctk.CTkLabel(root, text='Send some love!', justify='center', cursor='hand2') |  | ||||||
|     donate_label.place(relx=0.1, rely=0.95, relwidth=0.8) |  | ||||||
|     donate_label.configure(text_color=ctk.ThemeManager.theme.get('RoopDonate').get('text_color')) |  | ||||||
|     donate_label.bind('<Button>', lambda event: webbrowser.open('https://paypal.me/hacksider')) |  | ||||||
| 
 |  | ||||||
|     return root |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def create_preview(parent: ctk.CTkToplevel) -> ctk.CTkToplevel: |  | ||||||
|     global preview_label, preview_slider |  | ||||||
| 
 |  | ||||||
|     preview = ctk.CTkToplevel(parent) |  | ||||||
|     preview.withdraw() |  | ||||||
|     preview.title('Preview') |  | ||||||
|     preview.configure() |  | ||||||
|     preview.protocol('WM_DELETE_WINDOW', lambda: toggle_preview()) |  | ||||||
|     preview.resizable(width=False, height=False) |  | ||||||
| 
 |  | ||||||
|     preview_label = ctk.CTkLabel(preview, text=None) |  | ||||||
|     preview_label.pack(fill='both', expand=True) |  | ||||||
| 
 |  | ||||||
|     preview_slider = ctk.CTkSlider(preview, from_=0, to=0, command=lambda frame_value: update_preview(frame_value)) |  | ||||||
| 
 |  | ||||||
|     return preview |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def update_status(text: str) -> None: |  | ||||||
|     status_label.configure(text=text) |  | ||||||
|     ROOT.update() |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def select_source_path() -> None: |  | ||||||
|     global RECENT_DIRECTORY_SOURCE |  | ||||||
| 
 |  | ||||||
|     PREVIEW.withdraw() |  | ||||||
|     source_path = ctk.filedialog.askopenfilename(title='select an source image', initialdir=RECENT_DIRECTORY_SOURCE) |  | ||||||
|     if is_image(source_path): |  | ||||||
|         roop.globals.source_path = source_path |  | ||||||
|         RECENT_DIRECTORY_SOURCE = os.path.dirname(roop.globals.source_path) |  | ||||||
|         image = render_image_preview(roop.globals.source_path, (200, 200)) |  | ||||||
|         source_label.configure(image=image) |  | ||||||
|     else: |  | ||||||
|         roop.globals.source_path = None |  | ||||||
|         source_label.configure(image=None) |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def select_target_path() -> None: |  | ||||||
|     global RECENT_DIRECTORY_TARGET |  | ||||||
| 
 |  | ||||||
|     PREVIEW.withdraw() |  | ||||||
|     target_path = ctk.filedialog.askopenfilename(title='select an target image or video', initialdir=RECENT_DIRECTORY_TARGET) |  | ||||||
|     if is_image(target_path): |  | ||||||
|         roop.globals.target_path = target_path |  | ||||||
|         RECENT_DIRECTORY_TARGET = os.path.dirname(roop.globals.target_path) |  | ||||||
|         image = render_image_preview(roop.globals.target_path, (200, 200)) |  | ||||||
|         target_label.configure(image=image) |  | ||||||
|     elif is_video(target_path): |  | ||||||
|         roop.globals.target_path = target_path |  | ||||||
|         RECENT_DIRECTORY_TARGET = os.path.dirname(roop.globals.target_path) |  | ||||||
|         video_frame = render_video_preview(target_path, (200, 200)) |  | ||||||
|         target_label.configure(image=video_frame) |  | ||||||
|     else: |  | ||||||
|         roop.globals.target_path = None |  | ||||||
|         target_label.configure(image=None) |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def select_output_path(start: Callable[[], None]) -> None: |  | ||||||
|     global RECENT_DIRECTORY_OUTPUT |  | ||||||
| 
 |  | ||||||
|     if is_image(roop.globals.target_path): |  | ||||||
|         output_path = ctk.filedialog.asksaveasfilename(title='save image output file', defaultextension='.png', initialfile='output.png', initialdir=RECENT_DIRECTORY_OUTPUT) |  | ||||||
|     elif is_video(roop.globals.target_path): |  | ||||||
|         output_path = ctk.filedialog.asksaveasfilename(title='save video output file', defaultextension='.mp4', initialfile='output.mp4', initialdir=RECENT_DIRECTORY_OUTPUT) |  | ||||||
|     else: |  | ||||||
|         output_path = None |  | ||||||
|     if output_path: |  | ||||||
|         roop.globals.output_path = output_path |  | ||||||
|         RECENT_DIRECTORY_OUTPUT = os.path.dirname(roop.globals.output_path) |  | ||||||
|         start() |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def render_image_preview(image_path: str, size: Tuple[int, int]) -> ctk.CTkImage: |  | ||||||
|     image = Image.open(image_path) |  | ||||||
|     if size: |  | ||||||
|         image = ImageOps.fit(image, size, Image.LANCZOS) |  | ||||||
|     return ctk.CTkImage(image, size=image.size) |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def render_video_preview(video_path: str, size: Tuple[int, int], frame_number: int = 0) -> ctk.CTkImage: |  | ||||||
|     capture = cv2.VideoCapture(video_path) |  | ||||||
|     if frame_number: |  | ||||||
|         capture.set(cv2.CAP_PROP_POS_FRAMES, frame_number) |  | ||||||
|     has_frame, frame = capture.read() |  | ||||||
|     if has_frame: |  | ||||||
|         image = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)) |  | ||||||
|         if size: |  | ||||||
|             image = ImageOps.fit(image, size, Image.LANCZOS) |  | ||||||
|         return ctk.CTkImage(image, size=image.size) |  | ||||||
|     capture.release() |  | ||||||
|     cv2.destroyAllWindows() |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def toggle_preview() -> None: |  | ||||||
|     if PREVIEW.state() == 'normal': |  | ||||||
|         PREVIEW.withdraw() |  | ||||||
|     elif roop.globals.source_path and roop.globals.target_path: |  | ||||||
|         init_preview() |  | ||||||
|         update_preview() |  | ||||||
|         PREVIEW.deiconify() |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def init_preview() -> None: |  | ||||||
|     if is_image(roop.globals.target_path): |  | ||||||
|         preview_slider.pack_forget() |  | ||||||
|     if is_video(roop.globals.target_path): |  | ||||||
|         video_frame_total = get_video_frame_total(roop.globals.target_path) |  | ||||||
|         preview_slider.configure(to=video_frame_total) |  | ||||||
|         preview_slider.pack(fill='x') |  | ||||||
|         preview_slider.set(0) |  | ||||||
| 
 |  | ||||||
| 
 |  | ||||||
| def update_preview(frame_number: int = 0) -> None: |  | ||||||
|     if roop.globals.source_path and roop.globals.target_path: |  | ||||||
|         temp_frame = get_video_frame(roop.globals.target_path, frame_number) |  | ||||||
|         if predict_frame(temp_frame): |  | ||||||
|             quit() |  | ||||||
|         for frame_processor in get_frame_processors_modules(roop.globals.frame_processors): |  | ||||||
|             temp_frame = frame_processor.process_frame( |  | ||||||
|                 get_one_face(cv2.imread(roop.globals.source_path)), |  | ||||||
|                 temp_frame |  | ||||||
|             ) |  | ||||||
|         image = Image.fromarray(cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB)) |  | ||||||
|         image = ImageOps.contain(image, (PREVIEW_MAX_WIDTH, PREVIEW_MAX_HEIGHT), Image.LANCZOS) |  | ||||||
|         image = ctk.CTkImage(image, size=image.size) |  | ||||||
|         preview_label.configure(image=image) |  | ||||||
|          |  | ||||||
| 
 |  | ||||||
| def webcam_preview(): |  | ||||||
|     if roop.globals.source_path is None: |  | ||||||
|         # No image selected |  | ||||||
|         return |  | ||||||
|      |  | ||||||
|     global preview_label, PREVIEW |  | ||||||
| 
 |  | ||||||
|     cap = cv2.VideoCapture(0)  # Use index for the webcam (adjust the index accordingly if necessary)     |  | ||||||
|     cap.set(cv2.CAP_PROP_FRAME_WIDTH, 1280)  # Set the width of the resolution |  | ||||||
|     cap.set(cv2.CAP_PROP_FRAME_HEIGHT, 720)  # Set the height of the resolution |  | ||||||
|     cap.set(cv2.CAP_PROP_FPS, 60)  # Set the frame rate of the webcam |  | ||||||
|     PREVIEW_MAX_HEIGHT = 720 |  | ||||||
|     PREVIEW_MAX_WIDTH = 1280 |  | ||||||
| 
 |  | ||||||
|     preview_label.configure(image=None)  # Reset the preview image before startup |  | ||||||
| 
 |  | ||||||
|     PREVIEW.deiconify()  # Open preview window |  | ||||||
| 
 |  | ||||||
|     frame_processors = get_frame_processors_modules(roop.globals.frame_processors) |  | ||||||
| 
 |  | ||||||
|     source_image = None  # Initialize variable for the selected face image |  | ||||||
| 
 |  | ||||||
|     while True: |  | ||||||
|         ret, frame = cap.read() |  | ||||||
|         if not ret: |  | ||||||
|             break |  | ||||||
| 
 |  | ||||||
|         # Select and save face image only once |  | ||||||
|         if source_image is None and roop.globals.source_path: |  | ||||||
|             source_image = get_one_face(cv2.imread(roop.globals.source_path)) |  | ||||||
| 
 |  | ||||||
|         temp_frame = frame.copy()  #Create a copy of the frame |  | ||||||
| 
 |  | ||||||
|         for frame_processor in frame_processors: |  | ||||||
|             temp_frame = frame_processor.process_frame(source_image, temp_frame) |  | ||||||
| 
 |  | ||||||
|         image = cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB)  # Convert the image to RGB format to display it with Tkinter |  | ||||||
|         image = Image.fromarray(image) |  | ||||||
|         image = ImageOps.contain(image, (PREVIEW_MAX_WIDTH, PREVIEW_MAX_HEIGHT), Image.LANCZOS) |  | ||||||
|         image = ctk.CTkImage(image, size=image.size) |  | ||||||
|         preview_label.configure(image=image) |  | ||||||
|         ROOT.update() |  | ||||||
| 
 |  | ||||||
|     cap.release() |  | ||||||
|     PREVIEW.withdraw()  # Close preview window when loop is finished |  | ||||||
|  | @ -107,10 +107,10 @@ def create_root(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.C | ||||||
|     status_label = ctk.CTkLabel(root, text=None, justify='center') |     status_label = ctk.CTkLabel(root, text=None, justify='center') | ||||||
|     status_label.place(relx=0.1, rely=0.9, relwidth=0.8) |     status_label.place(relx=0.1, rely=0.9, relwidth=0.8) | ||||||
| 
 | 
 | ||||||
|     donate_label = ctk.CTkLabel(root, text='Gourieff GitHub', justify='center', cursor='hand2') |     donate_label = ctk.CTkLabel(root, text='Deep Live Cam', justify='center', cursor='hand2') | ||||||
|     donate_label.place(relx=0.1, rely=0.95, relwidth=0.8) |     donate_label.place(relx=0.1, rely=0.95, relwidth=0.8) | ||||||
|     donate_label.configure(text_color=ctk.ThemeManager.theme.get('URL').get('text_color')) |     donate_label.configure(text_color=ctk.ThemeManager.theme.get('URL').get('text_color')) | ||||||
|     donate_label.bind('<Button>', lambda event: webbrowser.open('https://github.com/Gourieff')) |     donate_label.bind('<Button>', lambda event: webbrowser.open('https://paypal.me/hacksider')) | ||||||
| 
 | 
 | ||||||
|     return root |     return root | ||||||
| 
 | 
 | ||||||
|  |  | ||||||
								
									
									
										
											
												BIN
											
										
									
									roop-cam.gif
									
									
									
									
								
								
							
							
										
											
												BIN
											
										
									
									roop-cam.gif
									
									
									
									
								
											
												Binary file not shown.
											
										
									
								| Before Width: | Height: | Size: 1.1 MiB | 
		Loading…
	
		Reference in New Issue