Merge pull request #329 from bit-wrangler/experimental

Added virtual camera output and fetching of input camera devices with names using pygrabber on windows and linux
2024-08-16 00:58:50 +08:00 · 2024-08-16 00:58:50 +08:00 · ac8feff652
parent 137ac597ef a90c4facc5
commit ac8feff652
3 changed files with 96 additions and 54 deletions
--- a/README.md
+++ b/README.md
@ -142,6 +142,7 @@ Just follow the clicks on the screenshot
 Just use your favorite screencapture to stream like OBS
 > Note: In case you want to change your face, just select another picture, the preview mode will then restart (so just wait a bit).
 You can now use the virtual camera output (uses pyvirtualcam) by turning on the `Virtual Cam Output (OBS)` toggle which should output to the OBS Virtual Camera. Note: this may not work on macOS. You will get a preview as before, but now you will also have a virtual camera output which can be used in applications like Zoom.
 Additional command line arguments are given below. To learn out what they do, check [this guide](https://github.com/s0md3v/roop/wiki/Advanced-Options).
--- a/modules/ui.py
+++ b/modules/ui.py
@ -2,9 +2,12 @@ import os
 import platform
 import webbrowser
 import customtkinter as ctk
-from typing import Callable, Tuple
+from typing import Callable, Tuple, List, Any
 from types import ModuleType
 import cv2
 from PIL import Image, ImageOps
 from pygrabber.dshow_graph import FilterGraph
 import pyvirtualcam
 # Import OS-specific modules only when necessary
 if platform.system() == 'Darwin':  # macOS
@ -20,7 +23,7 @@ from modules.processors.frame.core import get_frame_processors_modules
 from modules.utilities import is_image, is_video, resolve_relative_path
 ROOT = None
-ROOT_HEIGHT = 700
+ROOT_HEIGHT = 800
 ROOT_WIDTH = 600
 PREVIEW = None
@ -105,65 +108,69 @@ def create_root(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.C
    root.protocol('WM_DELETE_WINDOW', lambda: destroy())
    source_label = ctk.CTkLabel(root, text=None)
-    source_label.place(relx=0.1, rely=0.1, relwidth=0.3, relheight=0.25)
+    source_label.place(relx=0.1, rely=0.0875, relwidth=0.3, relheight=0.25)
    target_label = ctk.CTkLabel(root, text=None)
-    target_label.place(relx=0.6, rely=0.1, relwidth=0.3, relheight=0.25)
+    target_label.place(relx=0.6, rely=0.0875, relwidth=0.3, relheight=0.25)
    source_button = ctk.CTkButton(root, text='Select a face', cursor='hand2', command=select_source_path)
-    source_button.place(relx=0.1, rely=0.4, relwidth=0.3, relheight=0.1)
+    source_button.place(relx=0.1, rely=0.35, relwidth=0.3, relheight=0.1)
    target_button = ctk.CTkButton(root, text='Select a target', cursor='hand2', command=select_target_path)
-    target_button.place(relx=0.6, rely=0.4, relwidth=0.3, relheight=0.1)
+    target_button.place(relx=0.6, rely=0.35, relwidth=0.3, relheight=0.1)
    keep_fps_value = ctk.BooleanVar(value=modules.globals.keep_fps)
    keep_fps_checkbox = ctk.CTkSwitch(root, text='Keep fps', variable=keep_fps_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_fps', not modules.globals.keep_fps))
-    keep_fps_checkbox.place(relx=0.1, rely=0.6)
+    keep_fps_checkbox.place(relx=0.1, rely=0.525)
    keep_frames_value = ctk.BooleanVar(value=modules.globals.keep_frames)
    keep_frames_switch = ctk.CTkSwitch(root, text='Keep frames', variable=keep_frames_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_frames', keep_frames_value.get()))
-    keep_frames_switch.place(relx=0.1, rely=0.65)
+    keep_frames_switch.place(relx=0.1, rely=0.56875)
    enhancer_value = ctk.BooleanVar(value=modules.globals.fp_ui['face_enhancer'])
    enhancer_switch = ctk.CTkSwitch(root, text='Face Enhancer', variable=enhancer_value, cursor='hand2', command=lambda: update_tumbler('face_enhancer', enhancer_value.get()))
-    enhancer_switch.place(relx=0.1, rely=0.7)
+    enhancer_switch.place(relx=0.1, rely=0.6125)
    keep_audio_value = ctk.BooleanVar(value=modules.globals.keep_audio)
    keep_audio_switch = ctk.CTkSwitch(root, text='Keep audio', variable=keep_audio_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_audio', keep_audio_value.get()))
-    keep_audio_switch.place(relx=0.6, rely=0.6)
+    keep_audio_switch.place(relx=0.6, rely=0.525)
    many_faces_value = ctk.BooleanVar(value=modules.globals.many_faces)
    many_faces_switch = ctk.CTkSwitch(root, text='Many faces', variable=many_faces_value, cursor='hand2', command=lambda: setattr(modules.globals, 'many_faces', many_faces_value.get()))
-    many_faces_switch.place(relx=0.6, rely=0.65)
+    many_faces_switch.place(relx=0.6, rely=0.56875)
    nsfw_value = ctk.BooleanVar(value=modules.globals.nsfw)
    nsfw_switch = ctk.CTkSwitch(root, text='NSFW', variable=nsfw_value, cursor='hand2', command=lambda: setattr(modules.globals, 'nsfw', nsfw_value.get()))
-    nsfw_switch.place(relx=0.6, rely=0.7)
+    nsfw_switch.place(relx=0.6, rely=0.6125)
    start_button = ctk.CTkButton(root, text='Start', cursor='hand2', command=lambda: select_output_path(start))
-    start_button.place(relx=0.15, rely=0.8, relwidth=0.2, relheight=0.05)
+    start_button.place(relx=0.15, rely=0.7, relwidth=0.2, relheight=0.05)
    stop_button = ctk.CTkButton(root, text='Destroy', cursor='hand2', command=destroy)
-    stop_button.place(relx=0.4, rely=0.8, relwidth=0.2, relheight=0.05)
+    stop_button.place(relx=0.4, rely=0.7, relwidth=0.2, relheight=0.05)
    preview_button = ctk.CTkButton(root, text='Preview', cursor='hand2', command=toggle_preview)
-    preview_button.place(relx=0.65, rely=0.8, relwidth=0.2, relheight=0.05)
+    preview_button.place(relx=0.65, rely=0.7, relwidth=0.2, relheight=0.05)
    camera_label = ctk.CTkLabel(root, text="Select Camera:")
-    camera_label.place(relx=0.4, rely=0.86, relwidth=0.2, relheight=0.05)
+    camera_label.place(relx=0.4, rely=0.7525, relwidth=0.2, relheight=0.05)
    available_cameras = get_available_cameras()
    available_camera_strings = [str(cam) for cam in available_cameras]
    camera_variable = ctk.StringVar(value=available_camera_strings[0] if available_camera_strings else "No cameras found")
    camera_optionmenu = ctk.CTkOptionMenu(root, variable=camera_variable, values=available_camera_strings)
-    camera_optionmenu.place(relx=0.65, rely=0.86, relwidth=0.2, relheight=0.05)
+    camera_optionmenu.place(relx=0.65, rely=0.7525, relwidth=0.2, relheight=0.05)
-    live_button = ctk.CTkButton(root, text='Live', cursor='hand2', command=lambda: webcam_preview(camera_variable.get()))
+    virtual_cam_out_value = ctk.BooleanVar(value=False)
-    live_button.place(relx=0.15, rely=0.86, relwidth=0.2, relheight=0.05)
+    virtual_cam_out_switch = ctk.CTkSwitch(root, text='Virtual Cam Output (OBS)', variable=virtual_cam_out_value, cursor='hand2')
    virtual_cam_out_switch.place(relx=0.4, rely=0.805)
    live_button = ctk.CTkButton(root, text='Live', cursor='hand2', command=lambda: webcam_preview(camera_variable.get(), virtual_cam_out_value.get()))
    live_button.place(relx=0.15, rely=0.7525, relwidth=0.2, relheight=0.05)
    status_label = ctk.CTkLabel(root, text=None, justify='center')
-    status_label.place(relx=0.1, relwidth=0.8, rely=0.9)
+    status_label.place(relx=0.1, relwidth=0.8, rely=0.875)
    donate_label = ctk.CTkLabel(root, text='Deep Live Cam', justify='center', cursor='hand2')
    donate_label.place(relx=0.1, rely=0.95, relwidth=0.8)
@ -311,6 +318,38 @@ def update_preview(frame_number: int = 0) -> None:
        image = ctk.CTkImage(image, size=image.size)
        preview_label.configure(image=image)
 def webcam_preview_loop(camera: cv2.VideoCapture, source_image: Any, frame_processors: List[ModuleType], virtual_cam: pyvirtualcam.Camera = None) -> bool:
    global preview_label, PREVIEW
    ret, frame = camera.read()
    if not ret:
        update_status(f"Error: Frame not received from camera.")
        return False
    temp_frame = frame.copy()
    if modules.globals.live_mirror:
        temp_frame = cv2.flip(temp_frame, 1) # horizontal flipping
    if modules.globals.live_resizable:
        temp_frame = fit_image_to_size(temp_frame, PREVIEW.winfo_width(), PREVIEW.winfo_height())
    for frame_processor in frame_processors:
        temp_frame = frame_processor.process_frame(source_image, temp_frame)
    image = Image.fromarray(cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB))
    image = ImageOps.contain(image, (temp_frame.shape[1], temp_frame.shape[0]), Image.LANCZOS)
    image = ctk.CTkImage(image, size=image.size)
    preview_label.configure(image=image)
    if virtual_cam:
        virtual_cam.send(temp_frame)
        virtual_cam.sleep_until_next_frame()
    ROOT.update()
    if PREVIEW.state() == 'withdrawn':
        return False
    return True
 def fit_image_to_size(image, width: int, height: int):
    if width is None and height is None:
@ -326,12 +365,16 @@ def fit_image_to_size(image, width: int, height: int):
    new_size = (int(ratio * w), int(ratio * h))
    return cv2.resize(image, dsize=new_size)
-def webcam_preview(camera_name: str):
+def webcam_preview(camera_name: str, virtual_cam_output: bool):
    if modules.globals.source_path is None:
        return
    global preview_label, PREVIEW
    WIDTH = 960
    HEIGHT = 540
    FPS = 60
    # Select the camera by its name
    selected_camera = select_camera(camera_name)
    if selected_camera is None:
@ -348,9 +391,12 @@ def webcam_preview(camera_name: str):
        update_status(f"Error: Could not open camera {camera_name}")
        return
-    camera.set(cv2.CAP_PROP_FRAME_WIDTH, 960)
+    camera.set(cv2.CAP_PROP_FRAME_WIDTH, WIDTH)
-    camera.set(cv2.CAP_PROP_FRAME_HEIGHT, 540)
+    camera.set(cv2.CAP_PROP_FRAME_HEIGHT, HEIGHT)
-    camera.set(cv2.CAP_PROP_FPS, 60)
+    camera.set(cv2.CAP_PROP_FPS, FPS)
    PREVIEW_MAX_WIDTH = WIDTH
    PREVIEW_MAX_HEIGHT = HEIGHT
    preview_label.configure(width=PREVIEW_DEFAULT_WIDTH, height=PREVIEW_DEFAULT_HEIGHT)
    PREVIEW.deiconify()
@ -358,28 +404,15 @@ def webcam_preview(camera_name: str):
    frame_processors = get_frame_processors_modules(modules.globals.frame_processors)
    source_image = get_one_face(cv2.imread(modules.globals.source_path))
-    while camera:
+    preview_running = True
        ret, frame = camera.read()
        if not ret:
            update_status(f"Error: Frame not received from camera.")
            break
-        temp_frame = frame.copy()
+    if virtual_cam_output:
        with pyvirtualcam.Camera(width=WIDTH, height=HEIGHT, fps=FPS, fmt=pyvirtualcam.PixelFormat.BGR) as virtual_cam:
            while preview_running:
                preview_running = webcam_preview_loop(camera, source_image, frame_processors, virtual_cam)
-        if modules.globals.live_mirror:
+    while preview_running:
-            temp_frame = cv2.flip(temp_frame, 1) # horizontal flipping
+        preview_running = webcam_preview_loop(camera, source_image, frame_processors)
        if modules.globals.live_resizable:
            temp_frame = fit_image_to_size(temp_frame, PREVIEW.winfo_width(), PREVIEW.winfo_height())
        for frame_processor in frame_processors:
            temp_frame = frame_processor.process_frame(source_image, temp_frame)
        image = Image.fromarray(cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB))
        image = ImageOps.contain(image, (temp_frame.shape[1], temp_frame.shape[0]), Image.LANCZOS)
        image = ctk.CTkImage(image, size=image.size)
        preview_label.configure(image=image)
        ROOT.update()
    if camera: camera.release()
    PREVIEW.withdraw()
@ -414,13 +447,19 @@ def get_available_cameras():
            elif device.deviceType() == "AVCaptureDeviceTypeContinuityCamera":
                print(f"Skipping Continuity Camera: {device.localizedName()}")
    elif platform.system() == 'Windows' or platform.system() == 'Linux':
        try:  
            devices = FilterGraph().get_input_devices()  
        except Exception as e:  
            # Use OpenCV to detect camera indexes
            index = 0
            devices = [] 
            while True:
                cap = cv2.VideoCapture(index)
                if not cap.isOpened():
                    break
-            available_cameras.append(f"Camera {index}")
+                devices.append(f"Camera {index}")
                cap.release()
                index += 1
        available_cameras = devices
    return available_cameras
--- a/requirements.txt
+++ b/requirements.txt
@ -22,3 +22,5 @@ protobuf==4.23.2
 tqdm==4.66.4
 gfpgan==1.3.8
 pyobjc==9.1; sys_platform == 'darwin'
 pygrabber==0.2
 pyvirtualcam==0.12.0