Deep-Live-Cam/modules/ui.py

491 lines
19 KiB
Python
Raw Normal View History

2023-09-24 21:36:57 +08:00
import os
import platform
2024-10-02 12:45:59 +08:00
import logging
2023-09-24 21:36:57 +08:00
import webbrowser
import customtkinter as ctk
2024-10-02 12:45:59 +08:00
from typing import Callable, Tuple, List, Any, Optional
from types import ModuleType
2023-09-24 21:36:57 +08:00
import cv2
from PIL import Image, ImageOps
import pyvirtualcam
# Import OS-specific modules only when necessary
if platform.system() == 'Darwin': # macOS
import AVFoundation
# Import Windows specific modules only when on windows platform
if platform.system() == 'Windows' or platform.system() == 'Linux': # Windows or Linux
from pygrabber.dshow_graph import FilterGraph
2023-09-24 21:36:57 +08:00
import modules.globals
import modules.metadata
from modules.face_analyser import get_one_face
2023-09-24 21:36:57 +08:00
from modules.capturer import get_video_frame, get_video_frame_total
from modules.processors.frame.core import get_frame_processors_modules
from modules.utilities import is_image, is_video, resolve_relative_path
2023-09-24 21:36:57 +08:00
ROOT = None
2024-09-25 20:06:50 +08:00
ROOT_HEIGHT = 800
ROOT_WIDTH = 600
2023-09-24 21:36:57 +08:00
PREVIEW = None
PREVIEW_MAX_HEIGHT = 700
PREVIEW_MAX_WIDTH = 1200
PREVIEW_DEFAULT_WIDTH = 960
PREVIEW_DEFAULT_HEIGHT = 540
2023-09-24 21:36:57 +08:00
RECENT_DIRECTORY_SOURCE = None
RECENT_DIRECTORY_TARGET = None
RECENT_DIRECTORY_OUTPUT = None
preview_label = None
preview_slider = None
source_label = None
target_label = None
status_label = None
img_ft, vid_ft = modules.globals.file_types
camera = None
def check_camera_permissions():
"""Check and request camera access permission on macOS."""
if platform.system() == 'Darwin': # macOS-specific
2024-10-02 05:08:53 +08:00
try:
result = subprocess.run(['tccutil', 'get', 'Camera', 'com.apple.Terminal'], capture_output=True, text=True)
if 'denied' in result.stdout.lower():
raise PermissionError("Camera access denied")
except subprocess.CalledProcessError:
raise RuntimeError("Failed to check camera permissions")
def select_camera(camera_name: str):
"""Select the appropriate camera based on its name (cross-platform)."""
if platform.system() == 'Darwin': # macOS-specific
devices = AVFoundation.AVCaptureDevice.devicesWithMediaType_(AVFoundation.AVMediaTypeVideo)
for device in devices:
if device.localizedName() == camera_name:
return device
elif platform.system() == 'Windows' or platform.system() == 'Linux':
# On Windows/Linux, simply return the camera name as OpenCV can handle it by index
return camera_name
return None
def init(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.CTk:
2023-09-24 21:36:57 +08:00
global ROOT, PREVIEW
if platform.system() == 'Darwin': # macOS-specific
check_camera_permissions() # Check camera permissions before initializing the UI
2023-09-24 21:36:57 +08:00
ROOT = create_root(start, destroy)
PREVIEW = create_preview(ROOT)
return ROOT
def create_root(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.CTk:
2023-09-24 21:36:57 +08:00
global source_label, target_label, status_label
ctk.deactivate_automatic_dpi_awareness()
ctk.set_appearance_mode('system')
ctk.set_default_color_theme(resolve_relative_path('ui.json'))
print("Creating root window...")
root = ctk.CTk()
root.minsize(ROOT_WIDTH, ROOT_HEIGHT)
root.title(f'{modules.metadata.name} {modules.metadata.version} {modules.metadata.edition}')
root.protocol('WM_DELETE_WINDOW', lambda: destroy())
source_label = ctk.CTkLabel(root, text=None)
source_label.place(relx=0.1, rely=0.0875, relwidth=0.3, relheight=0.25)
target_label = ctk.CTkLabel(root, text=None)
target_label.place(relx=0.6, rely=0.0875, relwidth=0.3, relheight=0.25)
source_button = ctk.CTkButton(root, text='Select a face', cursor='hand2', command=select_source_path)
source_button.place(relx=0.1, rely=0.35, relwidth=0.3, relheight=0.1)
swap_faces_button = ctk.CTkButton(root, text='', cursor='hand2', command=lambda: swap_faces_paths())
swap_faces_button.place(relx=0.45, rely=0.4, relwidth=0.1, relheight=0.1)
target_button = ctk.CTkButton(root, text='Select a target', cursor='hand2', command=select_target_path)
target_button.place(relx=0.6, rely=0.35, relwidth=0.3, relheight=0.1)
2023-09-24 21:36:57 +08:00
keep_fps_value = ctk.BooleanVar(value=modules.globals.keep_fps)
keep_fps_checkbox = ctk.CTkSwitch(root, text='Keep fps', variable=keep_fps_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_fps', not modules.globals.keep_fps))
keep_fps_checkbox.place(relx=0.1, rely=0.525)
2023-09-24 21:36:57 +08:00
keep_frames_value = ctk.BooleanVar(value=modules.globals.keep_frames)
keep_frames_switch = ctk.CTkSwitch(root, text='Keep frames', variable=keep_frames_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_frames', keep_frames_value.get()))
keep_frames_switch.place(relx=0.1, rely=0.56875)
enhancer_value = ctk.BooleanVar(value=modules.globals.fp_ui['face_enhancer'])
enhancer_switch = ctk.CTkSwitch(root, text='Face Enhancer', variable=enhancer_value, cursor='hand2', command=lambda: update_tumbler('face_enhancer', enhancer_value.get()))
enhancer_switch.place(relx=0.1, rely=0.6125)
2023-09-24 21:36:57 +08:00
keep_audio_value = ctk.BooleanVar(value=modules.globals.keep_audio)
keep_audio_switch = ctk.CTkSwitch(root, text='Keep audio', variable=keep_audio_value, cursor='hand2', command=lambda: setattr(modules.globals, 'keep_audio', keep_audio_value.get()))
keep_audio_switch.place(relx=0.6, rely=0.525)
2023-09-24 21:36:57 +08:00
many_faces_value = ctk.BooleanVar(value=modules.globals.many_faces)
many_faces_switch = ctk.CTkSwitch(root, text='Many faces', variable=many_faces_value, cursor='hand2', command=lambda: setattr(modules.globals, 'many_faces', many_faces_value.get()))
many_faces_switch.place(relx=0.6, rely=0.56875)
2023-09-24 21:36:57 +08:00
nsfw_value = ctk.BooleanVar(value=modules.globals.nsfw)
nsfw_switch = ctk.CTkSwitch(root, text='NSFW', variable=nsfw_value, cursor='hand2', command=lambda: setattr(modules.globals, 'nsfw', nsfw_value.get()))
nsfw_switch.place(relx=0.6, rely=0.6125)
2024-09-25 20:06:50 +08:00
start_button = ctk.CTkButton(root, text='Start', cursor='hand2', command=lambda: select_output_path(start))
start_button.place(relx=0.15, rely=0.7, relwidth=0.2, relheight=0.05)
stop_button = ctk.CTkButton(root, text='Destroy', cursor='hand2', command=destroy)
stop_button.place(relx=0.4, rely=0.7, relwidth=0.2, relheight=0.05)
preview_button = ctk.CTkButton(root, text='Preview', cursor='hand2', command=toggle_preview)
preview_button.place(relx=0.65, rely=0.7, relwidth=0.2, relheight=0.05)
2024-09-10 07:07:58 +08:00
camera_label = ctk.CTkLabel(root, text="Select Camera:")
camera_label.place(relx=0.4, rely=0.7525, relwidth=0.2, relheight=0.05)
available_cameras = get_available_cameras()
available_camera_strings = [str(cam) for cam in available_cameras]
camera_variable = ctk.StringVar(value=available_camera_strings[0] if available_camera_strings else "No cameras found")
camera_optionmenu = ctk.CTkOptionMenu(root, variable=camera_variable, values=available_camera_strings)
camera_optionmenu.place(relx=0.65, rely=0.7525, relwidth=0.2, relheight=0.05)
virtual_cam_out_value = ctk.BooleanVar(value=False)
virtual_cam_out_switch = ctk.CTkSwitch(root, text='Virtual Cam Output (OBS)', variable=virtual_cam_out_value, cursor='hand2')
virtual_cam_out_switch.place(relx=0.4, rely=0.805)
live_button = ctk.CTkButton(root, text='Live', cursor='hand2', command=lambda: webcam_preview(camera_variable.get(), virtual_cam_out_value.get()))
live_button.place(relx=0.15, rely=0.7525, relwidth=0.2, relheight=0.05)
2023-09-24 21:36:57 +08:00
status_label = ctk.CTkLabel(root, text=None, justify='center')
status_label.place(relx=0.1, relwidth=0.8, rely=0.875)
donate_label = ctk.CTkLabel(root, text='Deep Live Cam', justify='center', cursor='hand2')
donate_label.place(relx=0.1, rely=0.95, relwidth=0.8)
donate_label.configure(text_color=ctk.ThemeManager.theme.get('URL').get('text_color'))
donate_label.bind('<Button-1>', lambda event: webbrowser.open('https://paypal.me/hacksider'))
return root
def create_preview(parent: ctk.CTk) -> ctk.CTkToplevel:
2023-09-24 21:36:57 +08:00
global preview_label, preview_slider
preview = ctk.CTkToplevel(parent)
preview.withdraw()
preview.title('Preview')
preview.protocol('WM_DELETE_WINDOW', toggle_preview)
preview.resizable(width=True, height=True)
2023-09-24 21:36:57 +08:00
preview_label = ctk.CTkLabel(preview, text=None)
preview_label.pack(fill='both', expand=True)
preview_slider = ctk.CTkSlider(preview, from_=0, to=0, command=update_preview)
2023-09-24 21:36:57 +08:00
return preview
def update_status(text: str) -> None:
status_label.configure(text=text)
ROOT.update()
2024-09-25 20:06:50 +08:00
2023-09-24 21:36:57 +08:00
def update_tumbler(var: str, value: bool) -> None:
modules.globals.fp_ui[var] = value
def select_source_path() -> None:
global RECENT_DIRECTORY_SOURCE
2023-09-24 21:36:57 +08:00
PREVIEW.withdraw()
source_path = ctk.filedialog.askopenfilename(title='Select a source image', initialdir=RECENT_DIRECTORY_SOURCE, filetypes=[img_ft])
2023-09-24 21:36:57 +08:00
if is_image(source_path):
modules.globals.source_path = source_path
RECENT_DIRECTORY_SOURCE = os.path.dirname(modules.globals.source_path)
image = render_image_preview(modules.globals.source_path, (200, 200))
source_label.configure(image=image)
else:
modules.globals.source_path = None
source_label.configure(image=None)
def swap_faces_paths() -> None:
global RECENT_DIRECTORY_SOURCE, RECENT_DIRECTORY_TARGET
source_path = modules.globals.source_path
target_path = modules.globals.target_path
if not is_image(source_path) or not is_image(target_path):
return
modules.globals.source_path = target_path
modules.globals.target_path = source_path
RECENT_DIRECTORY_SOURCE = os.path.dirname(modules.globals.source_path)
RECENT_DIRECTORY_TARGET = os.path.dirname(modules.globals.target_path)
PREVIEW.withdraw()
source_image = render_image_preview(modules.globals.source_path, (200, 200))
source_label.configure(image=source_image)
target_image = render_image_preview(modules.globals.target_path, (200, 200))
target_label.configure(image=target_image)
2023-09-24 21:36:57 +08:00
def select_target_path() -> None:
global RECENT_DIRECTORY_TARGET
2023-09-24 21:36:57 +08:00
PREVIEW.withdraw()
target_path = ctk.filedialog.askopenfilename(title='Select a target image or video', initialdir=RECENT_DIRECTORY_TARGET, filetypes=[img_ft, vid_ft])
2023-09-24 21:36:57 +08:00
if is_image(target_path):
modules.globals.target_path = target_path
RECENT_DIRECTORY_TARGET = os.path.dirname(modules.globals.target_path)
image = render_image_preview(modules.globals.target_path, (200, 200))
target_label.configure(image=image)
elif is_video(target_path):
modules.globals.target_path = target_path
RECENT_DIRECTORY_TARGET = os.path.dirname(modules.globals.target_path)
video_frame = render_video_preview(target_path, (200, 200))
target_label.configure(image=video_frame)
else:
modules.globals.target_path = None
target_label.configure(image=None)
def select_output_path(start: Callable[[], None]) -> None:
global RECENT_DIRECTORY_OUTPUT
2023-09-24 21:36:57 +08:00
if is_image(modules.globals.target_path):
output_path = ctk.filedialog.asksaveasfilename(title='Save image output file', filetypes=[img_ft], defaultextension='.png', initialfile='output.png', initialdir=RECENT_DIRECTORY_OUTPUT)
2023-09-24 21:36:57 +08:00
elif is_video(modules.globals.target_path):
output_path = ctk.filedialog.asksaveasfilename(title='Save video output file', filetypes=[vid_ft], defaultextension='.mp4', initialfile='output.mp4', initialdir=RECENT_DIRECTORY_OUTPUT)
2023-09-24 21:36:57 +08:00
else:
output_path = None
if output_path:
modules.globals.output_path = output_path
RECENT_DIRECTORY_OUTPUT = os.path.dirname(modules.globals.output_path)
start()
def render_image_preview(image_path: str, size: Tuple[int, int]) -> ctk.CTkImage:
image = Image.open(image_path)
if size:
image = ImageOps.fit(image, size, Image.LANCZOS)
return ctk.CTkImage(image, size=image.size)
def render_video_preview(video_path: str, size: Tuple[int, int], frame_number: int = 0) -> ctk.CTkImage:
2023-09-24 21:36:57 +08:00
capture = cv2.VideoCapture(video_path)
if frame_number:
capture.set(cv2.CAP_PROP_POS_FRAMES, frame_number)
has_frame, frame = capture.read()
capture.release()
2023-09-24 21:36:57 +08:00
if has_frame:
image = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
if size:
image = ImageOps.fit(image, size, Image.LANCZOS)
return ctk.CTkImage(image, size=image.size)
return None
2023-09-24 21:36:57 +08:00
def toggle_preview() -> None:
if PREVIEW.state() == 'normal':
2023-09-24 21:36:57 +08:00
PREVIEW.withdraw()
elif modules.globals.source_path and modules.globals.target_path:
init_preview()
update_preview()
PREVIEW.deiconify()
global camera
if PREVIEW.state() == 'withdrawn':
if camera and camera.isOpened():
camera.release()
camera = None
2023-09-24 21:36:57 +08:00
def init_preview() -> None:
if is_image(modules.globals.target_path):
preview_slider.pack_forget()
elif is_video(modules.globals.target_path):
2023-09-24 21:36:57 +08:00
video_frame_total = get_video_frame_total(modules.globals.target_path)
preview_slider.configure(to=video_frame_total)
preview_slider.pack(fill='x')
2023-09-24 21:36:57 +08:00
preview_slider.set(0)
def update_preview(frame_number: int = 0) -> None:
if modules.globals.source_path and modules.globals.target_path:
temp_frame = get_video_frame(modules.globals.target_path, frame_number)
if not modules.globals.nsfw:
from modules.predicter import predict_frame
if predict_frame(temp_frame):
quit()
for frame_processor in get_frame_processors_modules(modules.globals.frame_processors):
2023-09-24 21:36:57 +08:00
temp_frame = frame_processor.process_frame(
get_one_face(cv2.imread(modules.globals.source_path)),
temp_frame
2023-09-24 21:36:57 +08:00
)
image = Image.fromarray(cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB))
image = ImageOps.contain(image, (PREVIEW_MAX_WIDTH, PREVIEW_MAX_HEIGHT), Image.LANCZOS)
2023-09-24 21:36:57 +08:00
image = ctk.CTkImage(image, size=image.size)
preview_label.configure(image=image)
2024-10-02 12:52:02 +08:00
def webcam_preview_loop(
camera: cv2.VideoCapture,
source_image: Any,
frame_processors: List[ModuleType],
virtual_cam: Optional[pyvirtualcam.Camera] = None
) -> bool:
2024-10-02 05:30:41 +08:00
try:
return _process_webcam_frames(camera, source_image, frame_processors, virtual_cam)
except Exception as e:
2024-10-02 12:52:02 +08:00
logging.error(f"Error in webcam preview: {str(e)}")
2024-10-02 05:30:41 +08:00
return False
2024-10-02 12:52:02 +08:00
def _process_webcam_frames(
camera: cv2.VideoCapture,
source_image: Any,
frame_processors: List[ModuleType],
virtual_cam: Optional[pyvirtualcam.Camera] = None
) -> bool:
while True:
ret, frame = camera.read()
if not ret:
logging.error("Failed to read frame from camera")
return False
# Apply any frame processors
for processor in frame_processors:
frame = processor.process(frame, source_image)
# Show frame preview
cv2.imshow('Webcam Preview', frame)
# Send frame to virtual camera if available
if virtual_cam:
virtual_cam.send(frame)
virtual_cam.sleep_until_next_frame()
# Break loop on key press
if cv2.waitKey(1) & 0xFF == ord('q'):
break
camera.release()
cv2.destroyAllWindows()
return True
def fit_image_to_size(image, width: int, height: int):
if width is None and height is None:
return image
h, w, _ = image.shape
ratio_h = 0.0
ratio_w = 0.0
if width > height:
ratio_h = height / h
else:
ratio_w = width / w
ratio = max(ratio_w, ratio_h)
new_size = (int(ratio * w), int(ratio * h))
return cv2.resize(image, dsize=new_size)
2024-10-02 12:45:59 +08:00
class WebcamHandler:
def __init__(self, camera_name: str, virtual_cam_output: bool):
self.camera_name = camera_name
self.virtual_cam_output = virtual_cam_output
self.camera = None
self.virtual_cam = None
self.preview_running = True
def setup_camera(self):
self.camera = cv2.VideoCapture(self.camera_name)
if not self.camera.isOpened():
logging.error(f"Cannot open camera: {self.camera_name}")
raise RuntimeError(f"Cannot open camera: {self.camera_name}")
if self.virtual_cam_output:
self.virtual_cam = pyvirtualcam.Camera(width=640, height=480, fps=30)
def process_frame(self, source_image: Any, frame_processors: List[ModuleType]):
ret, frame = self.camera.read()
if not ret:
logging.error("Failed to read frame from camera")
return None
# Apply any frame processors
for processor in frame_processors:
frame = processor.process(frame, source_image)
return frame
def handle_output(self, frame: Any):
# Show frame preview
cv2.imshow('Webcam Preview', frame)
# Send frame to virtual camera if available
if self.virtual_cam:
self.virtual_cam.send(frame)
self.virtual_cam.sleep_until_next_frame()
# Break loop on key press
if cv2.waitKey(1) & 0xFF == ord('q'):
self.preview_running = False
def run(self, source_image: Any, frame_processors: List[ModuleType]):
self.setup_camera()
while self.preview_running:
processed_frame = self.process_frame(source_image, frame_processors)
if processed_frame is not None:
self.handle_output(processed_frame)
self.cleanup()
def cleanup(self):
if self.camera:
self.camera.release()
if self.virtual_cam:
self.virtual_cam.close()
cv2.destroyAllWindows()
def webcam_preview(camera_name: str, virtual_cam_output: bool, source_image: Any, frame_processors: List[ModuleType]):
if source_image is None: # Assuming source_image is checked for validity here
return
2024-10-02 12:45:59 +08:00
handler = WebcamHandler(camera_name, virtual_cam_output)
handler.run(source_image, frame_processors)
2024-09-25 20:06:50 +08:00
def get_camera_index_by_name(camera_name: str) -> int:
"""Map camera name to index for OpenCV."""
if platform.system() == 'Darwin': # macOS-specific
if "FaceTime" in camera_name:
return 0 # Assuming FaceTime is at index 0
elif "iPhone" in camera_name:
return 1 # Assuming iPhone camera is at index 1
elif platform.system() == 'Windows' or platform.system() == 'Linux':
# Map camera name to index dynamically (OpenCV on these platforms usually starts with 0)
return get_available_cameras().index(camera_name)
return -1
def get_available_cameras():
"""Get available camera names (cross-platform)."""
available_cameras = []
2024-10-02 05:08:53 +08:00
if platform.system() == "Windows":
import wmi
c = wmi.WMI()
for camera in c.Win32_PnPEntity(PNPClass="Image"):
available_cameras.append(camera.Name)
elif platform.system() == "Darwin": # macOS
import subprocess
output = subprocess.check_output(["system_profiler", "SPCameraDataType"]).decode()
available_cameras = [line.split(":")[1].strip() for line in output.split("\n") if "Camera Name" in line]
else: # Linux and others
import glob
available_cameras = [f"/dev/video{i}" for i in range(10) if os.path.exists(f"/dev/video{i}")]
2024-10-02 12:33:08 +08:00
return available_cameras