677 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			Python
		
	
			
		
		
	
	
			677 lines
		
	
	
		
			25 KiB
		
	
	
	
		
			Python
		
	
| from typing import Any, List
 | |
| import cv2
 | |
| import insightface
 | |
| import threading
 | |
| import numpy as np
 | |
| import modules.globals
 | |
| import logging
 | |
| import modules.processors.frame.core
 | |
| from modules.core import update_status
 | |
| from modules.face_analyser import get_one_face, get_many_faces, default_source_face
 | |
| from modules.typing import Face, Frame
 | |
| from modules.utilities import (
 | |
|     conditional_download,
 | |
|     is_image,
 | |
|     is_video,
 | |
| )
 | |
| from modules.cluster_analysis import find_closest_centroid
 | |
| import os
 | |
| 
 | |
| FACE_SWAPPER = None
 | |
| THREAD_LOCK = threading.Lock()
 | |
| NAME = "DLC.FACE-SWAPPER"
 | |
| 
 | |
| 
 | |
| def _validate_kernel_size(kernel_tuple, default_kernel_tuple):
 | |
|     if isinstance(kernel_tuple, tuple) and len(kernel_tuple) == 2 and \
 | |
|        isinstance(kernel_tuple[0], int) and kernel_tuple[0] > 0 and kernel_tuple[0] % 2 == 1 and \
 | |
|        isinstance(kernel_tuple[1], int) and kernel_tuple[1] > 0 and kernel_tuple[1] % 2 == 1:
 | |
|         return kernel_tuple
 | |
|     else:
 | |
|         logging.warning(f"Invalid kernel size {kernel_tuple} received. Must be a tuple of two positive odd integers. Falling back to default {default_kernel_tuple}.")
 | |
|         return default_kernel_tuple
 | |
| 
 | |
| abs_dir = os.path.dirname(os.path.abspath(__file__))
 | |
| models_dir = os.path.join(
 | |
|     os.path.dirname(os.path.dirname(os.path.dirname(abs_dir))), "models"
 | |
| )
 | |
| 
 | |
| 
 | |
| def pre_check() -> bool:
 | |
|     download_directory_path = abs_dir
 | |
|     conditional_download(
 | |
|         download_directory_path,
 | |
|         [
 | |
|             "https://huggingface.co/hacksider/deep-live-cam/blob/main/inswapper_128.onnx"
 | |
|         ],
 | |
|     )
 | |
|     return True
 | |
| 
 | |
| 
 | |
| def pre_start() -> bool:
 | |
|     if not modules.globals.map_faces and not is_image(modules.globals.source_path):
 | |
|         update_status("Select an image for source path.", NAME)
 | |
|         return False
 | |
|     elif not modules.globals.map_faces and not get_one_face(
 | |
|         cv2.imread(modules.globals.source_path)
 | |
|     ):
 | |
|         update_status("No face in source path detected.", NAME)
 | |
|         return False
 | |
|     if not is_image(modules.globals.target_path) and not is_video(
 | |
|         modules.globals.target_path
 | |
|     ):
 | |
|         update_status("Select an image or video for target path.", NAME)
 | |
|         return False
 | |
|     return True
 | |
| 
 | |
| 
 | |
| def get_face_swapper() -> Any:
 | |
|     global FACE_SWAPPER
 | |
| 
 | |
|     with THREAD_LOCK:
 | |
|         if FACE_SWAPPER is None:
 | |
|             model_path = os.path.join(models_dir, "inswapper_128.onnx")
 | |
|             FACE_SWAPPER = insightface.model_zoo.get_model(
 | |
|                 model_path, providers=modules.globals.execution_providers
 | |
|             )
 | |
|     return FACE_SWAPPER
 | |
| 
 | |
| 
 | |
| def swap_face(source_face: Face, target_face: Face, temp_frame: Frame) -> Frame:
 | |
|     face_swapper = get_face_swapper()
 | |
| 
 | |
|     # Statistical color correction
 | |
|     if getattr(modules.globals, 'statistical_color_correction', True) and target_face.bbox is not None:
 | |
|         x1, y1, x2, y2 = target_face.bbox.astype(int)
 | |
|         original_target_face_roi = temp_frame[y1:y2, x1:x2].copy()
 | |
| 
 | |
|         # Apply the face swap
 | |
|         swapped_frame = face_swapper.get(
 | |
|             temp_frame, target_face, source_face, paste_back=True
 | |
|         )
 | |
| 
 | |
|         if original_target_face_roi.size > 0:
 | |
|             swapped_face_roi = swapped_frame[y1:y2, x1:x2].copy()
 | |
|             if swapped_face_roi.size > 0:
 | |
|                 try:
 | |
|                     corrected_swapped_face_roi = apply_color_transfer(swapped_face_roi, original_target_face_roi)
 | |
|                     swapped_frame[y1:y2, x1:x2] = corrected_swapped_face_roi
 | |
|                 except Exception as e:
 | |
|                     logging.error(f"Failed to apply statistical color transfer: {e}. Using original swapped ROI.")
 | |
|                     # swapped_frame already contains the uncorrected swapped_face_roi in this region
 | |
|     else:
 | |
|         # Apply the face swap without statistical color correction
 | |
|         swapped_frame = face_swapper.get(
 | |
|             temp_frame, target_face, source_face, paste_back=True
 | |
|         )
 | |
| 
 | |
|     if modules.globals.mouth_mask:
 | |
|         # Create a mask for the target face
 | |
|         face_mask = create_face_mask(target_face, swapped_frame) # Use swapped_frame here
 | |
| 
 | |
|         # Create the mouth mask
 | |
|         mouth_mask, mouth_cutout, mouth_box, lower_lip_polygon = (
 | |
|             create_lower_mouth_mask(target_face, swapped_frame) # Use swapped_frame here
 | |
|         )
 | |
| 
 | |
|         # Apply the mouth area
 | |
|         swapped_frame = apply_mouth_area(
 | |
|             swapped_frame, mouth_cutout, mouth_box, face_mask, lower_lip_polygon
 | |
|         )
 | |
| 
 | |
|         if modules.globals.show_mouth_mask_box:
 | |
|             mouth_mask_data = (mouth_mask, mouth_cutout, mouth_box, lower_lip_polygon)
 | |
|             swapped_frame = draw_mouth_mask_visualization(
 | |
|                 swapped_frame, target_face, mouth_mask_data
 | |
|             )
 | |
| 
 | |
|     return swapped_frame
 | |
| 
 | |
| 
 | |
| def process_frame(source_face: Face, temp_frame: Frame) -> Frame:
 | |
|     if modules.globals.color_correction:
 | |
|         temp_frame = cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB)
 | |
| 
 | |
|     if modules.globals.many_faces:
 | |
|         many_faces = get_many_faces(temp_frame)
 | |
|         if many_faces:
 | |
|             for target_face in many_faces:
 | |
|                 if source_face and target_face: # target_face from many_faces will always be valid here
 | |
|                     temp_frame = swap_face(source_face, target_face, temp_frame)
 | |
|                 elif not source_face: # Check source_face specifically
 | |
|                     logging.error("Source face is not available or no face detected in source image. Skipping swap for this target face.")
 | |
|                     # Optionally `continue` or `break` if source_face is essential for all
 | |
|         elif not source_face : # if many_faces is empty AND source_face is also an issue
 | |
|              logging.error("Source face is not available AND no faces detected in target frame.")
 | |
|         else: # many_faces is empty, but source_face is ok
 | |
|              logging.info(f"No faces detected in the current target frame for 'many_faces' mode.")
 | |
|     else:
 | |
|         target_face = get_one_face(temp_frame)
 | |
|         if target_face and source_face:
 | |
|             temp_frame = swap_face(source_face, target_face, temp_frame)
 | |
|         else:
 | |
|             if not source_face:
 | |
|                 logging.error("Source face is not available or no face detected in source image.")
 | |
|             elif not target_face:
 | |
|                 logging.error(f"No face detected in the current target frame.")
 | |
|             else: # Should not happen if logic is right, but as a fallback
 | |
|                 logging.error("Face detection failed for an unknown reason concerning target or source.")
 | |
|     return temp_frame
 | |
| 
 | |
| 
 | |
| 
 | |
| def process_frame_v2(temp_frame: Frame, temp_frame_path: str = "") -> Frame:
 | |
|     if is_image(modules.globals.target_path):
 | |
|         if modules.globals.many_faces:
 | |
|             source_face = default_source_face()
 | |
|             for map in modules.globals.source_target_map:
 | |
|                 target_face = map["target"]["face"]
 | |
|                 temp_frame = swap_face(source_face, target_face, temp_frame)
 | |
| 
 | |
|         elif not modules.globals.many_faces:
 | |
|             for map in modules.globals.source_target_map:
 | |
|                 if "source" in map:
 | |
|                     source_face = map["source"]["face"]
 | |
|                     target_face = map["target"]["face"]
 | |
|                     temp_frame = swap_face(source_face, target_face, temp_frame)
 | |
| 
 | |
|     elif is_video(modules.globals.target_path):
 | |
|         if modules.globals.many_faces:
 | |
|             source_face = default_source_face()
 | |
|             for map in modules.globals.source_target_map:
 | |
|                 target_frame = [
 | |
|                     f
 | |
|                     for f in map["target_faces_in_frame"]
 | |
|                     if f["location"] == temp_frame_path
 | |
|                 ]
 | |
| 
 | |
|                 for frame in target_frame:
 | |
|                     for target_face in frame["faces"]:
 | |
|                         temp_frame = swap_face(source_face, target_face, temp_frame)
 | |
| 
 | |
|         elif not modules.globals.many_faces:
 | |
|             for map in modules.globals.source_target_map:
 | |
|                 if "source" in map:
 | |
|                     target_frame = [
 | |
|                         f
 | |
|                         for f in map["target_faces_in_frame"]
 | |
|                         if f["location"] == temp_frame_path
 | |
|                     ]
 | |
|                     source_face = map["source"]["face"]
 | |
| 
 | |
|                     for frame in target_frame:
 | |
|                         for target_face in frame["faces"]:
 | |
|                             temp_frame = swap_face(source_face, target_face, temp_frame)
 | |
| 
 | |
|     else:
 | |
|         detected_faces = get_many_faces(temp_frame)
 | |
|         if modules.globals.many_faces:
 | |
|             if detected_faces:
 | |
|                 source_face = default_source_face()
 | |
|                 for target_face in detected_faces:
 | |
|                     temp_frame = swap_face(source_face, target_face, temp_frame)
 | |
| 
 | |
|         elif not modules.globals.many_faces:
 | |
|             if detected_faces:
 | |
|                 if len(detected_faces) <= len(
 | |
|                     modules.globals.simple_map["target_embeddings"]
 | |
|                 ):
 | |
|                     for detected_face in detected_faces:
 | |
|                         closest_centroid_index, _ = find_closest_centroid(
 | |
|                             modules.globals.simple_map["target_embeddings"],
 | |
|                             detected_face.normed_embedding,
 | |
|                         )
 | |
| 
 | |
|                         temp_frame = swap_face(
 | |
|                             modules.globals.simple_map["source_faces"][
 | |
|                                 closest_centroid_index
 | |
|                             ],
 | |
|                             detected_face,
 | |
|                             temp_frame,
 | |
|                         )
 | |
|                 else:
 | |
|                     detected_faces_centroids = []
 | |
|                     for face in detected_faces:
 | |
|                         detected_faces_centroids.append(face.normed_embedding)
 | |
|                     i = 0
 | |
|                     for target_embedding in modules.globals.simple_map[
 | |
|                         "target_embeddings"
 | |
|                     ]:
 | |
|                         closest_centroid_index, _ = find_closest_centroid(
 | |
|                             detected_faces_centroids, target_embedding
 | |
|                         )
 | |
| 
 | |
|                         temp_frame = swap_face(
 | |
|                             modules.globals.simple_map["source_faces"][i],
 | |
|                             detected_faces[closest_centroid_index],
 | |
|                             temp_frame,
 | |
|                         )
 | |
|                         i += 1
 | |
|     return temp_frame
 | |
| 
 | |
| 
 | |
| def process_frames(
 | |
|     source_path: str, temp_frame_paths: List[str], progress: Any = None
 | |
| ) -> None:
 | |
|     if not modules.globals.map_faces:
 | |
|         source_face = get_one_face(cv2.imread(source_path))
 | |
|         for temp_frame_path in temp_frame_paths:
 | |
|             temp_frame = cv2.imread(temp_frame_path)
 | |
|             try:
 | |
|                 result = process_frame(source_face, temp_frame)
 | |
|                 cv2.imwrite(temp_frame_path, result)
 | |
|             except Exception as exception:
 | |
|                 print(exception)
 | |
|                 pass
 | |
|             if progress:
 | |
|                 progress.update(1)
 | |
|     else:
 | |
|         for temp_frame_path in temp_frame_paths:
 | |
|             temp_frame = cv2.imread(temp_frame_path)
 | |
|             try:
 | |
|                 result = process_frame_v2(temp_frame, temp_frame_path)
 | |
|                 cv2.imwrite(temp_frame_path, result)
 | |
|             except Exception as exception:
 | |
|                 print(exception)
 | |
|                 pass
 | |
|             if progress:
 | |
|                 progress.update(1)
 | |
| 
 | |
| 
 | |
| def process_image(source_path: str, target_path: str, output_path: str) -> None:
 | |
|     if not modules.globals.map_faces:
 | |
|         source_face = get_one_face(cv2.imread(source_path))
 | |
|         target_frame = cv2.imread(target_path)
 | |
|         result = process_frame(source_face, target_frame)
 | |
|         cv2.imwrite(output_path, result)
 | |
|     else:
 | |
|         if modules.globals.many_faces:
 | |
|             update_status(
 | |
|                 "Many faces enabled. Using first source image. Progressing...", NAME
 | |
|             )
 | |
|         target_frame = cv2.imread(output_path)
 | |
|         result = process_frame_v2(target_frame)
 | |
|         cv2.imwrite(output_path, result)
 | |
| 
 | |
| 
 | |
| def process_video(source_path: str, temp_frame_paths: List[str]) -> None:
 | |
|     if modules.globals.map_faces and modules.globals.many_faces:
 | |
|         update_status(
 | |
|             "Many faces enabled. Using first source image. Progressing...", NAME
 | |
|         )
 | |
|     modules.processors.frame.core.process_video(
 | |
|         source_path, temp_frame_paths, process_frames
 | |
|     )
 | |
| 
 | |
| 
 | |
| def create_lower_mouth_mask(
 | |
|     face: Face, frame: Frame
 | |
| ) -> (np.ndarray, np.ndarray, tuple, np.ndarray):
 | |
|     mask = np.zeros(frame.shape[:2], dtype=np.uint8)
 | |
|     mouth_cutout = None
 | |
|     landmarks = face.landmark_2d_106
 | |
|     if landmarks is not None:
 | |
|         #                  0  1  2  3  4  5  6  7  8  9  10 11 12 13 14 15 16 17 18 19 20
 | |
|         lower_lip_order = [
 | |
|             65,
 | |
|             66,
 | |
|             62,
 | |
|             70,
 | |
|             69,
 | |
|             18,
 | |
|             19,
 | |
|             20,
 | |
|             21,
 | |
|             22,
 | |
|             23,
 | |
|             24,
 | |
|             0,
 | |
|             8,
 | |
|             7,
 | |
|             6,
 | |
|             5,
 | |
|             4,
 | |
|             3,
 | |
|             2,
 | |
|             65,
 | |
|         ]
 | |
|         lower_lip_landmarks = landmarks[lower_lip_order].astype(
 | |
|             np.float32
 | |
|         )  # Use float for precise calculations
 | |
| 
 | |
|         # Calculate the center of the landmarks
 | |
|         center = np.mean(lower_lip_landmarks, axis=0)
 | |
| 
 | |
|         # Expand the landmarks outward
 | |
|         expansion_factor = (
 | |
|             1 + modules.globals.mask_down_size
 | |
|         )  # Adjust this for more or less expansion
 | |
|         expanded_landmarks = (lower_lip_landmarks - center) * expansion_factor + center
 | |
| 
 | |
|         # Extend the top lip part
 | |
|         toplip_indices = [
 | |
|             20,
 | |
|             0,
 | |
|             1,
 | |
|             2,
 | |
|             3,
 | |
|             4,
 | |
|             5,
 | |
|         ]  # Indices for landmarks 2, 65, 66, 62, 70, 69, 18
 | |
|         toplip_extension = (
 | |
|             modules.globals.mask_size * 0.5
 | |
|         )  # Adjust this factor to control the extension
 | |
|         for idx in toplip_indices:
 | |
|             direction = expanded_landmarks[idx] - center
 | |
|             direction = direction / np.linalg.norm(direction)
 | |
|             expanded_landmarks[idx] += direction * toplip_extension
 | |
| 
 | |
|         # Extend the bottom part (chin area)
 | |
|         chin_indices = [
 | |
|             11,
 | |
|             12,
 | |
|             13,
 | |
|             14,
 | |
|             15,
 | |
|             16,
 | |
|         ]  # Indices for landmarks 21, 22, 23, 24, 0, 8
 | |
|         chin_extension = 2 * 0.2  # Adjust this factor to control the extension
 | |
|         for idx in chin_indices:
 | |
|             expanded_landmarks[idx][1] += (
 | |
|                 expanded_landmarks[idx][1] - center[1]
 | |
|             ) * chin_extension
 | |
| 
 | |
|         # Convert back to integer coordinates
 | |
|         expanded_landmarks = expanded_landmarks.astype(np.int32)
 | |
| 
 | |
|         # Calculate bounding box for the expanded lower mouth
 | |
|         min_x, min_y = np.min(expanded_landmarks, axis=0)
 | |
|         max_x, max_y = np.max(expanded_landmarks, axis=0)
 | |
| 
 | |
|         # Add some padding to the bounding box
 | |
|         padding = int((max_x - min_x) * 0.1)  # 10% padding
 | |
|         min_x = max(0, min_x - padding)
 | |
|         min_y = max(0, min_y - padding)
 | |
|         max_x = min(frame.shape[1], max_x + padding)
 | |
|         max_y = min(frame.shape[0], max_y + padding)
 | |
| 
 | |
|         # Ensure the bounding box dimensions are valid
 | |
|         if max_x <= min_x or max_y <= min_y:
 | |
|             if (max_x - min_x) <= 1:
 | |
|                 max_x = min_x + 1
 | |
|             if (max_y - min_y) <= 1:
 | |
|                 max_y = min_y + 1
 | |
| 
 | |
|         # Create the mask
 | |
|         mask_roi = np.zeros((max_y - min_y, max_x - min_x), dtype=np.uint8)
 | |
|         cv2.fillPoly(mask_roi, [expanded_landmarks - [min_x, min_y]], 255)
 | |
| 
 | |
|         # Apply Gaussian blur to soften the mask edges
 | |
|         # Default kernel size for mouth mask blur is (9,9) as a balance between performance and smoothing.
 | |
|         # Larger values (e.g., (15,15) - the previous hardcoded value) provide more smoothing but are slower.
 | |
|         # This is configurable via modules.globals.mouth_mask_blur_kernel_size.
 | |
|         kernel_size_mouth_config = getattr(modules.globals, 'mouth_mask_blur_kernel_size', (9, 9))
 | |
|         valid_kernel_mouth = _validate_kernel_size(kernel_size_mouth_config, (9, 9))
 | |
|         mask_roi = cv2.GaussianBlur(mask_roi, valid_kernel_mouth, 0)
 | |
| 
 | |
|         # Place the mask ROI in the full-sized mask
 | |
|         mask[min_y:max_y, min_x:max_x] = mask_roi
 | |
| 
 | |
|         # Extract the masked area from the frame
 | |
|         mouth_cutout = frame[min_y:max_y, min_x:max_x].copy()
 | |
| 
 | |
|         # Return the expanded lower lip polygon in original frame coordinates
 | |
|         lower_lip_polygon = expanded_landmarks
 | |
| 
 | |
|     return mask, mouth_cutout, (min_x, min_y, max_x, max_y), lower_lip_polygon
 | |
| 
 | |
| 
 | |
| def draw_mouth_mask_visualization(
 | |
|     frame: Frame, face: Face, mouth_mask_data: tuple
 | |
| ) -> Frame:
 | |
|     landmarks = face.landmark_2d_106
 | |
|     if landmarks is not None and mouth_mask_data is not None:
 | |
|         mask, mouth_cutout, (min_x, min_y, max_x, max_y), lower_lip_polygon = (
 | |
|             mouth_mask_data
 | |
|         )
 | |
| 
 | |
|         vis_frame = frame.copy()
 | |
| 
 | |
|         # Ensure coordinates are within frame bounds
 | |
|         height, width = vis_frame.shape[:2]
 | |
|         min_x, min_y = max(0, min_x), max(0, min_y)
 | |
|         max_x, max_y = min(width, max_x), min(height, max_y)
 | |
| 
 | |
|         # Adjust mask to match the region size
 | |
|         mask_region = mask[0 : max_y - min_y, 0 : max_x - min_x]
 | |
| 
 | |
|         # Remove the color mask overlay
 | |
|         # color_mask = cv2.applyColorMap((mask_region * 255).astype(np.uint8), cv2.COLORMAP_JET)
 | |
| 
 | |
|         # Ensure shapes match before blending
 | |
|         vis_region = vis_frame[min_y:max_y, min_x:max_x]
 | |
|         # Remove blending with color_mask
 | |
|         # if vis_region.shape[:2] == color_mask.shape[:2]:
 | |
|         #     blended = cv2.addWeighted(vis_region, 0.7, color_mask, 0.3, 0)
 | |
|         #     vis_frame[min_y:max_y, min_x:max_x] = blended
 | |
| 
 | |
|         # Draw the lower lip polygon
 | |
|         cv2.polylines(vis_frame, [lower_lip_polygon], True, (0, 255, 0), 2)
 | |
| 
 | |
|         # Remove the red box
 | |
|         # cv2.rectangle(vis_frame, (min_x, min_y), (max_x, max_y), (0, 0, 255), 2)
 | |
| 
 | |
|         # Visualize the feathered mask
 | |
|         feather_amount = max(
 | |
|             1,
 | |
|             min(
 | |
|                 30,
 | |
|                 (max_x - min_x) // modules.globals.mask_feather_ratio,
 | |
|                 (max_y - min_y) // modules.globals.mask_feather_ratio,
 | |
|             ),
 | |
|         )
 | |
|         # Ensure kernel size is odd
 | |
|         kernel_size = 2 * feather_amount + 1
 | |
|         feathered_mask = cv2.GaussianBlur(
 | |
|             mask_region.astype(float), (kernel_size, kernel_size), 0
 | |
|         )
 | |
|         feathered_mask = (feathered_mask / feathered_mask.max() * 255).astype(np.uint8)
 | |
|         # Remove the feathered mask color overlay
 | |
|         # color_feathered_mask = cv2.applyColorMap(feathered_mask, cv2.COLORMAP_VIRIDIS)
 | |
| 
 | |
|         # Ensure shapes match before blending feathered mask
 | |
|         # if vis_region.shape == color_feathered_mask.shape:
 | |
|         #     blended_feathered = cv2.addWeighted(vis_region, 0.7, color_feathered_mask, 0.3, 0)
 | |
|         #     vis_frame[min_y:max_y, min_x:max_x] = blended_feathered
 | |
| 
 | |
|         # Add labels
 | |
|         cv2.putText(
 | |
|             vis_frame,
 | |
|             "Lower Mouth Mask",
 | |
|             (min_x, min_y - 10),
 | |
|             cv2.FONT_HERSHEY_SIMPLEX,
 | |
|             0.5,
 | |
|             (255, 255, 255),
 | |
|             1,
 | |
|         )
 | |
|         cv2.putText(
 | |
|             vis_frame,
 | |
|             "Feathered Mask",
 | |
|             (min_x, max_y + 20),
 | |
|             cv2.FONT_HERSHEY_SIMPLEX,
 | |
|             0.5,
 | |
|             (255, 255, 255),
 | |
|             1,
 | |
|         )
 | |
| 
 | |
|         return vis_frame
 | |
|     return frame
 | |
| 
 | |
| 
 | |
| def apply_mouth_area(
 | |
|     frame: np.ndarray,
 | |
|     mouth_cutout: np.ndarray,
 | |
|     mouth_box: tuple,
 | |
|     face_mask: np.ndarray,
 | |
|     mouth_polygon: np.ndarray,
 | |
| ) -> np.ndarray:
 | |
|     min_x, min_y, max_x, max_y = mouth_box
 | |
|     box_width = max_x - min_x
 | |
|     box_height = max_y - min_y
 | |
| 
 | |
|     if (
 | |
|         mouth_cutout is None
 | |
|         or box_width is None
 | |
|         or box_height is None
 | |
|         or face_mask is None
 | |
|         or mouth_polygon is None
 | |
|     ):
 | |
|         return frame
 | |
| 
 | |
|     try:
 | |
|         resized_mouth_cutout = cv2.resize(mouth_cutout, (box_width, box_height))
 | |
|         roi = frame[min_y:max_y, min_x:max_x]
 | |
| 
 | |
|         if roi.shape != resized_mouth_cutout.shape:
 | |
|             resized_mouth_cutout = cv2.resize(
 | |
|                 resized_mouth_cutout, (roi.shape[1], roi.shape[0])
 | |
|             )
 | |
| 
 | |
|         color_corrected_mouth = apply_color_transfer(resized_mouth_cutout, roi)
 | |
| 
 | |
|         # Use the provided mouth polygon to create the mask
 | |
|         polygon_mask = np.zeros(roi.shape[:2], dtype=np.uint8)
 | |
|         adjusted_polygon = mouth_polygon - [min_x, min_y]
 | |
|         cv2.fillPoly(polygon_mask, [adjusted_polygon], 255)
 | |
| 
 | |
|         # Apply feathering to the polygon mask
 | |
|         feather_amount = min(
 | |
|             30,
 | |
|             box_width // modules.globals.mask_feather_ratio,
 | |
|             box_height // modules.globals.mask_feather_ratio,
 | |
|         )
 | |
|         feathered_mask = cv2.GaussianBlur(
 | |
|             polygon_mask.astype(float), (0, 0), feather_amount
 | |
|         )
 | |
| 
 | |
|         mask_max_value = feathered_mask.max()
 | |
|         if mask_max_value < 1e-6:  # Check if max is effectively zero
 | |
|             logging.warning("Mouth mask's feathered_mask is all zeros or near-zeros after blur. Resulting mask will be black.")
 | |
|             feathered_mask = np.zeros_like(polygon_mask, dtype=np.uint8)
 | |
|         else:
 | |
|             feathered_mask = (feathered_mask / mask_max_value * 255).astype(np.uint8)
 | |
| 
 | |
|         face_mask_roi = face_mask[min_y:max_y, min_x:max_x]
 | |
|         combined_mask = feathered_mask * (face_mask_roi / 255.0)
 | |
| 
 | |
|         combined_mask = combined_mask[:, :, np.newaxis]
 | |
|         blended = (
 | |
|             color_corrected_mouth * combined_mask + roi * (1 - combined_mask)
 | |
|         ).astype(np.uint8)
 | |
| 
 | |
|         # Apply face mask to blended result
 | |
|         face_mask_3channel = (
 | |
|             np.repeat(face_mask_roi[:, :, np.newaxis], 3, axis=2) / 255.0
 | |
|         )
 | |
|         final_blend = blended * face_mask_3channel + roi * (1 - face_mask_3channel)
 | |
| 
 | |
|         frame[min_y:max_y, min_x:max_x] = final_blend.astype(np.uint8)
 | |
|     except Exception as e:
 | |
|         pass
 | |
| 
 | |
|     return frame
 | |
| 
 | |
| 
 | |
| def create_face_mask(face: Face, frame: Frame) -> np.ndarray:
 | |
|     mask = np.zeros(frame.shape[:2], dtype=np.uint8)
 | |
|     landmarks = face.landmark_2d_106
 | |
|     if landmarks is not None:
 | |
|         # Convert landmarks to int32
 | |
|         landmarks = landmarks.astype(np.int32)
 | |
| 
 | |
|         # Extract facial features
 | |
|         right_side_face = landmarks[0:16]
 | |
|         left_side_face = landmarks[17:32]
 | |
|         right_eye = landmarks[33:42]
 | |
|         right_eye_brow = landmarks[43:51]
 | |
|         left_eye = landmarks[87:96]
 | |
|         left_eye_brow = landmarks[97:105]
 | |
| 
 | |
|         # Calculate forehead extension
 | |
|         right_eyebrow_top = np.min(right_eye_brow[:, 1])
 | |
|         left_eyebrow_top = np.min(left_eye_brow[:, 1])
 | |
|         eyebrow_top = min(right_eyebrow_top, left_eyebrow_top)
 | |
| 
 | |
|         face_top = np.min([right_side_face[0, 1], left_side_face[-1, 1]])
 | |
|         forehead_height = face_top - eyebrow_top
 | |
|         forehead_factor = getattr(modules.globals, 'forehead_extension_factor', 2.5)
 | |
|         extended_forehead_height = int(forehead_height * forehead_factor)
 | |
| 
 | |
|         # Create forehead points
 | |
|         forehead_left = right_side_face[0].copy()
 | |
|         forehead_right = left_side_face[-1].copy()
 | |
|         forehead_left[1] -= extended_forehead_height
 | |
|         forehead_right[1] -= extended_forehead_height
 | |
| 
 | |
|         # Combine all points to create the face outline
 | |
|         face_outline = np.vstack(
 | |
|             [
 | |
|                 [forehead_left],
 | |
|                 right_side_face,
 | |
|                 left_side_face[
 | |
|                     ::-1
 | |
|                 ],  # Reverse left side to create a continuous outline
 | |
|                 [forehead_right],
 | |
|             ]
 | |
|         )
 | |
| 
 | |
|         # Calculate padding
 | |
|         padding = int(
 | |
|             np.linalg.norm(right_side_face[0] - left_side_face[-1]) * 0.05
 | |
|         )  # 5% of face width
 | |
| 
 | |
|         # Create a slightly larger convex hull for padding
 | |
|         hull = cv2.convexHull(face_outline)
 | |
|         hull_padded = []
 | |
|         for point in hull:
 | |
|             x, y = point[0]
 | |
|             center = np.mean(face_outline, axis=0)
 | |
|             direction = np.array([x, y]) - center
 | |
|             direction = direction / np.linalg.norm(direction)
 | |
|             padded_point = np.array([x, y]) + direction * padding
 | |
|             hull_padded.append(padded_point)
 | |
| 
 | |
|         hull_padded = np.array(hull_padded, dtype=np.int32)
 | |
| 
 | |
|         # Fill the padded convex hull
 | |
|         cv2.fillConvexPoly(mask, hull_padded, 255)
 | |
| 
 | |
|         # Smooth the mask edges
 | |
|         kernel_size_face_config = getattr(modules.globals, 'face_mask_blur_kernel_size', (5, 5))
 | |
|         valid_kernel_face = _validate_kernel_size(kernel_size_face_config, (5, 5))
 | |
|         mask = cv2.GaussianBlur(mask, valid_kernel_face, 0)
 | |
| 
 | |
|     return mask
 | |
| 
 | |
| 
 | |
| def apply_color_transfer(source, target):
 | |
|     """
 | |
|     Apply color transfer from target to source image
 | |
|     """
 | |
|     source = cv2.cvtColor(source, cv2.COLOR_BGR2LAB).astype("float32")
 | |
|     target = cv2.cvtColor(target, cv2.COLOR_BGR2LAB).astype("float32")
 | |
| 
 | |
|     source_mean, source_std = cv2.meanStdDev(source)
 | |
|     target_mean, target_std = cv2.meanStdDev(target)
 | |
| 
 | |
|     # Reshape mean and std to be broadcastable
 | |
|     source_mean = source_mean.reshape(1, 1, 3)
 | |
|     source_std = source_std.reshape(1, 1, 3)
 | |
|     target_mean = target_mean.reshape(1, 1, 3)
 | |
|     target_std = target_std.reshape(1, 1, 3)
 | |
| 
 | |
|     # Perform the color transfer
 | |
|     source = (source - source_mean) * (target_std / source_std) + target_mean
 | |
| 
 | |
|     return cv2.cvtColor(np.clip(source, 0, 255).astype("uint8"), cv2.COLOR_LAB2BGR)
 |