Spaces:
Runtime error
Runtime error
Upload 58 files
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- .gitattributes +33 -0
- README.md +12 -12
- app.py +182 -0
- baldhead.py +272 -0
- bbox_utils.py +31 -0
- detect_face.py +93 -0
- example_wigs/Heart/HH02.png +3 -0
- example_wigs/Heart/HH03.png +3 -0
- example_wigs/Heart/Loire.png +3 -0
- example_wigs/Heart/SantaRossa.png +3 -0
- example_wigs/Heart/Tuscany.png +3 -0
- example_wigs/Oblong/HH01.png +3 -0
- example_wigs/Oblong/HH02.png +3 -0
- example_wigs/Oblong/HH03.png +3 -0
- example_wigs/Oblong/HH07.png +3 -0
- example_wigs/Oblong/Loire.png +3 -0
- example_wigs/Oval/Alsace.png +3 -0
- example_wigs/Oval/Barossa.png +3 -0
- example_wigs/Oval/Burgundy.png +3 -0
- example_wigs/Oval/HH01.png +3 -0
- example_wigs/Oval/HH02.png +3 -0
- example_wigs/Oval/HH03.png +3 -0
- example_wigs/Oval/HH07.png +3 -0
- example_wigs/Oval/Loire.png +3 -0
- example_wigs/Oval/Napa.png +3 -0
- example_wigs/Oval/Piemonte.png +3 -0
- example_wigs/Oval/Rhone.png +3 -0
- example_wigs/Oval/SantaRossa.png +3 -0
- example_wigs/Oval/Sonoma.png +3 -0
- example_wigs/Oval/Tuscany.png +3 -0
- example_wigs/Round/Loire.png +3 -0
- example_wigs/Round/Piemonte.png +3 -0
- example_wigs/Round/Sonoma.png +3 -0
- example_wigs/Round/Tuscany.png +3 -0
- example_wigs/Square/HH03.png +3 -0
- example_wigs/Square/Loire.png +3 -0
- example_wigs/Square/Piemonte.png +3 -0
- example_wigs/Square/Sonoma.png +3 -0
- example_wigs/Square/Tuscany.png +3 -0
- overlay.py +89 -0
- requirements.txt +35 -0
- roop/__init__.py +0 -0
- roop/capturer.py +20 -0
- roop/core.py +217 -0
- roop/face_analyser.py +124 -0
- roop/globals.py +17 -0
- roop/metadata.py +2 -0
- roop/predicter.py +25 -0
- roop/processors/__init__.py +0 -0
- roop/processors/frame/__init__.py +0 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,36 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
example_wigs/Heart/HH02.png filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
example_wigs/Heart/HH03.png filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
example_wigs/Heart/Loire.png filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
example_wigs/Heart/SantaRossa.png filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
example_wigs/Heart/Tuscany.png filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
example_wigs/Oblong/HH01.png filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
example_wigs/Oblong/HH02.png filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
example_wigs/Oblong/HH03.png filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
example_wigs/Oblong/HH07.png filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
example_wigs/Oblong/Loire.png filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
example_wigs/Oval/Alsace.png filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
example_wigs/Oval/Barossa.png filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
example_wigs/Oval/Burgundy.png filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
example_wigs/Oval/HH01.png filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
example_wigs/Oval/HH02.png filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
example_wigs/Oval/HH03.png filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
example_wigs/Oval/HH07.png filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
example_wigs/Oval/Loire.png filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
example_wigs/Oval/Napa.png filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
example_wigs/Oval/Piemonte.png filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
example_wigs/Oval/Rhone.png filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
example_wigs/Oval/SantaRossa.png filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
example_wigs/Oval/Sonoma.png filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
example_wigs/Oval/Tuscany.png filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
example_wigs/Round/Loire.png filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
example_wigs/Round/Piemonte.png filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
example_wigs/Round/Sonoma.png filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
example_wigs/Round/Tuscany.png filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
example_wigs/Square/HH03.png filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
example_wigs/Square/Loire.png filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
example_wigs/Square/Piemonte.png filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
example_wigs/Square/Sonoma.png filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
example_wigs/Square/Tuscany.png filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
|
@@ -1,12 +1,12 @@
|
|
| 1 |
-
---
|
| 2 |
-
title:
|
| 3 |
-
emoji:
|
| 4 |
-
colorFrom:
|
| 5 |
-
colorTo:
|
| 6 |
-
sdk: gradio
|
| 7 |
-
sdk_version: 5.
|
| 8 |
-
app_file: app.py
|
| 9 |
-
pinned: false
|
| 10 |
-
---
|
| 11 |
-
|
| 12 |
-
Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
|
|
|
|
| 1 |
+
---
|
| 2 |
+
title: Ghep Image
|
| 3 |
+
emoji: 📉
|
| 4 |
+
colorFrom: pink
|
| 5 |
+
colorTo: blue
|
| 6 |
+
sdk: gradio
|
| 7 |
+
sdk_version: 5.31.0
|
| 8 |
+
app_file: app.py
|
| 9 |
+
pinned: false
|
| 10 |
+
---
|
| 11 |
+
|
| 12 |
+
Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
|
app.py
ADDED
|
@@ -0,0 +1,182 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
import gradio as gr
|
| 3 |
+
from overlay import overlay_source
|
| 4 |
+
from detect_face import predict, NUM_CLASSES
|
| 5 |
+
from swapface import swap_face_now
|
| 6 |
+
import os
|
| 7 |
+
from pathlib import Path
|
| 8 |
+
|
| 9 |
+
BASE_DIR = Path(__file__).parent # thư mục chứa app.py
|
| 10 |
+
FOLDER = BASE_DIR / "example_wigs"
|
| 11 |
+
|
| 12 |
+
# --- Load gallery images from a folder ---
def load_images_from_folder(folder_path: str) -> list[str]:
    """
    Return a sorted list of image file paths (jpg, jpeg, png, gif, bmp)
    found directly inside `folder_path`.

    Returns an empty list when the folder does not exist or contains
    no supported images (a warning is printed in both cases).
    """
    supported = {'.jpg', '.jpeg', '.png', '.gif', '.bmp'}
    if not os.path.isdir(folder_path):
        print(f"Cảnh báo: '{folder_path}' không phải folder hợp lệ.")
        return []
    # sorted(): os.listdir() order is filesystem-dependent; sorting keeps
    # the suggestion gallery deterministic across runs.
    files = [
        os.path.join(folder_path, fn)
        for fn in sorted(os.listdir(folder_path))
        if os.path.splitext(fn)[1].lower() in supported
    ]
    if not files:
        print(f"Không tìm thấy hình trong: {folder_path}")
    return files
|
| 29 |
+
|
| 30 |
+
def on_gallery_select(evt: gr.SelectData):
    """
    Handle a thumbnail click. Returns:
      1) the file path to load into the Source image component
      2) the base filename to display in the Textbox
    """
    selected = evt.value

    # Extract a usable file path from whatever shape Gradio hands us.
    filepath = None
    if isinstance(selected, str):
        filepath = selected
    elif isinstance(selected, dict):
        entry = selected.get("image")
        if isinstance(entry, str):
            filepath = entry
        elif isinstance(entry, dict):
            filepath = entry.get("path") or entry.get("url")
        else:
            # Fall back to the first string value that is an existing file.
            for candidate in selected.values():
                if isinstance(candidate, str) and os.path.isfile(candidate):
                    filepath = candidate
                    break
    else:
        raise ValueError(f"Kiểu không hỗ trợ: {type(selected)}")

    filename = os.path.basename(filepath) if filepath else ""
    return filepath, filename
|
| 57 |
+
|
| 58 |
+
# --- Map the classified face shape to its wig folder ---
def infer_folder(image) -> str:
    """Classify the face shape of `image` and return the matching example-wig folder path."""
    face_shape = predict(image)["predicted_class"]
    return str(FOLDER / face_shape)
|
| 63 |
+
|
| 64 |
+
# --- Combined handler: classification + image loading ---
def handle_bg_change(image):
    """
    React to a background-image change:
      1. classify the face shape
      2. load suggestion images from the matching folder
    Returns ("", []) when there is no image or anything fails.
    """
    if image is None:
        return "", []

    try:
        folder = infer_folder(image)
        return folder, load_images_from_folder(folder)
    except Exception as e:
        print(f"Lỗi xử lý ảnh: {e}")
        return "", []
|
| 81 |
+
|
| 82 |
+
# --- Face-swap wrapper ---
def swap_face_wrapper(background_img, result_img):
    """
    Swap the face from `background_img` onto `result_img`.
    Returns None when either input is missing, and the unmodified
    `result_img` when the swap itself raises.
    """
    if background_img is None or result_img is None:
        return None

    try:
        # Transfer the face from the background onto the result image.
        return swap_face_now(background_img, result_img, do_enhance=True)
    except Exception as e:
        print(f"Lỗi swap face: {e}")
        return result_img
|
| 97 |
+
|
| 98 |
+
# --- Combined pipeline: overlay then face swap ---
def combined_hair_and_face(background_img, source_img):
    """
    Run the wig overlay first, then swap the original face onto the result.
    Returns None when an input is missing or the pipeline fails.
    """
    if background_img is None or source_img is None:
        return None

    try:
        # Step 1: composite the wig onto the background.
        with_hair = overlay_source(background_img, source_img)
        # Step 2: swap the face from the background onto the overlay result.
        return swap_face_wrapper(background_img, with_hair)
    except Exception as e:
        print(f"Lỗi trong quá trình gộp hair + face: {e}")
        return None
|
| 117 |
+
|
| 118 |
+
# --- Build the Gradio UI ---
def build_demo():
    """Assemble and return the Gradio Blocks app (UI layout + event wiring)."""
    with gr.Blocks(title="Hair Try-On & Face Swap", theme=gr.themes.Soft()) as demo:
        gr.Markdown("""
        # 🎯 Hair Try-On & Face Swap Application
        """)
        with gr.Row():
            # User photo, selected wig, and pipeline output side by side.
            bg = gr.Image(type="pil", label="Background", height=500)
            src = gr.Image(type="pil", label="Source", height=500, interactive=False)
            out = gr.Image(label="Result", height=500, interactive=False)

        # Hidden textbox holding the inferred folder path (debug/state only).
        folder_path_box = gr.Textbox(label="Folder path", visible=False)


        with gr.Row():
            src_name_box = gr.Textbox(
                label="Wigs Name",
                interactive=False,
                show_copy_button=True ,  # optional — convenient for copying the path
                scale = 1
            )
            gallery = gr.Gallery(
                label="Recommend For You",
                height=300,
                value=[],
                type="filepath",
                interactive=False,
                columns=5,
                object_fit="cover",
                allow_preview=True,
                scale = 8
            )
        with gr.Column(scale=1):
            combined_btn = gr.Button("🔄✨ Run Hair + Face Swap", variant="primary")
            btn = gr.Button("🔄 Run Hair Only", variant="secondary")
            swap_btn = gr.Button("👤 Swap Face Only", variant="secondary")


        # Run the combined hair + face-swap pipeline.
        combined_btn.click(fn=combined_hair_and_face, inputs=[bg, src], outputs=[out])

        # Hair overlay only.
        btn.click(fn=overlay_source, inputs=[bg, src], outputs=[out])

        # Face swap only (from background onto the current result).
        swap_btn.click(fn=swap_face_wrapper, inputs=[bg, out], outputs=[out])

        # When the background changes, auto-classify and load suggestions.
        bg.change(
            fn=handle_bg_change,
            inputs=[bg],
            outputs=[folder_path_box, gallery],
            show_progress=True
        )
        # When a gallery image is selected, load it into the Source slot.
        gallery.select(
            fn=on_gallery_select,
            outputs=[src, src_name_box]
        )

    return demo
|
| 180 |
+
|
| 181 |
+
if __name__ == "__main__":
    # Launch the Gradio app when run as a script.
    build_demo().launch()
|
baldhead.py
ADDED
|
@@ -0,0 +1,272 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# baldhead.py
|
| 2 |
+
|
| 3 |
+
import os
|
| 4 |
+
import cv2
|
| 5 |
+
import numpy as np
|
| 6 |
+
from PIL import Image
|
| 7 |
+
import tensorflow as tf
|
| 8 |
+
import gradio as gr
|
| 9 |
+
|
| 10 |
+
# Keras imports (note: keras-contrib must be installed)
|
| 11 |
+
import keras.backend as K
|
| 12 |
+
from keras.layers import (
|
| 13 |
+
Input,
|
| 14 |
+
Conv2D,
|
| 15 |
+
UpSampling2D,
|
| 16 |
+
LeakyReLU,
|
| 17 |
+
GlobalAveragePooling2D,
|
| 18 |
+
Dense,
|
| 19 |
+
Reshape,
|
| 20 |
+
Dropout,
|
| 21 |
+
Concatenate,
|
| 22 |
+
multiply, # ← Thêm import multiply
|
| 23 |
+
)
|
| 24 |
+
from keras.models import Model
|
| 25 |
+
from keras_contrib.layers.normalization.instancenormalization import InstanceNormalization
|
| 26 |
+
|
| 27 |
+
# RetinaFace + skimage for face alignment
|
| 28 |
+
from retinaface import RetinaFace
|
| 29 |
+
from skimage import transform as trans
|
| 30 |
+
|
| 31 |
+
# Hugging Face Hub helper
|
| 32 |
+
from huggingface_hub import hf_hub_download
|
| 33 |
+
|
| 34 |
+
|
| 35 |
+
|
| 36 |
+
# --- Face-alignment helpers (same as the original notebook code) ---
# Output size of each aligned face patch.
image_size = [256, 256]
# Canonical 5-point landmark template (eyes, nose tip, mouth corners),
# defined on a 112×112 reference face crop.
src_landmarks = np.array([
    [30.2946, 51.6963],
    [65.5318, 51.5014],
    [48.0252, 71.7366],
    [33.5493, 92.3655],
    [62.7299, 92.2041],
], dtype=np.float32)
# NOTE(review): x is shifted twice (+8 then +15, net +23) — looks like manual
# tuning carried over from the notebook; confirm both shifts are intended.
src_landmarks[:, 0] += 8.0
src_landmarks[:, 0] += 15.0
src_landmarks[:, 1] += 30.0
# Rescale the 112-based template up to a 200-pixel working region.
src_landmarks /= 112
src_landmarks *= 200
|
| 50 |
+
|
| 51 |
+
|
| 52 |
+
def list2array(values):
    """Materialize an iterable (e.g. dict_values) into a NumPy array."""
    return np.asarray([item for item in values])
|
| 54 |
+
|
| 55 |
+
|
| 56 |
+
def align_face(img: np.ndarray):
    """
    Detect faces + landmarks in `img` via RetinaFace.
    Returns lists of aligned face patches (256×256 RGB),
    corresponding binary masks, and the transformation matrices.

    Returns three empty lists when no face is detected.
    """
    # NOTE(review): assumes detect_faces returns a dict of face entries;
    # verify its behavior on images with zero detections.
    faces = RetinaFace.detect_faces(img)
    bboxes = np.array([list2array(faces[f]['facial_area']) for f in faces])
    landmarks = np.array([list2array(faces[f]['landmarks'].values()) for f in faces])

    # An all-white canvas warped with the same transform yields a mask of
    # where the aligned face patch maps back onto the original image.
    white_canvas = np.ones(img.shape, dtype=np.uint8) * 255
    aligned_faces, masks, matrices = [], [], []

    if bboxes.shape[0] > 0:
        for i in range(bboxes.shape[0]):
            dst = landmarks[i]  # detected landmarks
            tform = trans.SimilarityTransform()
            # Similarity transform mapping detected landmarks onto the
            # canonical template (module-level src_landmarks).
            tform.estimate(dst, src_landmarks)
            M = tform.params[0:2, :]  # affine 2×3 part for cv2.warpAffine

            warped_face = cv2.warpAffine(
                img, M, (image_size[1], image_size[0]), borderValue=0.0
            )
            warped_mask = cv2.warpAffine(
                white_canvas, M, (image_size[1], image_size[0]), borderValue=0.0
            )

            aligned_faces.append(warped_face)
            masks.append(warped_mask)
            # Keep the full 3×3 matrix so put_face_back() can invert it.
            matrices.append(tform.params[0:3, :])

    return aligned_faces, masks, matrices
|
| 88 |
+
|
| 89 |
+
|
| 90 |
+
def put_face_back(
    orig_img: np.ndarray,
    processed_faces: list[np.ndarray],
    masks: list[np.ndarray],
    matrices: list[np.ndarray],
):
    """
    Warp each processed face back onto the original `orig_img`
    using the inverse of the transformation matrices.

    Returns a uint8 image of the same shape as `orig_img`.
    """
    result = orig_img.copy()
    h, w = orig_img.shape[:2]

    for i in range(len(processed_faces)):
        # Invert the 3×3 similarity matrix; keep the affine 2×3 part.
        invM = np.linalg.inv(matrices[i])[0:2]
        warped = cv2.warpAffine(processed_faces[i], invM, (w, h), borderValue=0.0)
        mask = cv2.warpAffine(masks[i], invM, (w, h), borderValue=0.0)
        # Masks were warped from a 255-white canvas; // 255 yields {0, 1}.
        # NOTE(review): interpolation produces intermediate values at the
        # edges; // 255 maps anything below 255 to 0, slightly shrinking
        # the mask border — confirm this is acceptable.
        binary_mask = (mask // 255).astype(np.uint8)

        # Composite: result = result * (1 - mask) + warped * mask
        result = result * (1 - binary_mask)
        result = result.astype(np.uint8)
        result = result + warped * binary_mask

    return result
|
| 115 |
+
|
| 116 |
+
|
| 117 |
+
# ----------------------------
|
| 118 |
+
# 2. GENERATOR ARCHITECTURE
|
| 119 |
+
# ----------------------------
|
| 120 |
+
|
| 121 |
+
def squeeze_excite_block(x, ratio=4):
    """
    Squeeze-and-Excitation block: channel-wise attention.
    `ratio` controls the bottleneck reduction of the excitation MLP.
    """
    residual = x
    channel_axis = 1 if K.image_data_format() == "channels_first" else -1
    n_channels = residual.shape[channel_axis]

    # Squeeze: global spatial average per channel.
    attention = GlobalAveragePooling2D()(residual)
    attention = Reshape((1, 1, n_channels))(attention)
    # Excite: bottleneck MLP ending in a per-channel sigmoid gate.
    attention = Dense(n_channels // ratio, activation="relu",
                      kernel_initializer="he_normal", use_bias=False)(attention)
    attention = Dense(n_channels, activation="sigmoid",
                      kernel_initializer="he_normal", use_bias=False)(attention)
    return multiply([residual, attention])
|
| 135 |
+
|
| 136 |
+
|
| 137 |
+
def conv2d(layer_input, filters, f_size=4, bn=True, se=False):
    """
    Downsampling block: strided Conv2D → LeakyReLU → (InstanceNorm) → (SE block).
    Halves the spatial resolution (strides=2).
    """
    out = Conv2D(filters, kernel_size=f_size, strides=2, padding="same")(layer_input)
    out = LeakyReLU(alpha=0.2)(out)
    if bn:
        out = InstanceNormalization()(out)
    if se:
        out = squeeze_excite_block(out)
    return out
|
| 148 |
+
|
| 149 |
+
|
| 150 |
+
def atrous(layer_input, filters, f_size=4, bn=True):
    """
    Atrous (dilated) convolution block: parallel branches with dilation
    rates 2, 4 and 8, concatenated then activated.
    """
    branches = [
        Conv2D(filters, f_size, dilation_rate=rate, padding="same")(layer_input)
        for rate in [2, 4, 8]
    ]
    merged = Concatenate()(branches)
    merged = LeakyReLU(alpha=0.2)(merged)
    if bn:
        merged = InstanceNormalization()(merged)
    return merged
|
| 163 |
+
|
| 164 |
+
|
| 165 |
+
def deconv2d(layer_input, skip_input, filters, f_size=4, dropout_rate=0):
    """
    Upsampling block: UpSampling2D → Conv2D → (Dropout) → InstanceNorm
    → concatenate with the encoder skip connection.
    """
    up = UpSampling2D(size=2)(layer_input)
    up = Conv2D(filters, kernel_size=f_size, strides=1, padding="same", activation="relu")(up)
    if dropout_rate:
        up = Dropout(dropout_rate)(up)
    up = InstanceNormalization()(up)
    return Concatenate()([up, skip_input])
|
| 176 |
+
|
| 177 |
+
|
| 178 |
+
def build_generator():
    """
    Reconstruct the generator architecture exactly as in the notebook,
    then return a Keras Model object.

    U-Net-style encoder/decoder: SE attention on the shallow encoder
    stages, an atrous (dilated) bottleneck, skip connections on the way
    up, and a tanh output in [-1, 1] for a 256×256×3 input.
    """
    d0 = Input(shape=(256, 256, 3))
    gf = 64  # base filter count, doubled at deeper stages

    # Downsampling (each conv2d halves the resolution)
    d1 = conv2d(d0, gf, bn=False, se=True)
    d2 = conv2d(d1, gf * 2, se=True)
    d3 = conv2d(d2, gf * 4, se=True)
    d4 = conv2d(d3, gf * 8)
    d5 = conv2d(d4, gf * 8)

    # Atrous block (bottleneck with enlarged receptive field)
    a1 = atrous(d5, gf * 8)

    # Upsampling with encoder skip connections
    u3 = deconv2d(a1, d4, gf * 8)
    u4 = deconv2d(u3, d3, gf * 4)
    u5 = deconv2d(u4, d2, gf * 2)
    u6 = deconv2d(u5, d1, gf)

    # Final upsample + conv back to 3 channels
    u7 = UpSampling2D(size=2)(u6)
    output_img = Conv2D(3, kernel_size=4, strides=1, padding="same", activation="tanh")(u7)

    model = Model(d0, output_img)
    return model
|
| 208 |
+
|
| 209 |
+
|
| 210 |
+
# ----------------------------
# 3. LOAD MODEL WEIGHTS
# ----------------------------

HF_REPO_ID = "VanNguyen1214/baldhead"
HF_FILENAME = "model_G_5_170.hdf5"
# Use .get() so a missing env var does not raise KeyError at import time;
# hf_hub_download accepts token=None (sufficient for public repos).
HF_TOKEN = os.environ.get("HUGGINGFACEHUB_API_TOKEN")

def load_generator_from_hub():
    """
    Download the .hdf5 weights from HF Hub into cache,
    rebuild the generator, then load weights.

    Returns the ready-to-use Keras generator model.
    """
    local_path = hf_hub_download(repo_id=HF_REPO_ID, filename=HF_FILENAME, token=HF_TOKEN)
    gen = build_generator()
    gen.load_weights(local_path)
    return gen
|
| 227 |
+
|
| 228 |
+
# Load once at startup so every request reuses the same generator instance.
try:
    GENERATOR = load_generator_from_hub()
    print(f"[INFO] Loaded generator weights from {HF_REPO_ID}/{HF_FILENAME}")
except Exception as e:
    # Broad catch on purpose: a failed download/weight load must not crash
    # the app at import time; inference() degrades to a no-op passthrough.
    print("[ERROR] Could not load generator:", e)
    GENERATOR = None
|
| 235 |
+
|
| 236 |
+
|
| 237 |
+
# ----------------------------
|
| 238 |
+
# 4. INFERENCE FUNCTION
|
| 239 |
+
# ----------------------------
|
| 240 |
+
|
| 241 |
+
def inference(image: Image.Image) -> Image.Image:
    """
    Gradio-compatible inference function:
    - Convert PIL→ numpy RGB
    - Align faces
    - For each face: normalize to [-1,1], run through generator, denormalize to uint8
    - Put processed faces back onto original image
    - Return full-image PIL

    Returns the input unchanged when the model is unavailable or no face
    is detected.
    """
    # Degrade gracefully if the generator failed to load at startup.
    if GENERATOR is None:
        return image

    orig = np.array(image.convert("RGB"))

    faces, masks, mats = align_face(orig)
    if len(faces) == 0:
        return image

    processed_faces = []
    for face in faces:
        face_input = face.astype(np.float32)
        face_input = (face_input / 127.5) - 1.0  # scale to [-1,1]
        face_input = np.expand_dims(face_input, axis=0)  # (1,256,256,3)

        pred = GENERATOR.predict(face_input)[0]  # (256,256,3) in [-1,1]
        # Denormalize back to uint8 pixel range.
        pred = ((pred + 1.0) * 127.5).astype(np.uint8)
        processed_faces.append(pred)

    output_np = put_face_back(orig, processed_faces, masks, mats)
    output_pil = Image.fromarray(output_np)

    return output_pil
|
bbox_utils.py
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import numpy as np
|
| 2 |
+
from PIL import Image
|
| 3 |
+
|
| 4 |
+
def get_bbox_from_alpha(rgba: Image.Image):
    """
    Bounding box (x1, y1, x2, y2) of the non-transparent pixels of an
    RGBA image, or None when the image is fully transparent.
    """
    alpha_channel = np.asarray(rgba)[..., 3]
    rows, cols = np.nonzero(alpha_channel > 0)
    if rows.size == 0:
        return None
    return cols.min(), rows.min(), cols.max(), rows.max()
|
| 13 |
+
|
| 14 |
+
def paste_with_alpha(bg: np.ndarray, src: np.ndarray, offset: tuple[int,int]) -> Image.Image:
    """
    Paste RGBA `src` onto `bg` at `offset` (x, y), copying only pixels
    whose alpha > 0. Works on a copy of `bg`; returns a PIL Image.
    """
    res = bg.copy()
    x, y = offset
    h, w = src.shape[:2]
    # Clamp the paste rectangle to the background bounds.
    x1, y1 = max(x,0), max(y,0)
    x2 = min(x+w, bg.shape[1])
    y2 = min(y+h, bg.shape[0])
    if x1>=x2 or y1>=y2:
        # Source lies entirely outside the background — nothing to paste.
        return Image.fromarray(res)
    # Matching crops of the source and destination regions.
    cs = src[y1-y:y2-y, x1-x:x2-x]
    cd = res[y1:y2, x1:x2]
    # Opaque-pixel mask from the source alpha channel.
    mask = cs[...,3]>0
    if cd.shape[2]==3:
        # RGB background: drop the alpha channel from the copied pixels.
        cd[mask] = cs[mask][..., :3]
    else:
        cd[mask] = cs[mask]
    res[y1:y2, x1:x2] = cd
    return Image.fromarray(res)
|
detect_face.py
ADDED
|
@@ -0,0 +1,93 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# model.py
|
| 2 |
+
|
| 3 |
+
import os
|
| 4 |
+
import sys
|
| 5 |
+
import torch
|
| 6 |
+
import torch.nn as nn
|
| 7 |
+
import torchvision
|
| 8 |
+
from torchvision import transforms
|
| 9 |
+
from huggingface_hub import hf_hub_download
|
| 10 |
+
from PIL import Image
|
| 11 |
+
import numpy as np
|
| 12 |
+
|
| 13 |
+
# --- Cấu hình chung ---
|
| 14 |
+
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
|
| 15 |
+
HF_REPO = "VanNguyen1214/detect_faceshape" # repo của bạn trên HF Hub
|
| 16 |
+
HF_FILENAME = "best_model.pth" # file ở root của repo
|
| 17 |
+
LOCAL_CKPT = "models/best_model.pth" # sẽ lưu tại đây
|
| 18 |
+
CLASS_NAMES = ['Heart', 'Oblong', 'Oval', 'Round', 'Square']
|
| 19 |
+
NUM_CLASSES = len(CLASS_NAMES)
|
| 20 |
+
|
| 21 |
+
# --- Transform cho ảnh trước inference ---
|
| 22 |
+
_TRANSFORM = transforms.Compose([
|
| 23 |
+
transforms.Resize((224, 224)),
|
| 24 |
+
transforms.ToTensor(),
|
| 25 |
+
transforms.Normalize(mean=[0.485, 0.456, 0.406],
|
| 26 |
+
std =[0.229, 0.224, 0.225]),
|
| 27 |
+
])
|
| 28 |
+
|
| 29 |
+
def _ensure_checkpoint() -> str:
    """
    Return a local checkpoint path.

    Reuses LOCAL_CKPT when it already exists; otherwise downloads
    best_model.pth from HF_REPO into ./models/. Exits the process when
    the download fails (the classifier is required at import time).
    """
    if os.path.exists(LOCAL_CKPT):
        return LOCAL_CKPT

    try:
        return hf_hub_download(
            repo_id=HF_REPO,
            filename=HF_FILENAME,
            local_dir="models",
        )
    except Exception as e:
        print(f"❌ Không tải được model từ HF Hub: {e}")
        sys.exit(1)
|
| 47 |
+
|
| 48 |
+
def _load_model(ckpt_path: str) -> torch.nn.Module:
    """
    Recreate the EfficientNet-B4 architecture, load the state_dict from
    `ckpt_path`, and return the model on DEVICE in eval mode.
    """
    # 1) Instantiate EfficientNet-B4 (no pretrained weights; ours load below).
    # NOTE(review): `pretrained=` is deprecated in newer torchvision in favor
    # of `weights=` — confirm the pinned torchvision version accepts it.
    model = torchvision.models.efficientnet_b4(pretrained=False)
    in_features = model.classifier[1].in_features
    # Replace the stock head with a NUM_CLASSES-way classifier.
    model.classifier = nn.Sequential(
        nn.Dropout(p=0.3, inplace=True),
        nn.Linear(in_features, NUM_CLASSES)
    )

    # 2) Load the trained weights.
    state = torch.load(ckpt_path, map_location=DEVICE)
    model.load_state_dict(state)

    # 3) Switch to evaluation mode.
    return model.to(DEVICE).eval()
|
| 66 |
+
|
| 67 |
+
# === Build model ngay khi import ===
|
| 68 |
+
_CKPT_PATH = _ensure_checkpoint()
|
| 69 |
+
_MODEL = _load_model(_CKPT_PATH)
|
| 70 |
+
|
| 71 |
+
def predict(image: Image.Image) -> dict:
    """
    Classify the face shape of a PIL image.

    Returns:
        {
            "predicted_class": str,                    # one of CLASS_NAMES
            "confidence": float,                       # probability of the winner
            "probabilities": { class_name: prob, ... } # full distribution
        }

    Fix: the original returned only "predicted_class" although this
    docstring promised the confidence and probability keys; they are
    restored here (backward compatible — existing callers keep working).
    """
    # Convert to RGB and apply the eval transform.
    img = image.convert("RGB")
    x = _TRANSFORM(img).unsqueeze(0).to(DEVICE)

    # Inference without gradient tracking.
    with torch.no_grad():
        logits = _MODEL(x)
        probs = torch.softmax(logits, dim=1).squeeze().cpu().numpy()

    idx = int(probs.argmax())
    return {
        "predicted_class": CLASS_NAMES[idx],
        "confidence": float(probs[idx]),
        "probabilities": {name: float(p) for name, p in zip(CLASS_NAMES, probs)},
    }
|
| 93 |
+
|
example_wigs/Heart/HH02.png
ADDED
|
Git LFS Details
|
example_wigs/Heart/HH03.png
ADDED
|
Git LFS Details
|
example_wigs/Heart/Loire.png
ADDED
|
Git LFS Details
|
example_wigs/Heart/SantaRossa.png
ADDED
|
Git LFS Details
|
example_wigs/Heart/Tuscany.png
ADDED
|
Git LFS Details
|
example_wigs/Oblong/HH01.png
ADDED
|
Git LFS Details
|
example_wigs/Oblong/HH02.png
ADDED
|
Git LFS Details
|
example_wigs/Oblong/HH03.png
ADDED
|
Git LFS Details
|
example_wigs/Oblong/HH07.png
ADDED
|
Git LFS Details
|
example_wigs/Oblong/Loire.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Alsace.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Barossa.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Burgundy.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/HH01.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/HH02.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/HH03.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/HH07.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Loire.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Napa.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Piemonte.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Rhone.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/SantaRossa.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Sonoma.png
ADDED
|
Git LFS Details
|
example_wigs/Oval/Tuscany.png
ADDED
|
Git LFS Details
|
example_wigs/Round/Loire.png
ADDED
|
Git LFS Details
|
example_wigs/Round/Piemonte.png
ADDED
|
Git LFS Details
|
example_wigs/Round/Sonoma.png
ADDED
|
Git LFS Details
|
example_wigs/Round/Tuscany.png
ADDED
|
Git LFS Details
|
example_wigs/Square/HH03.png
ADDED
|
Git LFS Details
|
example_wigs/Square/Loire.png
ADDED
|
Git LFS Details
|
example_wigs/Square/Piemonte.png
ADDED
|
Git LFS Details
|
example_wigs/Square/Sonoma.png
ADDED
|
Git LFS Details
|
example_wigs/Square/Tuscany.png
ADDED
|
Git LFS Details
|
overlay.py
ADDED
|
@@ -0,0 +1,89 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import numpy as np
from PIL import Image
import mediapipe as mp

from baldhead import inference  # removes the hair from the background head ("balds" it)
from segmentation import extract_hair

# MediaPipe Face Detection: model_selection=1 selects the full-range model
# (better for faces further from the camera); detections scoring below 0.5
# confidence are discarded.
mp_fd = mp.solutions.face_detection.FaceDetection(model_selection=1,
                                                  min_detection_confidence=0.5)
+
|
| 12 |
+
def get_face_bbox(img: Image.Image) -> tuple[int,int,int,int] | None:
    """Detect the first face in *img* and return its pixel bounding box.

    Returns (x1, y1, x2, y2) clamped to the image bounds, or None when no
    face is detected.
    """
    arr = np.array(img.convert("RGB"))
    res = mp_fd.process(arr)
    if not res.detections:
        return None
    d = res.detections[0].location_data.relative_bounding_box
    h, w = arr.shape[:2]
    # MediaPipe returns *relative* coordinates that may fall slightly outside
    # [0, 1]; clamp so the returned box always lies within the image, which
    # keeps downstream array slicing safe.
    x1 = max(0, int(d.xmin * w))
    y1 = max(0, int(d.ymin * h))
    x2 = min(w, x1 + int(d.width * w))
    y2 = min(h, y1 + int(d.height * h))
    return x1, y1, x2, y2
|
| 24 |
+
|
| 25 |
+
def compute_scale(w_bg, h_bg, w_src, h_src) -> float:
    """Mean of the width and height ratios between background and source boxes."""
    width_ratio = w_bg / w_src
    height_ratio = h_bg / h_src
    return 0.5 * (width_ratio + height_ratio)
|
| 27 |
+
|
| 28 |
+
def compute_offset(bbox_bg, bbox_src, scale) -> tuple[int,int]:
    """Translation (dx, dy) that aligns the scaled source face centre with
    the background face centre."""
    bx1, by1, bx2, by2 = bbox_bg
    sx1, sy1, sx2, sy2 = bbox_src
    # Background bbox centre (integer arithmetic, matching // semantics).
    bg_centre_x = bx1 + (bx2 - bx1) // 2
    bg_centre_y = by1 + (by2 - by1) // 2
    # Source bbox centre, expressed in post-scaling pixel coordinates.
    src_centre_x = int((sx1 + (sx2 - sx1) // 2) * scale)
    src_centre_y = int((sy1 + (sy2 - sy1) // 2) * scale)
    return bg_centre_x - src_centre_x, bg_centre_y - src_centre_y
|
| 36 |
+
|
| 37 |
+
def paste_with_alpha(bg: np.ndarray, src: np.ndarray, offset: tuple[int,int]) -> Image.Image:
    """Paste RGBA *src* onto *bg* at *offset* using a hard alpha mask.

    Pixels with alpha == 0 are skipped; any alpha > 0 is treated as fully
    opaque (no blending of partial transparency). Parts of *src* that fall
    outside *bg* are clipped. *bg* may be RGB or RGBA.
    """
    res = bg.copy()
    x, y = offset
    h, w = src.shape[:2]
    # Intersection of the source rectangle with the background canvas.
    x1, y1 = max(x,0), max(y,0)
    x2 = min(x+w, bg.shape[1])
    y2 = min(y+h, bg.shape[0])
    if x1>=x2 or y1>=y2:
        # No overlap at all - return the untouched copy.
        return Image.fromarray(res)
    # Matching crops: source shifted into its own coordinate frame, and the
    # destination view (a view into res, so writes below land in res too).
    cs = src[y1-y:y2-y, x1-x:x2-x]
    cd = res[y1:y2, x1:x2]
    mask = cs[...,3] > 0
    if cd.shape[2] == 3:
        # RGB destination: drop the source alpha channel when copying.
        cd[mask] = cs[mask][...,:3]
    else:
        cd[mask] = cs[mask]
    res[y1:y2, x1:x2] = cd
    return Image.fromarray(res)
|
| 55 |
+
|
| 56 |
+
def overlay_source(background: Image.Image, source: Image.Image):
    """Overlay the hair from *source* onto a bald version of *background*.

    Returns a (result_image, message) pair. On failure result_image is None
    and the message describes the problem. The original returned a bare image
    on success while the error branches returned 2-tuples, which broke any
    caller that unpacked the result; the success path now returns a tuple too.
    """
    # 1) detect bboxes
    bbox_bg = get_face_bbox(background)
    bbox_src = get_face_bbox(source)
    if bbox_bg is None:
        return None, "❌ No face in background."
    if bbox_src is None:
        return None, "❌ No face in source."

    # 2) compute scale & resize source so the two faces match in size
    w_bg, h_bg = bbox_bg[2]-bbox_bg[0], bbox_bg[3]-bbox_bg[1]
    w_src, h_src = bbox_src[2]-bbox_src[0], bbox_src[3]-bbox_src[1]
    scale = compute_scale(w_bg, h_bg, w_src, h_src)
    src_scaled = source.resize(
        (int(source.width*scale), int(source.height*scale)),
        Image.Resampling.LANCZOS
    )

    # 3) compute offset that aligns the face centres
    offset = compute_offset(bbox_bg, bbox_src, scale)

    # 4) remove hair from the background head
    bg_bald = inference(background)

    # 5) extract hair-only layer from the scaled source
    hair_only = extract_hair(src_scaled)

    # 6) paste the hair onto the bald background
    result = paste_with_alpha(
        np.array(bg_bald.convert("RGBA")),
        np.array(hair_only),
        offset
    )
    return result, "✅ Overlay complete."
|
requirements.txt
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
--extra-index-url https://download.pytorch.org/whl/cu118  # pip index option (extra package index for CUDA wheels), not a package
|
| 2 |
+
# spaces # Dòng này không rõ ràng là một gói, có thể là ghi chú. Nếu không phải gói, hãy xóa đi.
|
| 3 |
+
huggingface_hub>=0.20.3
|
| 4 |
+
numpy==1.23.5
|
| 5 |
+
transformers==4.30.0
|
| 6 |
+
opencv-python-headless==4.7.0.72
|
| 7 |
+
onnx==1.14.0
|
| 8 |
+
insightface==0.7.3
|
| 9 |
+
psutil==5.9.5
|
| 10 |
+
tk==0.1.0 # Lưu ý: tk thường được bao gồm trong bản cài đặt Python chuẩn, không phải lúc nào cũng cần cài qua pip.
|
| 11 |
+
customtkinter==5.1.3
|
| 12 |
+
pillow==9.5.0
|
| 13 |
+
torch==2.0.1+cu118; sys_platform != 'darwin'
|
| 14 |
+
torch==2.0.1; sys_platform == 'darwin'
|
| 15 |
+
torchvision==0.15.2+cu118; sys_platform != 'darwin'
|
| 16 |
+
torchvision==0.15.2; sys_platform == 'darwin'
|
| 17 |
+
# onnxruntime==1.15.0; # Bỏ comment cho dòng này nếu bạn muốn cố định phiên bản cho mọi OS
|
| 18 |
+
# sys_platform == 'darwin' and platform_machine != 'arm64' # Comment
|
| 19 |
+
onnxruntime-silicon==1.13.1; sys_platform == 'darwin' and platform_machine == 'arm64'
|
| 20 |
+
onnxruntime-gpu==1.15.0; sys_platform != 'darwin' # Nên giữ lại dòng này cho non-darwin GPU
|
| 21 |
+
onnxruntime==1.15.0; sys_platform == 'darwin' and platform_machine != 'arm64' # Thêm lại dòng onnxruntime cho Mac Intel
|
| 22 |
+
tensorflow==2.12.0
|
| 23 |
+
# sys_platform != 'darwin' # Comment
|
| 24 |
+
opennsfw2==0.10.2
|
| 25 |
+
# protobuf==4.23.2 # Thay thế dòng này
|
| 26 |
+
protobuf==4.25.3 # *** THAY ĐỔI QUAN TRỌNG ***
|
| 27 |
+
tqdm==4.65.0
|
| 28 |
+
gfpgan==1.3.8
|
| 29 |
+
# torch # Dòng này không cần thiết vì torch đã được định nghĩa ở trên với phiên bản cụ thể.
|
| 30 |
+
|
| 31 |
+
# Thêm các thư viện mới cần thiết cho app.py đã cập nhật
|
| 32 |
+
scikit-image>=0.19 # Hoặc một phiên bản cụ thể hơn nếu bạn muốn, ví dụ: scikit-image==0.19.3
|
| 33 |
+
mediapipe==0.10.14 # *** THÊM MỚI HOẶC CẬP NHẬT *** (Phiên bản này yêu cầu protobuf >=4.25.3)
|
| 34 |
+
git+https://github.com/keras-team/keras-contrib.git
|
| 35 |
+
retina-face==0.0.13
|
roop/__init__.py
ADDED
|
File without changes
|
roop/capturer.py
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from typing import Any
|
| 2 |
+
import cv2
|
| 3 |
+
|
| 4 |
+
|
| 5 |
+
def get_video_frame(video_path: str, frame_number: int = 0) -> Any:
    """Return a single decoded frame from *video_path*, or None on failure.

    *frame_number* is treated as 1-based (matching the original call sites).
    """
    capture = cv2.VideoCapture(video_path)
    frame_total = capture.get(cv2.CAP_PROP_FRAME_COUNT)
    # Clamp to a valid zero-based frame index. The original expression
    # min(frame_total, frame_number - 1) could seek to -1 (for the default
    # frame_number=0) or to frame_total, one past the last valid frame.
    capture.set(cv2.CAP_PROP_POS_FRAMES, max(min(frame_number - 1, frame_total - 1), 0))
    has_frame, frame = capture.read()
    capture.release()
    if has_frame:
        return frame
    return None
|
| 14 |
+
|
| 15 |
+
|
| 16 |
+
def get_video_frame_total(video_path: str) -> int:
    """Number of frames OpenCV reports for the video at *video_path*."""
    capture = cv2.VideoCapture(video_path)
    frame_count = capture.get(cv2.CAP_PROP_FRAME_COUNT)
    capture.release()
    return int(frame_count)
|
roop/core.py
ADDED
|
@@ -0,0 +1,217 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#!/usr/bin/env python3

import os
import sys
# single thread doubles cuda performance - needs to be set before torch import
if any(arg.startswith('--execution-provider') for arg in sys.argv):
    os.environ['OMP_NUM_THREADS'] = '1'
# reduce tensorflow log level
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'
import warnings
from typing import List
import platform
import signal
import shutil
import argparse
import torch
import onnxruntime
import tensorflow

import roop.globals
import roop.metadata
import roop.ui as ui
from roop.predicter import predict_image, predict_video
from roop.processors.frame.core import get_frame_processors_modules
from roop.utilities import has_image_extension, is_image, is_video, detect_fps, create_video, extract_frames, get_temp_frame_paths, restore_audio, create_temp, move_temp, clean_temp, normalize_output_path

# NOTE(review): `del torch` only removes this module's binding; the module
# remains imported and importable elsewhere. Also, execution_providers is
# normally empty at import time (it is filled in by parse_args), so this
# branch may never fire - confirm intended behavior.
if 'ROCMExecutionProvider' in roop.globals.execution_providers:
    del torch

warnings.filterwarnings('ignore', category=FutureWarning, module='insightface')
warnings.filterwarnings('ignore', category=UserWarning, module='torchvision')
|
| 32 |
+
|
| 33 |
+
|
| 34 |
+
def parse_args() -> None:
    """Parse CLI arguments into the shared roop.globals configuration.

    Also installs a SIGINT handler so Ctrl+C cleans up temp files via destroy().
    """
    signal.signal(signal.SIGINT, lambda signal_number, frame: destroy())
    program = argparse.ArgumentParser(formatter_class=lambda prog: argparse.HelpFormatter(prog, max_help_position=100))
    program.add_argument('-s', '--source', help='select an source image', dest='source_path')
    program.add_argument('-t', '--target', help='select an target image or video', dest='target_path')
    program.add_argument('-o', '--output', help='select output file or directory', dest='output_path')
    program.add_argument('--frame-processor', help='frame processors (choices: face_swapper, face_enhancer, ...)', dest='frame_processor', default=['face_swapper'], nargs='+')
    program.add_argument('--keep-fps', help='keep original fps', dest='keep_fps', action='store_true', default=False)
    # NOTE(review): store_true combined with default=True means this flag can
    # never be disabled from the command line - confirm that is intended.
    program.add_argument('--keep-audio', help='keep original audio', dest='keep_audio', action='store_true', default=True)
    program.add_argument('--keep-frames', help='keep temporary frames', dest='keep_frames', action='store_true', default=False)
    program.add_argument('--many-faces', help='process every face', dest='many_faces', action='store_true', default=False)
    program.add_argument('--video-encoder', help='adjust output video encoder', dest='video_encoder', default='libx264', choices=['libx264', 'libx265', 'libvpx-vp9'])
    program.add_argument('--video-quality', help='adjust output video quality', dest='video_quality', type=int, default=18, choices=range(52), metavar='[0-51]')
    program.add_argument('--max-memory', help='maximum amount of RAM in GB', dest='max_memory', type=int, default=suggest_max_memory())
    program.add_argument('--execution-provider', help='available execution provider (choices: cpu, ...)', dest='execution_provider', default=['cpu'], choices=suggest_execution_providers(), nargs='+')
    program.add_argument('--execution-threads', help='number of execution threads', dest='execution_threads', type=int, default=suggest_execution_threads())
    program.add_argument('-v', '--version', action='version', version=f'{roop.metadata.name} {roop.metadata.version}')

    args = program.parse_args()

    roop.globals.source_path = args.source_path
    roop.globals.target_path = args.target_path
    roop.globals.output_path = normalize_output_path(roop.globals.source_path, roop.globals.target_path, args.output_path)
    roop.globals.frame_processors = args.frame_processor
    # Headless when any path was passed on the CLI. Note this stores a truthy
    # string (or None) rather than a strict bool.
    roop.globals.headless = args.source_path or args.target_path or args.output_path
    roop.globals.keep_fps = args.keep_fps
    roop.globals.keep_audio = args.keep_audio
    roop.globals.keep_frames = args.keep_frames
    roop.globals.many_faces = args.many_faces
    roop.globals.video_encoder = args.video_encoder
    roop.globals.video_quality = args.video_quality
    roop.globals.max_memory = args.max_memory
    roop.globals.execution_providers = decode_execution_providers(args.execution_provider)
    roop.globals.execution_threads = args.execution_threads
|
| 68 |
+
|
| 69 |
+
|
| 70 |
+
def encode_execution_providers(execution_providers: List[str]) -> List[str]:
    """Map onnxruntime provider names to short lowercase aliases
    (e.g. 'CUDAExecutionProvider' -> 'cuda')."""
    encoded = []
    for provider in execution_providers:
        encoded.append(provider.replace('ExecutionProvider', '').lower())
    return encoded
|
| 72 |
+
|
| 73 |
+
|
| 74 |
+
def decode_execution_providers(execution_providers: List[str]) -> List[str]:
    """Translate short aliases (e.g. 'cuda') back to the full onnxruntime
    provider names that are actually available on this machine."""
    # Query the available providers once instead of twice (the original
    # called onnxruntime.get_available_providers() in both zip arguments).
    available = onnxruntime.get_available_providers()
    return [provider for provider, encoded_execution_provider in zip(available, encode_execution_providers(available))
            if any(execution_provider in encoded_execution_provider for execution_provider in execution_providers)]
|
| 77 |
+
|
| 78 |
+
|
| 79 |
+
def suggest_max_memory() -> int:
    """Default RAM cap in GB: a conservative 4 on macOS, 16 elsewhere."""
    return 4 if platform.system().lower() == 'darwin' else 16
|
| 83 |
+
|
| 84 |
+
|
| 85 |
+
def suggest_execution_providers() -> List[str]:
    """Short lowercase aliases for every provider onnxruntime exposes here."""
    available = onnxruntime.get_available_providers()
    return encode_execution_providers(available)
|
| 87 |
+
|
| 88 |
+
|
| 89 |
+
def suggest_execution_threads() -> int:
    """Default worker-thread count: 1 for DirectML/ROCm providers, else 8."""
    single_thread_providers = ('DmlExecutionProvider', 'ROCMExecutionProvider')
    if any(p in roop.globals.execution_providers for p in single_thread_providers):
        return 1
    return 8
|
| 95 |
+
|
| 96 |
+
|
| 97 |
+
def limit_resources() -> None:
    """Cap GPU memory (TensorFlow) and process memory for this run."""
    # prevent tensorflow memory leak: pin each GPU to a 1 GiB virtual device
    gpus = tensorflow.config.experimental.list_physical_devices('GPU')
    for gpu in gpus:
        tensorflow.config.experimental.set_virtual_device_configuration(gpu, [
            tensorflow.config.experimental.VirtualDeviceConfiguration(memory_limit=1024)
        ])
    # limit memory usage
    if roop.globals.max_memory:
        memory = roop.globals.max_memory * 1024 ** 3
        if platform.system().lower() == 'darwin':
            # NOTE(review): 1024 ** 6 is inconsistent with the GB-to-bytes
            # conversion above (1024 ** 3); confirm the unit setrlimit expects
            # on macOS before changing it.
            memory = roop.globals.max_memory * 1024 ** 6
        if platform.system().lower() == 'windows':
            import ctypes
            kernel32 = ctypes.windll.kernel32
            kernel32.SetProcessWorkingSetSize(-1, ctypes.c_size_t(memory), ctypes.c_size_t(memory))
        else:
            import resource
            resource.setrlimit(resource.RLIMIT_DATA, (memory, memory))
|
| 116 |
+
|
| 117 |
+
|
| 118 |
+
def release_resources() -> None:
    """Free cached CUDA memory when running on the CUDA provider."""
    using_cuda = 'CUDAExecutionProvider' in roop.globals.execution_providers
    if using_cuda:
        torch.cuda.empty_cache()
|
| 121 |
+
|
| 122 |
+
|
| 123 |
+
def pre_check() -> bool:
    """Validate runtime prerequisites: Python >= 3.9 and ffmpeg on PATH."""
    if sys.version_info < (3, 9):
        update_status('Python version is not supported - please upgrade to 3.9 or higher.')
        return False
    if shutil.which('ffmpeg') is None:
        update_status('ffmpeg is not installed.')
        return False
    return True
|
| 131 |
+
|
| 132 |
+
|
| 133 |
+
def update_status(message: str, scope: str = 'ROOP.CORE') -> None:
    """Print a scoped status line and mirror it to the UI unless headless."""
    print(f'[{scope}] {message}')
    if roop.globals.headless:
        return
    ui.update_status(message)
|
| 137 |
+
|
| 138 |
+
|
| 139 |
+
def start() -> None:
    """Run the full processing pipeline for the configured source/target.

    Image targets are processed in place on a copy of the target; video
    targets are exploded into frames, processed, re-encoded and (optionally)
    re-muxed with the original audio. NSFW targets abort via destroy().
    """
    for frame_processor in get_frame_processors_modules(roop.globals.frame_processors):
        if not frame_processor.pre_start():
            return
    # process image to image
    if has_image_extension(roop.globals.target_path):
        if predict_image(roop.globals.target_path):
            # NSFW gate: destroy() exits the process.
            destroy()
        shutil.copy2(roop.globals.target_path, roop.globals.output_path)
        for frame_processor in get_frame_processors_modules(roop.globals.frame_processors):
            for frame_processor_name in roop.globals.frame_processors:
                # NOTE(review): this compares against frame_processor.frame_name
                # but status uses frame_processor.NAME - confirm both attributes
                # exist on every processor module.
                if frame_processor_name == frame_processor.frame_name:
                    update_status('Progressing...', frame_processor.NAME)
                    frame_processor.process_image(roop.globals.source_path, roop.globals.output_path, roop.globals.output_path)
                    frame_processor.post_process()
        release_resources()
        if is_image(roop.globals.target_path):
            update_status('Processing to image succeed!')
        else:
            update_status('Processing to image failed!')
        return
    # process image to videos
    if predict_video(roop.globals.target_path):
        destroy()
    update_status('Creating temp resources...')
    create_temp(roop.globals.target_path)
    update_status('Extracting frames...')
    extract_frames(roop.globals.target_path)
    temp_frame_paths = get_temp_frame_paths(roop.globals.target_path)
    for frame_processor in get_frame_processors_modules(roop.globals.frame_processors):
        update_status('Progressing...', frame_processor.NAME)
        frame_processor.process_video(roop.globals.source_path, temp_frame_paths)
        frame_processor.post_process()
        release_resources()
    # handles fps
    if roop.globals.keep_fps:
        update_status('Detecting fps...')
        fps = detect_fps(roop.globals.target_path)
        update_status(f'Creating video with {fps} fps...')
        create_video(roop.globals.target_path, fps)
    else:
        update_status('Creating video with 30.0 fps...')
        create_video(roop.globals.target_path)
    # handle audio
    if roop.globals.keep_audio:
        if roop.globals.keep_fps:
            update_status('Restoring audio...')
        else:
            update_status('Restoring audio might cause issues as fps are not kept...')
        restore_audio(roop.globals.target_path, roop.globals.output_path)
    else:
        move_temp(roop.globals.target_path, roop.globals.output_path)
    # clean and validate
    clean_temp(roop.globals.target_path)
    if is_video(roop.globals.target_path):
        update_status('Processing to video succeed!')
    else:
        update_status('Processing to video failed!')
|
| 197 |
+
|
| 198 |
+
|
| 199 |
+
def destroy() -> None:
    """Remove temp artifacts (when a target is set) and exit the process."""
    target = roop.globals.target_path
    if target:
        clean_temp(target)
    quit()
|
| 203 |
+
|
| 204 |
+
|
| 205 |
+
def run() -> None:
    """Entry point: parse CLI args, validate, then run headless or with the UI."""
    parse_args()
    if not pre_check():
        return
    for frame_processor in get_frame_processors_modules(roop.globals.frame_processors):
        if not frame_processor.pre_check():
            return
    limit_resources()
    if roop.globals.headless:
        start()
        return
    window = ui.init(start, destroy)
    window.mainloop()
|
roop/face_analyser.py
ADDED
|
@@ -0,0 +1,124 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import threading
from typing import Any
import insightface
import numpy as np
from PIL import Image

import roop.globals
from roop.typing import Frame

# Lazily-created singleton analyser (see get_face_analyser); THREAD_LOCK
# keeps its one-time initialisation thread-safe.
FACE_ANALYSER = None
THREAD_LOCK = threading.Lock()
|
| 12 |
+
|
| 13 |
+
|
| 14 |
+
def get_face_analyser() -> Any:
    """Return the shared insightface FaceAnalysis instance, creating it once.

    Initialisation is guarded by THREAD_LOCK so concurrent callers cannot
    build two analysers; uses the 'buffalo_l' model pack with a 640x640
    detector and the globally configured execution providers.
    """
    global FACE_ANALYSER

    with THREAD_LOCK:
        if FACE_ANALYSER is None:
            FACE_ANALYSER = insightface.app.FaceAnalysis(name='buffalo_l', providers=roop.globals.execution_providers)
            FACE_ANALYSER.prepare(ctx_id=0, det_size=(640, 640))
    return FACE_ANALYSER
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
def get_precise_face_mask(frame: Frame) -> Any:
    """
    Get precise face mask using advanced segmentation (same as detect_face_and_forehead_no_hair).
    Returns both InsightFace detection and precise mask.

    Returns a dict with keys 'precise_mask' (segmentation mask or None),
    'insightface_faces' (list of detections) and 'has_face' (bool). Any
    failure in the precise path falls back to plain InsightFace detection.
    """
    try:
        # Import the precise detection function
        import sys
        import os
        # Make the repository root importable so the top-level `segmentation`
        # module can be found from inside the roop package.
        sys.path.append(os.path.dirname(os.path.dirname(__file__)))
        from segmentation import detect_face_and_forehead_no_hair

        # Convert frame to PIL Image
        if isinstance(frame, np.ndarray):
            pil_image = Image.fromarray(frame)
        else:
            pil_image = frame

        # Get precise face mask (clean skin only)
        precise_mask = detect_face_and_forehead_no_hair(pil_image)

        # Also get InsightFace detection for face swapping compatibility
        insightface_faces = get_face_analyser().get(frame)

        return {
            'precise_mask': precise_mask,
            'insightface_faces': insightface_faces,
            'has_face': precise_mask.sum() > 0 and len(insightface_faces) > 0
        }

    except Exception as e:
        # Broad catch is deliberate: the precise path is best-effort and any
        # failure (import error, segmentation error) degrades gracefully.
        print(f"Precise face detection failed: {e}")
        # Fallback to regular InsightFace
        insightface_faces = get_face_analyser().get(frame)
        return {
            'precise_mask': None,
            'insightface_faces': insightface_faces,
            'has_face': len(insightface_faces) > 0
        }
|
| 63 |
+
|
| 64 |
+
|
| 65 |
+
def get_one_face(frame: Frame) -> Any:
    """
    Get one face with enhanced precision detection.

    Prefers the precise-segmentation path (attaching the mask to the
    InsightFace detection as `.precise_mask`); falls back to plain
    InsightFace on failure. Returns the leftmost detected face, or None.
    """
    # Get precise detection info
    face_info = get_precise_face_mask(frame)

    if face_info['has_face'] and face_info['insightface_faces']:
        try:
            # Select face (leftmost) for compatibility
            selected_face = min(face_info['insightface_faces'], key=lambda x: x.bbox[0])

            # Add precise mask info to face object
            if face_info['precise_mask'] is not None:
                selected_face.precise_mask = face_info['precise_mask']
                print(f"✅ Enhanced face detection: {face_info['precise_mask'].sum()} precise pixels")

            return selected_face
        except (ValueError, IndexError):
            return None

    # Fallback to original method
    face = get_face_analyser().get(frame)
    try:
        # min() raises ValueError on an empty detection list.
        selected_face = min(face, key=lambda x: x.bbox[0])
        return selected_face
    except ValueError:
        return None
|
| 93 |
+
|
| 94 |
+
|
| 95 |
+
def get_many_faces(frame: Frame) -> Any:
    """
    Get many faces with enhanced precision detection.

    Returns the list of InsightFace detections (each annotated with the
    shared precise mask when one is available), or None when detection fails.
    """
    # Get precise detection info
    face_info = get_precise_face_mask(frame)

    if face_info['has_face'] and face_info['insightface_faces']:
        faces = face_info['insightface_faces']

        # Add precise mask info to all face objects
        if face_info['precise_mask'] is not None:
            for face in faces:
                face.precise_mask = face_info['precise_mask']

        print(f"✅ Enhanced multi-face detection: {len(faces)} faces with precise masks")
        return faces

    # Fallback to original method
    try:
        # NOTE(review): FaceAnalysis.get is not documented to raise
        # IndexError - confirm which call this guard was meant to protect.
        return get_face_analyser().get(frame)
    except IndexError:
        return None
|
| 118 |
+
|
| 119 |
+
|
| 120 |
+
def has_precise_face_mask(face_obj) -> bool:
    """Return True when *face_obj* carries a non-None `precise_mask` attribute."""
    mask = getattr(face_obj, 'precise_mask', None)
    return mask is not None
|
roop/globals.py
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from typing import List

# Runtime configuration shared across roop modules; populated by
# roop.core.parse_args() before processing starts.
source_path = None  # path to the source (face) image
target_path = None  # path to the target image or video
output_path = None  # normalized output file or directory
frame_processors: List[str] = []  # e.g. ['face_swapper', 'face_enhancer']
keep_fps = None  # keep the target's original fps
keep_audio = None  # restore the target's audio track after processing
keep_frames = None  # keep extracted temp frames on disk
many_faces = None  # process every detected face, not just one
video_encoder = None  # ffmpeg encoder: libx264 / libx265 / libvpx-vp9
video_quality = None  # ffmpeg quality value in [0-51]
max_memory = None  # RAM cap in GB (see roop.core.limit_resources)
execution_providers: List[str] = []  # onnxruntime execution providers
execution_threads = None  # worker thread count
headless = None  # truthy when running without the UI
log_level = 'error'
|
roop/metadata.py
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Package identity, used for the CLI --version output in roop.core.
name = 'roop'
version = '1.1.0'
|
roop/predicter.py
ADDED
|
@@ -0,0 +1,25 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import numpy
import opennsfw2
from PIL import Image

from roop.typing import Frame

# NSFW probability threshold: content scoring above this is rejected.
MAX_PROBABILITY = 0.85
|
| 8 |
+
|
| 9 |
+
|
| 10 |
+
# Cache the NSFW model so repeated frame checks do not rebuild it per call
# (the original constructed a fresh model on every invocation).
_NSFW_MODEL = None


def predict_frame(target_frame: Frame) -> bool:
    """Return True when *target_frame* scores above the NSFW threshold."""
    global _NSFW_MODEL
    if _NSFW_MODEL is None:
        _NSFW_MODEL = opennsfw2.make_open_nsfw_model()
    image = Image.fromarray(target_frame)
    image = opennsfw2.preprocess_image(image, opennsfw2.Preprocessing.YAHOO)
    views = numpy.expand_dims(image, axis=0)
    # Model output is (sfw, nsfw) per view; take the NSFW probability.
    _, probability = _NSFW_MODEL.predict(views)[0]
    return probability > MAX_PROBABILITY
|
| 17 |
+
|
| 18 |
+
|
| 19 |
+
def predict_image(target_path: str) -> bool:
    """True when the image at *target_path* scores above the NSFW threshold."""
    probability = opennsfw2.predict_image(target_path)
    return probability > MAX_PROBABILITY
|
| 21 |
+
|
| 22 |
+
|
| 23 |
+
def predict_video(target_path: str) -> bool:
    """Sample every 100th frame; flag the video if any sample is NSFW."""
    _, probabilities = opennsfw2.predict_video_frames(video_path=target_path, frame_interval=100)
    for probability in probabilities:
        if probability > MAX_PROBABILITY:
            return True
    return False
|
roop/processors/__init__.py
ADDED
|
File without changes
|
roop/processors/frame/__init__.py
ADDED
|
File without changes
|