Ahmad Faris committed on
Commit
33d53d8
·
1 Parent(s): 4a763bf

remove : unused

Browse files
Files changed (1) hide show
  1. app.py +70 -364
app.py CHANGED
@@ -154,36 +154,37 @@ load_face_swapper_model()
154
 
155
 
156
  def process(
157
- input_type,
158
- image_path,
159
  video_path,
160
- directory_path,
161
  source_path,
162
- output_path,
163
- output_name,
164
- keep_output_sequence,
165
- condition,
166
- age,
167
- distance,
168
- face_enhancer_name,
169
- enable_face_parser,
170
- mask_includes,
171
- mask_soft_kernel,
172
- mask_soft_iterations,
173
- blur_amount,
174
- erode_amount,
175
- face_scale,
176
- enable_laplacian_blend,
177
- crop_top,
178
- crop_bott,
179
- crop_left,
180
- crop_right,
181
- *specifics,
182
  ):
183
  global WORKSPACE
184
  global OUTPUT_FILE
185
  global PREVIEW
 
 
 
 
 
186
  WORKSPACE, OUTPUT_FILE, PREVIEW = None, None, None
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
187
 
188
  ## ------------------------------ GUI UPDATE FUNC ------------------------------
189
 
@@ -217,8 +218,6 @@ def process(
217
 
218
  ## ------------------------------ PREPARE INPUTS & LOAD MODELS ------------------------------
219
 
220
-
221
-
222
  yield "### \n ⌛ Loading face analyser model...", *ui_before()
223
  load_face_analyser_model()
224
 
@@ -236,11 +235,7 @@ def process(
236
  yield "### \n ⌛ Loading face parsing model...", *ui_before()
237
  load_face_parser_model()
238
 
239
- includes = mask_regions_to_list(mask_includes)
240
- specifics = list(specifics)
241
- half = len(specifics) // 2
242
- sources = specifics[:half]
243
- specifics = specifics[half:]
244
  if crop_top > crop_bott:
245
  crop_top, crop_bott = crop_bott, crop_top
246
  if crop_left > crop_right:
@@ -251,10 +246,7 @@ def process(
251
  ## ------------------------------ CONTENT CHECK ------------------------------
252
  print("### \n ⌛ Analysing face data...")
253
  log_message("⌛ Analysing face data...")
254
- if condition != "Specific Face":
255
- source_data = source_path, age
256
- else:
257
- source_data = ((sources, specifics), distance)
258
  analysed_targets, analysed_sources, whole_frame_list, num_faces_per_frame = get_analysed_data(
259
  FACE_ANALYSER,
260
  image_sequence,
@@ -306,7 +298,7 @@ def process(
306
  log_message("⌛ Face-parsing mask...")
307
  masks = []
308
  count = 0
309
- for batch_mask in get_parsed_mask(FACE_PARSER, preds, classes=includes, device=device, batch_size=BATCH_SIZE, softness=int(mask_soft_iterations)):
310
  masks.append(batch_mask)
311
  EMPTY_CACHE()
312
  count += 1
@@ -374,147 +366,59 @@ def process(
374
 
375
  ## ------------------------------ IMAGE ------------------------------
376
 
377
- if input_type == "Image":
378
- target = cv2.imread(image_path)
379
- output_file = os.path.join(output_path, output_name + ".png")
380
- cv2.imwrite(output_file, target)
381
-
382
- for info_update in swap_process([output_file]):
383
- yield info_update
384
-
385
- OUTPUT_FILE = output_file
386
- WORKSPACE = output_path
387
- PREVIEW = cv2.imread(output_file)[:, :, ::-1]
388
-
389
- yield get_finsh_text(start_time), *ui_after()
390
-
391
  ## ------------------------------ VIDEO ------------------------------
392
 
393
- elif input_type == "Video":
394
- temp_path = os.path.join(output_path, output_name, "sequence")
395
- os.makedirs(temp_path, exist_ok=True)
396
-
397
- print("### \n ⌛ Extracting video frames...")
398
- log_message("⌛ Extracting video frames...")
399
- image_sequence = []
400
- cap = cv2.VideoCapture(video_path)
401
- curr_idx = 0
402
- while True:
403
- ret, frame = cap.read()
404
- if not ret:break
405
- frame_path = os.path.join(temp_path, f"frame_{curr_idx}.jpg")
406
- cv2.imwrite(frame_path, frame)
407
- image_sequence.append(frame_path)
408
- curr_idx += 1
409
- print("Curr IDX: {}".format(curr_idx))
410
- cap.release()
411
- cv2.destroyAllWindows()
412
-
413
- print("Total image sequence: {}".format(len(image_sequence)))
414
- swap_process(image_sequence)
415
- # for info_update in swap_process(image_sequence):
416
- # # print(info_update)
417
- # yield info_update, *ui_before()
418
-
419
- print("End swap_process")
420
-
421
- # yield "### \n ⌛ Merging sequence...", *ui_before()
422
- print("### \n ⌛ Merging sequence...")
423
- log_message("⌛ Merging sequence...")
424
- output_video_path = os.path.join(output_path, output_name + ".mp4")
425
- merge_img_sequence_from_ref(video_path, image_sequence, output_video_path)
426
-
427
- if os.path.exists(temp_path) and not keep_output_sequence:
428
- print("### \n ⌛ Removing temporary files...")
429
- print("⌛ Removing temporary files...")
430
- shutil.rmtree(temp_path)
431
-
432
- WORKSPACE = output_path
433
- OUTPUT_FILE = output_video_path
434
- log_result(OUTPUT_FILE)
435
-
436
- gr.update(value=OUTPUT_FILE, visible=True)
437
-
438
- yield get_finsh_text(start_time), *ui_after_vid()
439
-
440
- ## ------------------------------ DIRECTORY ------------------------------
441
-
442
- elif input_type == "Directory":
443
- extensions = ["jpg", "jpeg", "png", "bmp", "tiff", "ico", "webp"]
444
- temp_path = os.path.join(output_path, output_name)
445
- if os.path.exists(temp_path):
446
- shutil.rmtree(temp_path)
447
- os.mkdir(temp_path)
448
 
449
- file_paths =[]
450
- for file_path in glob.glob(os.path.join(directory_path, "*")):
451
- if any(file_path.lower().endswith(ext) for ext in extensions):
452
- img = cv2.imread(file_path)
453
- new_file_path = os.path.join(temp_path, os.path.basename(file_path))
454
- cv2.imwrite(new_file_path, img)
455
- file_paths.append(new_file_path)
456
 
457
- for info_update in swap_process(file_paths):
458
- yield info_update
 
 
459
 
460
- PREVIEW = cv2.imread(file_paths[-1])[:, :, ::-1]
461
- WORKSPACE = temp_path
462
- OUTPUT_FILE = file_paths[-1]
463
 
464
- yield get_finsh_text(start_time), *ui_after()
465
 
466
- ## ------------------------------ STREAM ------------------------------
467
 
468
- elif input_type == "Stream":
469
- pass
470
 
471
 
472
  ## ------------------------------ GRADIO FUNC ------------------------------
473
 
474
-
475
- def update_radio(value):
476
- if value == "Image":
477
- return (
478
- gr.update(visible=True),
479
- gr.update(visible=False),
480
- gr.update(visible=False),
481
- )
482
- elif value == "Video":
483
- return (
484
- gr.update(visible=False),
485
- gr.update(visible=True),
486
- gr.update(visible=False),
487
- )
488
- elif value == "Directory":
489
- return (
490
- gr.update(visible=False),
491
- gr.update(visible=False),
492
- gr.update(visible=True),
493
- )
494
- elif value == "Stream":
495
- return (
496
- gr.update(visible=False),
497
- gr.update(visible=False),
498
- gr.update(visible=True),
499
- )
500
-
501
-
502
- def swap_option_changed(value):
503
- if value.startswith("Age"):
504
- return (
505
- gr.update(visible=True),
506
- gr.update(visible=False),
507
- gr.update(visible=True),
508
- )
509
- elif value == "Specific Face":
510
- return (
511
- gr.update(visible=False),
512
- gr.update(visible=True),
513
- gr.update(visible=False),
514
- )
515
- return gr.update(visible=False), gr.update(visible=False), gr.update(visible=True)
516
-
517
-
518
  def video_changed(video_path):
519
  sliders_update = gr.Slider.update
520
  button_update = gr.Button.update
@@ -605,161 +509,12 @@ with gr.Blocks(css=css) as interface:
605
  with gr.Row():
606
  with gr.Row():
607
  with gr.Column(scale=0.4):
608
- with gr.Tab("📄 Swap Condition"):
609
- swap_option = gr.Dropdown(
610
- swap_options_list,
611
- info="Choose which face or faces in the target image to swap.",
612
- multiselect=False,
613
- show_label=False,
614
- value=swap_options_list[0],
615
- interactive=True,
616
- )
617
- age = gr.Number(
618
- value=25, label="Value", interactive=True, visible=False
619
- )
620
-
621
- with gr.Tab("🎚️ Detection Settings"):
622
- detect_condition_dropdown = gr.Dropdown(
623
- detect_conditions,
624
- label="Condition",
625
- value=DETECT_CONDITION,
626
- interactive=True,
627
- info="This condition is only used when multiple faces are detected on source or specific image.",
628
- )
629
- detection_size = gr.Number(
630
- label="Detection Size", value=DETECT_SIZE, interactive=True
631
- )
632
- detection_threshold = gr.Number(
633
- label="Detection Threshold",
634
- value=DETECT_THRESH,
635
- interactive=True,
636
- )
637
- apply_detection_settings = gr.Button("Apply settings")
638
-
639
- with gr.Tab("📤 Output Settings"):
640
- output_directory = gr.Text(
641
- label="Output Directory",
642
- value=DEF_OUTPUT_PATH,
643
- interactive=True,
644
- )
645
- output_name = gr.Text(
646
- label="Output Name", value="Result", interactive=True
647
- )
648
- keep_output_sequence = gr.Checkbox(
649
- label="Keep output sequence", value=False, interactive=True
650
- )
651
-
652
- with gr.Tab("🪄 Other Settings"):
653
- face_scale = gr.Slider(
654
- label="Face Scale",
655
- minimum=0,
656
- maximum=2,
657
- value=1,
658
- interactive=True,
659
- )
660
-
661
- face_enhancer_name = gr.Dropdown(
662
- FACE_ENHANCER_LIST, label="Face Enhancer", value="NONE", multiselect=False, interactive=True
663
- )
664
-
665
- with gr.Accordion("Advanced Mask", open=False):
666
- enable_face_parser_mask = gr.Checkbox(
667
- label="Enable Face Parsing",
668
- value=False,
669
- interactive=True,
670
- )
671
-
672
- mask_include = gr.Dropdown(
673
- mask_regions.keys(),
674
- value=MASK_INCLUDE,
675
- multiselect=True,
676
- label="Include",
677
- interactive=True,
678
- )
679
- mask_soft_kernel = gr.Number(
680
- label="Soft Erode Kernel",
681
- value=MASK_SOFT_KERNEL,
682
- minimum=3,
683
- interactive=True,
684
- visible = False
685
- )
686
- mask_soft_iterations = gr.Number(
687
- label="Soft Erode Iterations",
688
- value=MASK_SOFT_ITERATIONS,
689
- minimum=0,
690
- interactive=True,
691
-
692
- )
693
-
694
-
695
- with gr.Accordion("Crop Mask", open=False):
696
- crop_top = gr.Slider(label="Top", minimum=0, maximum=511, value=0, step=1, interactive=True)
697
- crop_bott = gr.Slider(label="Bottom", minimum=0, maximum=511, value=511, step=1, interactive=True)
698
- crop_left = gr.Slider(label="Left", minimum=0, maximum=511, value=0, step=1, interactive=True)
699
- crop_right = gr.Slider(label="Right", minimum=0, maximum=511, value=511, step=1, interactive=True)
700
-
701
-
702
- erode_amount = gr.Slider(
703
- label="Mask Erode",
704
- minimum=0,
705
- maximum=1,
706
- value=MASK_ERODE_AMOUNT,
707
- step=0.05,
708
- interactive=True,
709
- )
710
-
711
- blur_amount = gr.Slider(
712
- label="Mask Blur",
713
- minimum=0,
714
- maximum=1,
715
- value=MASK_BLUR_AMOUNT,
716
- step=0.05,
717
- interactive=True,
718
- )
719
-
720
- enable_laplacian_blend = gr.Checkbox(
721
- label="Laplacian Blending",
722
- value=True,
723
- interactive=True,
724
- )
725
-
726
-
727
  source_image_input = gr.Image(
728
  label="Source face", type="filepath", interactive=True
729
  )
730
 
731
- with gr.Box(visible=False) as specific_face:
732
- for i in range(NUM_OF_SRC_SPECIFIC):
733
- idx = i + 1
734
- code = "\n"
735
- code += f"with gr.Tab(label='({idx})'):"
736
- code += "\n\twith gr.Row():"
737
- code += f"\n\t\tsrc{idx} = gr.Image(interactive=True, type='numpy', label='Source Face {idx}')"
738
- code += f"\n\t\ttrg{idx} = gr.Image(interactive=True, type='numpy', label='Specific Face {idx}')"
739
- exec(code)
740
-
741
- distance_slider = gr.Slider(
742
- minimum=0,
743
- maximum=2,
744
- value=0.6,
745
- interactive=True,
746
- label="Distance",
747
- info="Lower distance is more similar and higher distance is less similar to the target face.",
748
- )
749
-
750
  with gr.Group():
751
- input_type = gr.Radio(
752
- ["Image", "Video"],
753
- label="Target Type",
754
- value="Image",
755
- )
756
-
757
- with gr.Box(visible=True) as input_image_group:
758
- image_input = gr.Image(
759
- label="Target Image", interactive=True, type="filepath"
760
- )
761
-
762
- with gr.Box(visible=False) as input_video_group:
763
  vid_widget = gr.Video if USE_COLAB else gr.Text
764
  video_input = gr.Video(
765
  label="Target Video", interactive=True
@@ -804,9 +559,6 @@ with gr.Blocks(css=css) as interface:
804
  "Trim and Reload", interactive=True
805
  )
806
 
807
- with gr.Box(visible=False) as input_directory_group:
808
- direc_input = gr.Text(label="Path", interactive=True)
809
-
810
  with gr.Column(scale=0.6):
811
  info = gr.Markdown(value="...")
812
 
@@ -873,55 +625,9 @@ with gr.Blocks(css=css) as interface:
873
  show_progress=True,
874
  )
875
 
876
- input_type.change(
877
- update_radio,
878
- inputs=[input_type],
879
- outputs=[input_image_group, input_video_group, input_directory_group],
880
- )
881
- swap_option.change(
882
- swap_option_changed,
883
- inputs=[swap_option],
884
- outputs=[age, specific_face, source_image_input],
885
- )
886
-
887
- apply_detection_settings.click(
888
- analyse_settings_changed,
889
- inputs=[detect_condition_dropdown, detection_size, detection_threshold],
890
- outputs=[info],
891
- )
892
-
893
- src_specific_inputs = []
894
- gen_variable_txt = ",".join(
895
- [f"src{i+1}" for i in range(NUM_OF_SRC_SPECIFIC)]
896
- + [f"trg{i+1}" for i in range(NUM_OF_SRC_SPECIFIC)]
897
- )
898
- exec(f"src_specific_inputs = ({gen_variable_txt})")
899
  swap_inputs = [
900
- input_type,
901
- image_input,
902
  video_input,
903
- direc_input,
904
- source_image_input,
905
- output_directory,
906
- output_name,
907
- keep_output_sequence,
908
- swap_option,
909
- age,
910
- distance_slider,
911
- face_enhancer_name,
912
- enable_face_parser_mask,
913
- mask_include,
914
- mask_soft_kernel,
915
- mask_soft_iterations,
916
- blur_amount,
917
- erode_amount,
918
- face_scale,
919
- enable_laplacian_blend,
920
- crop_top,
921
- crop_bott,
922
- crop_left,
923
- crop_right,
924
- *src_specific_inputs,
925
  ]
926
 
927
  swap_outputs = [
 
154
 
155
 
156
  def process(
 
 
157
  video_path,
 
158
  source_path,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
159
  ):
160
  global WORKSPACE
161
  global OUTPUT_FILE
162
  global PREVIEW
163
+ global MASK_INCLUDE
164
+ global MASK_SOFT_ITERATIONS
165
+ global MASK_BLUR_AMOUNT
166
+ global MASK_ERODE_AMOUNT
167
+ global NUM_OF_SRC_SPECIFIC
168
  WORKSPACE, OUTPUT_FILE, PREVIEW = None, None, None
169
+
170
+ ## Hardcoded value
171
+
172
+ input_type = "Video"
173
+ output_path = "/home/user/app"
174
+ output_name = "Result"
175
+ keep_output_sequence = False
176
+ face_scale = 1.0
177
+ condition = "All Female"
178
+ age = 25
179
+ face_enhancer_name = "NONE"
180
+ enable_face_parser = True
181
+ crop_top = 0
182
+ crop_bott = 511
183
+ crop_left = 0
184
+ crop_right = 511
185
+ blur_amount = MASK_BLUR_AMOUNT
186
+ erode_amount = MASK_ERODE_AMOUNT
187
+ enable_laplacian_blend = True
188
 
189
  ## ------------------------------ GUI UPDATE FUNC ------------------------------
190
 
 
218
 
219
  ## ------------------------------ PREPARE INPUTS & LOAD MODELS ------------------------------
220
 
 
 
221
  yield "### \n ⌛ Loading face analyser model...", *ui_before()
222
  load_face_analyser_model()
223
 
 
235
  yield "### \n ⌛ Loading face parsing model...", *ui_before()
236
  load_face_parser_model()
237
 
238
+ includes = mask_regions_to_list(MASK_INCLUDE)
 
 
 
 
239
  if crop_top > crop_bott:
240
  crop_top, crop_bott = crop_bott, crop_top
241
  if crop_left > crop_right:
 
246
  ## ------------------------------ CONTENT CHECK ------------------------------
247
  print("### \n ⌛ Analysing face data...")
248
  log_message("⌛ Analysing face data...")
249
+ source_data = source_path, age
 
 
 
250
  analysed_targets, analysed_sources, whole_frame_list, num_faces_per_frame = get_analysed_data(
251
  FACE_ANALYSER,
252
  image_sequence,
 
298
  log_message("⌛ Face-parsing mask...")
299
  masks = []
300
  count = 0
301
+ for batch_mask in get_parsed_mask(FACE_PARSER, preds, classes=includes, device=device, batch_size=BATCH_SIZE, softness=int(MASK_SOFT_ITERATIONS)):
302
  masks.append(batch_mask)
303
  EMPTY_CACHE()
304
  count += 1
 
366
 
367
  ## ------------------------------ IMAGE ------------------------------
368
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
369
  ## ------------------------------ VIDEO ------------------------------
370
 
371
+ temp_path = os.path.join(output_path, output_name, "sequence")
372
+ os.makedirs(temp_path, exist_ok=True)
373
+
374
+ print("### \n ⌛ Extracting video frames...")
375
+ log_message("⌛ Extracting video frames...")
376
+ image_sequence = []
377
+ cap = cv2.VideoCapture(video_path)
378
+ curr_idx = 0
379
+ while True:
380
+ ret, frame = cap.read()
381
+ if not ret:break
382
+ frame_path = os.path.join(temp_path, f"frame_{curr_idx}.jpg")
383
+ cv2.imwrite(frame_path, frame)
384
+ image_sequence.append(frame_path)
385
+ curr_idx += 1
386
+ print("Curr IDX: {}".format(curr_idx))
387
+ cap.release()
388
+ cv2.destroyAllWindows()
389
+
390
+ print("Total image sequence: {}".format(len(image_sequence)))
391
+ swap_process(image_sequence)
392
+ # for info_update in swap_process(image_sequence):
393
+ # # print(info_update)
394
+ # yield info_update, *ui_before()
395
+
396
+ print("End swap_process")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
397
 
398
+ # yield "### \n ⌛ Merging sequence...", *ui_before()
399
+ print("### \n Merging sequence...")
400
+ log_message("⌛ Merging sequence...")
401
+ output_video_path = os.path.join(output_path, output_name + ".mp4")
402
+ merge_img_sequence_from_ref(video_path, image_sequence, output_video_path)
 
 
403
 
404
+ if os.path.exists(temp_path) and not keep_output_sequence:
405
+ print("### \n ⌛ Removing temporary files...")
406
+ print("⌛ Removing temporary files...")
407
+ shutil.rmtree(temp_path)
408
 
409
+ WORKSPACE = output_path
410
+ OUTPUT_FILE = output_video_path
411
+ log_result(OUTPUT_FILE)
412
 
413
+ gr.update(value=OUTPUT_FILE, visible=True)
414
 
415
+ yield get_finsh_text(start_time), *ui_after_vid()
416
 
417
+ ## ------------------------------ DIRECTORY ------------------------------
 
418
 
419
 
420
  ## ------------------------------ GRADIO FUNC ------------------------------
421
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
422
  def video_changed(video_path):
423
  sliders_update = gr.Slider.update
424
  button_update = gr.Button.update
 
509
  with gr.Row():
510
  with gr.Row():
511
  with gr.Column(scale=0.4):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
512
  source_image_input = gr.Image(
513
  label="Source face", type="filepath", interactive=True
514
  )
515
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
516
  with gr.Group():
517
+ with gr.Box(visible=True) as input_video_group:
 
 
 
 
 
 
 
 
 
 
 
518
  vid_widget = gr.Video if USE_COLAB else gr.Text
519
  video_input = gr.Video(
520
  label="Target Video", interactive=True
 
559
  "Trim and Reload", interactive=True
560
  )
561
 
 
 
 
562
  with gr.Column(scale=0.6):
563
  info = gr.Markdown(value="...")
564
 
 
625
  show_progress=True,
626
  )
627
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
628
  swap_inputs = [
 
 
629
  video_input,
630
+ source_image_input
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
631
  ]
632
 
633
  swap_outputs = [