File size: 25,068 Bytes
9ac2526
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
import os
import uuid
import time
from dataclasses import dataclass
from typing import Any, Dict, List, Optional, Tuple

import gradio as gr
import numpy as np
from PIL import Image, ImageDraw, ImageFont


APP_NAME = "FaceSwap AI"
DEFAULT_REMOTE_SPACE_ID = os.getenv("REMOTE_SPACE_ID", "felixrosberg/face-swap")
HF_TOKEN = os.getenv("HF_TOKEN") or os.getenv("HUGGINGFACEHUB_API_TOKEN")

OUTPUT_DIR = os.path.join(os.path.dirname(__file__), "outputs")
EXAMPLES_DIR = os.path.join(os.path.dirname(__file__), "assets", "examples")
MODELS_DIR = os.path.join(os.path.dirname(__file__), "models")


@dataclass
class SwapResult:
    output_path: str
    share_url: str
    error: Optional[str] = None


def _ensure_dirs() -> None:
    os.makedirs(OUTPUT_DIR, exist_ok=True)
    os.makedirs(EXAMPLES_DIR, exist_ok=True)
    os.makedirs(MODELS_DIR, exist_ok=True)


def _pil_from_any(img: Any) -> Image.Image:
    if img is None:
        raise ValueError("No image provided.")
    if isinstance(img, Image.Image):
        return img.convert("RGB")
    if isinstance(img, np.ndarray):
        if img.ndim == 2:
            return Image.fromarray(img).convert("RGB")
        if img.ndim == 3:
            return Image.fromarray(img[:, :, :3]).convert("RGB")
    if isinstance(img, str) and os.path.exists(img):
        return Image.open(img).convert("RGB")
    raise ValueError("Unsupported image format.")


def _save_temp_upload(img: Image.Image, prefix: str) -> str:
    _ensure_dirs()
    fp = os.path.join(OUTPUT_DIR, f"{prefix}_{uuid.uuid4().hex}.png")
    img.save(fp, format="PNG")
    return fp


def _detect_faces_haar(pil_img: Image.Image) -> int:
    """
    Lightweight face detection for user-friendly errors.
    This is not used for swapping; only for "No face detected" messaging.
    """
    try:
        import cv2  # lazy import

        cv_img = cv2.cvtColor(np.array(pil_img), cv2.COLOR_RGB2BGR)
        gray = cv2.cvtColor(cv_img, cv2.COLOR_BGR2GRAY)
        cascade = cv2.CascadeClassifier(
            os.path.join(cv2.data.haarcascades, "haarcascade_frontalface_default.xml")
        )
        faces = cascade.detectMultiScale(gray, scaleFactor=1.1, minNeighbors=5, minSize=(60, 60))
        return int(len(faces))
    except Exception:
        # If OpenCV isn't available for any reason, skip the pre-check.
        return 1


def _onnx_providers() -> List[str]:
    """
    Best-effort provider selection for ONNXRuntime / InsightFace.
    Set `FORCE_CPU=1` to disable CUDA even if available.
    """
    force_cpu = os.getenv("FORCE_CPU", "").strip().lower() in {"1", "true", "yes", "y"}
    if force_cpu:
        return ["CPUExecutionProvider"]

    try:
        import onnxruntime as ort  # type: ignore

        available = set(ort.get_available_providers())
        if "CUDAExecutionProvider" in available:
            return ["CUDAExecutionProvider", "CPUExecutionProvider"]
    except Exception:
        pass

    return ["CPUExecutionProvider"]


def _ensure_inswapper_onnx() -> str:
    """
    Ensures `inswapper_128.onnx` exists locally and returns its path.

    You can override with:
      - `INSWAPPER_ONNX_PATH` (absolute/relative path)
      - `INSWAPPER_REPO_ID` and `INSWAPPER_FILENAME` for HF download
    """
    override = os.getenv("INSWAPPER_ONNX_PATH", "").strip()
    if override:
        p = override
        if not os.path.isabs(p):
            p = os.path.join(os.path.dirname(__file__), p)
        if not os.path.exists(p):
            raise FileNotFoundError(f"INSWAPPER_ONNX_PATH not found: {p}")
        return p

    _ensure_dirs()
    local_path = os.path.join(MODELS_DIR, "inswapper_128.onnx")
    if os.path.exists(local_path):
        return local_path

    # Default to a small community HF repo that hosts the file.
    repo_id = os.getenv("INSWAPPER_REPO_ID", "ezioruan/inswapper_128.onnx").strip()
    filename = os.getenv("INSWAPPER_FILENAME", "inswapper_128.onnx").strip()

    try:
        from huggingface_hub import hf_hub_download  # type: ignore

        downloaded = hf_hub_download(
            repo_id=repo_id,
            filename=filename,
            token=HF_TOKEN,
        )
        # Copy to our local models dir so users can find it easily.
        # (Avoid importing shutil at module import time.)
        import shutil

        shutil.copyfile(downloaded, local_path)
        return local_path
    except Exception as e:
        raise RuntimeError(
            "Could not download inswapper ONNX model.\n"
            f"- Tried repo `{repo_id}` file `{filename}`\n"
            f"- You can also set `INSWAPPER_ONNX_PATH` to a local file.\n"
            f"Error: {e}"
        )


_IFACE_ANALYZER = None
_IFACE_SWAPPER = None


def _load_local_faceswap_models():
    """
    Lazy-load InsightFace analyzer + inswapper ONNX swapper.
    Returns (analyzer, swapper).
    """
    global _IFACE_ANALYZER, _IFACE_SWAPPER
    if _IFACE_ANALYZER is not None and _IFACE_SWAPPER is not None:
        return _IFACE_ANALYZER, _IFACE_SWAPPER

    try:
        import insightface  # type: ignore
        from insightface.app import FaceAnalysis  # type: ignore
    except Exception as e:
        raise RuntimeError(
            "Missing dependency for local live swap. Install `insightface`.\n"
            f"Error: {e}"
        )

    providers = _onnx_providers()
    # buffalo_l includes detection + recognition (needed to build embeddings for swapper).
    analyzer = FaceAnalysis(name="buffalo_l", providers=providers)
    analyzer.prepare(ctx_id=0 if providers[0] != "CPUExecutionProvider" else -1, det_size=(640, 640))

    onnx_path = _ensure_inswapper_onnx()
    swapper = insightface.model_zoo.get_model(onnx_path, providers=providers)

    _IFACE_ANALYZER, _IFACE_SWAPPER = analyzer, swapper
    return analyzer, swapper


def _largest_face(faces: List[Any]) -> Optional[Any]:
    if not faces:
        return None
    best = None
    best_area = -1
    for f in faces:
        try:
            x1, y1, x2, y2 = f.bbox.astype(int).tolist()
            area = max(0, x2 - x1) * max(0, y2 - y1)
        except Exception:
            area = -1
        if area > best_area:
            best_area = area
            best = f
    return best


def _np_rgb_to_bgr(img: np.ndarray) -> np.ndarray:
    # Gradio gives RGB; InsightFace expects BGR.
    if img is None:
        raise ValueError("No image provided.")
    if img.ndim != 3 or img.shape[2] < 3:
        raise ValueError("Expected a 3-channel color image.")

    rgb = img[:, :, :3]
    if rgb.dtype != np.uint8:
        # Gradio can emit float images (0..1 or 0..255). Normalize to uint8.
        mx = float(np.max(rgb)) if rgb.size else 255.0
        if mx <= 1.5:
            rgb = np.clip(rgb, 0.0, 1.0) * 255.0
        else:
            rgb = np.clip(rgb, 0.0, 255.0)
        rgb = rgb.astype(np.uint8)

    return rgb[:, :, ::-1].copy()


def _np_bgr_to_rgb(img: np.ndarray) -> np.ndarray:
    if img is None:
        raise ValueError("No image provided.")
    if img.ndim != 3 or img.shape[2] < 3:
        return img
    return img[:, :, :3][:, :, ::-1].copy()


def _watermark(pil_img: Image.Image, text: str = "FaceSwap AI • demo") -> Image.Image:
    img = pil_img.copy().convert("RGBA")
    w, h = img.size

    overlay = Image.new("RGBA", img.size, (0, 0, 0, 0))
    draw = ImageDraw.Draw(overlay)

    # Try a default font; fall back to PIL bitmap font.
    font_size = max(14, int(min(w, h) * 0.03))
    try:
        font = ImageFont.truetype("DejaVuSans.ttf", font_size)
    except Exception:
        font = ImageFont.load_default()

    padding = max(10, int(font_size * 0.6))
    tw, th = draw.textbbox((0, 0), text, font=font)[2:]
    x = w - tw - padding
    y = h - th - padding

    # Semi-transparent background pill
    bg_pad = max(6, int(font_size * 0.5))
    draw.rounded_rectangle(
        (x - bg_pad, y - bg_pad, x + tw + bg_pad, y + th + bg_pad),
        radius=max(6, int(font_size * 0.6)),
        fill=(0, 0, 0, 110),
    )
    draw.text((x, y), text, font=font, fill=(255, 255, 255, 220))

    return Image.alpha_composite(img, overlay).convert("RGB")


def _host_base_url() -> str:
    # HF Spaces commonly provide one of these.
    for k in ("SPACE_HOST", "HOST", "GRADIO_SERVER_NAME"):
        v = os.getenv(k)
        if v and v.startswith("http"):
            return v.rstrip("/")

    space_id = os.getenv("SPACE_ID")
    if space_id:
        return f"https://{space_id.replace('/', '-')}.hf.space"
    return ""


def _make_share_url(local_file_path: str) -> str:
    # Gradio will serve returned file paths via its /file=... mechanism.
    # We keep a friendly full URL for copy/paste when hosted.
    base = _host_base_url()
    if not base:
        return ""
    # When returning a file to a component, Gradio rewrites it; but a direct
    # "file=" URL is still useful for HF Spaces in many cases.
    rel = os.path.relpath(local_file_path, os.path.dirname(__file__)).replace("\\", "/")
    return f"{base}/file={rel}"


def _call_remote_space(
    source_pil: Image.Image,
    target_pil: Image.Image,
    *,
    defense_ratio: int,
    blend_ratio: int,
    options: List[str],
    remote_space_id: str,
) -> Image.Image:
    """
    Calls a remote Gradio Space as the "cloud inference" backend.
    Default backend: felixrosberg/face-swap (FaceDancer).
    """
    from gradio_client import Client, handle_file  # type: ignore

    client = Client(remote_space_id, token=HF_TOKEN)

    # Save uploads to disk so we can pass them via handle_file
    src_path = _save_temp_upload(source_pil, "source")
    trg_path = _save_temp_upload(target_pil, "target")

    # FaceDancer Space signature (from its app.py):
    # run_inference(target, source, defense_ratio, merge_ratio, options)
    out = client.predict(
        handle_file(trg_path),
        handle_file(src_path),
        int(defense_ratio),
        int(blend_ratio),
        options,
        api_name="/run_inference",
    )

    return _pil_from_any(out)


def _call_custom_endpoint(
    source_pil: Image.Image,
    target_pil: Image.Image,
    *,
    strength: float,
    steps: int,
    guidance: float,
) -> Image.Image:
    """
    Optional BYO endpoint mode.
    Contract: POST $HF_INFERENCE_ENDPOINT_URL with multipart form:
      - source: image file
      - target: image file
      - strength: float
      - steps: int
      - guidance: float
    Returns: image bytes (PNG/JPEG) in response body.
    """
    import requests

    url = os.getenv("HF_INFERENCE_ENDPOINT_URL", "").strip()
    if not url:
        raise ValueError("Custom endpoint URL is not set.")

    src_bytes = _pil_to_png_bytes(source_pil)
    trg_bytes = _pil_to_png_bytes(target_pil)
    files = {
        "source": ("source.png", src_bytes, "image/png"),
        "target": ("target.png", trg_bytes, "image/png"),
    }
    data = {"strength": str(strength), "steps": str(int(steps)), "guidance": str(guidance)}
    headers = {}
    token = os.getenv("HF_ENDPOINT_TOKEN") or HF_TOKEN
    if token:
        headers["Authorization"] = f"Bearer {token}"

    resp = requests.post(url, files=files, data=data, headers=headers, timeout=180)
    if resp.status_code >= 400:
        raise RuntimeError(f"Endpoint error {resp.status_code}: {resp.text[:300]}")
    return Image.open(_bytes_io(resp.content)).convert("RGB")


def _bytes_io(b: bytes):
    import io

    return io.BytesIO(b)


def _pil_to_png_bytes(img: Image.Image) -> bytes:
    import io

    buf = io.BytesIO()
    img.save(buf, format="PNG")
    return buf.getvalue()


def _download_example_images() -> List[Tuple[str, str]]:
    """
    Downloads a couple of lightweight example images on first run.
    Returned list is (source_path, target_path) pairs.
    """
    import requests

    _ensure_dirs()
    examples: List[Tuple[str, str]] = []

    # Public domain / permissive sample images (Wikimedia).
    # We keep them small-ish to stay friendly for Spaces.
    pairs = [
        (
            "https://upload.wikimedia.org/wikipedia/commons/thumb/3/37/Face_of_a_young_woman.jpg/512px-Face_of_a_young_woman.jpg",
            "https://upload.wikimedia.org/wikipedia/commons/thumb/0/0b/Barack_Obama.jpg/512px-Barack_Obama.jpg",
        ),
        (
            "https://upload.wikimedia.org/wikipedia/commons/thumb/5/50/Vd-Orig.png/512px-Vd-Orig.png",
            "https://upload.wikimedia.org/wikipedia/commons/thumb/8/8d/Portrait_Placeholder.png/512px-Portrait_Placeholder.png",
        ),
    ]

    def fetch(url: str, out_path: str) -> None:
        if os.path.exists(out_path):
            return
        r = requests.get(url, timeout=60)
        r.raise_for_status()
        with open(out_path, "wb") as f:
            f.write(r.content)

    for i, (src_url, trg_url) in enumerate(pairs, start=1):
        src_path = os.path.join(EXAMPLES_DIR, f"source_{i}.jpg")
        trg_path = os.path.join(EXAMPLES_DIR, f"target_{i}.jpg")
        try:
            fetch(src_url, src_path)
            fetch(trg_url, trg_path)
            examples.append((src_path, trg_path))
        except Exception:
            # If network is restricted, examples will just be absent.
            continue

    return examples


def swap_faces(
    source_img: Any,
    target_img: Any,
    consent_ok: bool,
    strength: float,
    steps: int,
    guidance: float,
    backend: str,
    history: List[Dict[str, str]],
) -> Tuple[Any, Any, Any, List[Dict[str, str]], str]:
    if not consent_ok:
        return None, None, None, history, "Please confirm you have consent to swap faces."

    try:
        src = _pil_from_any(source_img)
        trg = _pil_from_any(target_img)
    except Exception as e:
        return None, None, None, history, str(e)

    # Pre-check for better errors
    if _detect_faces_haar(src) < 1:
        return None, None, None, history, "No face detected in Source Face."
    if _detect_faces_haar(trg) < 1:
        return None, None, None, history, "No face detected in Target Photo."

    try:
        t0 = time.time()
        if backend == "Cloud (FaceDancer Space)":
            # Map our UX knobs to the backend's available inputs.
            # - strength -> blend_ratio (0..100)
            # - steps/guidance don't exist here; we keep them for BYO endpoint.
            out = _call_remote_space(
                src,
                trg,
                defense_ratio=100,
                blend_ratio=int(np.clip(strength * 100, 0, 100)),
                options=[],
                remote_space_id=DEFAULT_REMOTE_SPACE_ID,
            )
        else:
            out = _call_custom_endpoint(src, trg, strength=strength, steps=steps, guidance=guidance)

        out = _watermark(out)

        _ensure_dirs()
        out_path = os.path.join(OUTPUT_DIR, f"faceswap_{uuid.uuid4().hex}.png")
        out.save(out_path, format="PNG")

        share = _make_share_url(out_path)
        elapsed = time.time() - t0

        history = [{"result": out_path, "source": _save_temp_upload(src, "src"), "target": _save_temp_upload(trg, "trg")}][
            :1
        ] + history
        history = history[:12]

        status = f"Done in {elapsed:.1f}s."
        if share:
            status += f" Share link: {share}"
        return trg, out, out_path, history, status
    except Exception as e:
        msg = str(e)
        if "Could not find Space" in msg or "404" in msg:
            msg = (
                "Cloud backend unavailable. Try again, or configure a custom endpoint. "
                "See README for deployment options."
            )
        return None, None, None, history, msg


CSS = """
.fsai-wrap { max-width: 1200px; margin: 0 auto; }
.fsai-hero { font-size: 28px; font-weight: 700; margin: 8px 0 4px; }
.fsai-sub { opacity: 0.8; margin-top: 0; }
.fsai-warn { border: 1px solid rgba(255,255,255,0.12); border-radius: 12px; padding: 12px 14px; }
@media (prefers-color-scheme: dark) {
  .fsai-warn { background: rgba(255,255,255,0.04); }
}
@media (prefers-color-scheme: light) {
  .fsai-warn { background: rgba(0,0,0,0.03); }
}
"""


def build_demo() -> gr.Blocks:
    _ensure_dirs()
    examples = _download_example_images()

    theme = gr.themes.Soft(primary_hue="violet", neutral_hue="slate")

    with gr.Blocks(theme=theme, css=CSS, title=APP_NAME) as demo:
        gr.HTML(
            f"""
            <div class="fsai-wrap">
              <div class="fsai-hero">{APP_NAME}</div>
              <p class="fsai-sub">Swap faces in photos (cloud) or live webcam (local ONNX). Use only with consent.</p>
            </div>
            """
        )

        with gr.Tabs():
            with gr.Tab("Photo Swap (Cloud)"):
                with gr.Accordion("Consent & Safety (required)", open=True):
                    gr.Markdown(
                        """
                        **Important:** Only upload photos you own or have explicit permission to edit.

                        - **Consent**: You confirm you have consent from any person depicted.
                        - **No misuse**: Do not use for harassment, impersonation, fraud, or sexual content.
                        - **Watermark**: Outputs are watermarked to discourage misuse.
                        """
                    )
                    consent = gr.Checkbox(label="I confirm I have consent and will use this responsibly.")

                with gr.Row():
                    with gr.Column(scale=1):
                        source = gr.Image(label="Source Face", type="pil", height=320)
                    with gr.Column(scale=1):
                        target = gr.Image(label="Target Photo", type="pil", height=320)

                with gr.Row():
                    backend = gr.Radio(
                        choices=["Cloud (FaceDancer Space)", "Custom Endpoint (HF Inference Endpoint / your API)"],
                        value="Cloud (FaceDancer Space)",
                        label="Inference backend",
                    )

                with gr.Accordion("Advanced options", open=False):
                    strength = gr.Slider(
                        0.0,
                        1.0,
                        value=0.8,
                        step=0.05,
                        label="Swap strength",
                        info="Higher = stronger identity transfer. (Cloud backend maps this to blend ratio.)",
                    )
                    steps = gr.Slider(
                        10, 60, value=30, step=1, label="Steps", info="Used by Custom Endpoint backends."
                    )
                    guidance = gr.Slider(
                        1.0,
                        10.0,
                        value=4.5,
                        step=0.5,
                        label="Guidance scale",
                        info="Used by Custom Endpoint backends.",
                    )

                swap_btn = gr.Button("Swap Faces", variant="primary", size="lg")
                status = gr.Markdown(value="", elem_classes=["fsai-wrap"])

                with gr.Row():
                    before = gr.Image(label="Before (Target)", type="pil", height=360)
                    after = gr.Image(label="After (Result)", type="pil", height=360)

                with gr.Row():
                    download = gr.File(label="Download result", file_types=[".png"])

                history_state = gr.State([])  # list[dict] with paths
                gallery = gr.Gallery(label="History (this session)", columns=4, height=260, preview=True)

                def _history_to_gallery(items: List[Dict[str, str]]) -> List[str]:
                    return [it["result"] for it in items if "result" in it and os.path.exists(it["result"])]

                def _swap_and_gallery(*args):
                    b, a, f, hist, msg = swap_faces(*args)
                    return b, a, f, hist, _history_to_gallery(hist), msg

                swap_btn.click(
                    _swap_and_gallery,
                    inputs=[source, target, consent, strength, steps, guidance, backend, history_state],
                    outputs=[before, after, download, history_state, gallery, status],
                )

                if examples:
                    gr.Examples(
                        examples=examples,
                        inputs=[source, target],
                        label="Examples",
                        examples_per_page=4,
                    )

                with gr.Accordion("Setup notes", open=False):
                    gr.Markdown(
                        f"""
                        **Default cloud backend:** `{DEFAULT_REMOTE_SPACE_ID}` via Gradio Spaces API.

                        To use a custom backend, set:
                        - `HF_INFERENCE_ENDPOINT_URL` (your endpoint URL)
                        - optional `HF_ENDPOINT_TOKEN` (Bearer token)

                        See `README.md` for a 5-minute deploy guide.
                        """
                    )

            with gr.Tab("Live Swap (Local ONNX)"):
                gr.Markdown(
                    """
                    Upload a **source face** — it **locks automatically** (with consent checked) so the **webcam**
                    shows the swap **in real time**. You can use **Re-lock** if you change the photo.
                    This runs locally using **InsightFace + ONNXRuntime** with `inswapper_128.onnx`.

                    Tip: For best results, use a clear, front-facing source photo and good lighting.
                    """
                )

                live_consent = gr.Checkbox(
                    label="I confirm I have consent and will use this responsibly.",
                    value=False,
                )

                with gr.Row():
                    live_source = gr.Image(label="Source Face (identity to use)", type="numpy", height=260)
                    live_source_status = gr.Markdown(value="")

                source_face_state = gr.State(None)  # cached InsightFace Face object

                def _set_live_source(source_np: Any, consent_ok: bool):
                    if not consent_ok:
                        return None, "Please confirm consent to enable live swap."
                    if source_np is None:
                        return None, "Upload a source face image."

                    analyzer, _ = _load_local_faceswap_models()
                    src_bgr = _np_rgb_to_bgr(np.array(source_np))
                    faces = analyzer.get(src_bgr)
                    src_face = _largest_face(faces)
                    if src_face is None:
                        return None, "No face detected in source image."
                    return src_face, "Source face locked — webcam shows live swap."

                live_set_btn = gr.Button("Re-lock source face", variant="secondary")
                _live_source_inputs = [live_source, live_consent]
                _live_source_outputs = [source_face_state, live_source_status]
                live_source.change(_set_live_source, inputs=_live_source_inputs, outputs=_live_source_outputs)
                live_consent.change(_set_live_source, inputs=_live_source_inputs, outputs=_live_source_outputs)
                live_set_btn.click(_set_live_source, inputs=_live_source_inputs, outputs=_live_source_outputs)

                with gr.Row():
                    webcam = gr.Image(
                        label="Webcam",
                        sources=["webcam"],
                        streaming=True,
                        type="numpy",
                        height=420,
                    )
                    live_out = gr.Image(label="Live swapped output", type="numpy", height=420)

                live_status = gr.Markdown(value="")

                def _live_swap(frame_np: Any, src_face: Any, consent_ok: bool):
                    if not consent_ok:
                        return frame_np, "Consent not confirmed."
                    if frame_np is None:
                        return None, ""
                    if src_face is None:
                        return frame_np, "Lock a source face first."

                    analyzer, swapper = _load_local_faceswap_models()
                    frame_bgr = _np_rgb_to_bgr(np.array(frame_np))
                    faces = analyzer.get(frame_bgr)
                    tgt_face = _largest_face(faces)
                    if tgt_face is None:
                        return _np_bgr_to_rgb(frame_bgr), "No face detected in webcam frame."

                    try:
                        swapped_bgr = swapper.get(frame_bgr, tgt_face, src_face, paste_back=True)
                    except Exception as e:
                        return _np_bgr_to_rgb(frame_bgr), f"Swap error: {e}"

                    return _np_bgr_to_rgb(swapped_bgr), ""

                webcam.stream(
                    _live_swap,
                    inputs=[webcam, source_face_state, live_consent],
                    outputs=[live_out, live_status],
                )

    return demo


if __name__ == "__main__":
    build_demo().launch()