Spaces:

Astridkraft
/

Text-Image_to_Image

Sleeping

App Files Files Community

Astridkraft committed on Oct 27, 2025

Commit

f6548dc

verified ·

1 Parent(s): 26a123d

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -35

app.py CHANGED Viewed

@@ -1,12 +1,13 @@
 import gradio as gr
-from diffusers import StableDiffusionPipeline, StableDiffusionImg2ImgPipeline
-from diffusers import StableDiffusionInpaintPipeline
 import torch
 from PIL import Image, ImageDraw
 import time
 import os
 import tempfile
 import random
 # === OPTIMIERTE EINSTELLUNGEN ===
 device = "cuda" if torch.cuda.is_available() else "cpu"
@@ -15,7 +16,6 @@ IMG_SIZE = 512
 print(f"Running on: {device}")
 # === GESICHTSMASKEN-FUNKTIONEN ===
 def create_face_mask(image, bbox_coords):
     """Erzeugt eine Gesichtsmaske - WEIßE Bereiche werden VERÄNDERT, SCHWARZE BLEIBEN"""
@@ -38,33 +38,49 @@ def create_face_mask(image, bbox_coords):
     return mask
 def auto_detect_face_area(image):
-    """Optimierten Vorschlag für Gesichtsbereich ohne externe Bibliotheken"""
-    width, height = image.size
-    # Größere Bounding Box für bessere Abdeckung (50% statt 40%)
-    face_size = min(width, height) * 0.5
-    # Verschiebe y1 nach oben, um Stirn und Kinn besser abzudecken
-    x1 = (width - face_size) / 2
-    y1 = (height - face_size) / 4  # Höher positioniert (25% statt 33%)
-    x2 = x1 + face_size
-    y2 = y1 + face_size * 1.2  # Leicht länglicher für ovale Gesichter
-    # Stelle sicher, dass Koordinaten innerhalb des Bildes liegen
-    x1, y1 = max(0, int(x1)), max(0, int(y1))
-    x2, y2 = min(width, int(x2)), min(height, int(y2))
-    print(f"✅ Geschätzte Gesichtskoordinaten: [{x1}, {y1}, {x2}, {y2}]")
-    return [x1, y1, x2, y2]
-def auto_detect_face_area(image):
-    """Vorschlag für Gesichtsbereich"""
-    width, height = image.size
-    face_size = min(width, height) * 0.4
-    x1 = (width - face_size) / 2
-    y1 = (height - face_size) / 3
-    x2 = x1 + face_size
-    y2 = y1 + face_size
-    return [int(x1), int(y1), int(x2), int(y2)]
 # === PIPELINES ===
 pipe_txt2img = None
@@ -93,17 +109,16 @@ def load_img2img():
         print("Loading Inpainting model...")
         try:
             pipe_img2img = StableDiffusionInpaintPipeline.from_pretrained(
-                "stabilityai/stable-diffusion-2-inpainting",  # Neues Modell
                 torch_dtype=torch_dtype,
-                use_safetensors=True,  # Erzwinge .safetensors
-                allow_pickle=False,    # Verhindere unsichere Serialisierung
                 safety_checker=None
             ).to(device)
         except Exception as e:
             print(f"❌ Fehler beim Laden des Modells: {e}")
             raise
         from diffusers import DPMSolverMultistepScheduler
         pipe_img2img.scheduler = DPMSolverMultistepScheduler.from_config(
             pipe_img2img.scheduler.config,
@@ -209,7 +224,7 @@ def img_to_image(image, prompt, neg_prompt, strength, steps, guidance_scale, fac
             prompt=prompt,
             negative_prompt=neg_prompt,
             image=img_resized,
-            mask_image=mask,  # None = gesamtes Bild verändern
             strength=adj_strength,
             num_inference_steps=int(steps),
             guidance_scale=adj_guidance,

 import gradio as gr
+from diffusers import StableDiffusionPipeline, StableDiffusionInpaintPipeline
 import torch
 from PIL import Image, ImageDraw
 import time
 import os
 import tempfile
 import random
+import numpy as np  # Neu für DeepFace
+from deepface import DeepFace  # Neu für präzise Gesichtsdetektion
 # === OPTIMIERTE EINSTELLUNGEN ===
 device = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Running on: {device}")
 # === GESICHTSMASKEN-FUNKTIONEN ===
 def create_face_mask(image, bbox_coords):
     """Erzeugt eine Gesichtsmaske - WEIßE Bereiche werden VERÄNDERT, SCHWARZE BLEIBEN"""
     return mask
 def auto_detect_face_area(image):
+    """Return a face bounding box ``[x1, y1, x2, y2]`` for a PIL image.
+
+    Runs DeepFace with the RetinaFace backend and returns the largest
+    detected face, clamped to the image bounds. If detection raises, finds
+    nothing, or yields an empty box after clamping, a centred heuristic box
+    is returned instead, so the caller always gets integer pixel coordinates.
+
+    Args:
+        image: PIL image to analyse (must expose ``size`` and ``convert``).
+
+    Returns:
+        List of four ints ``[x1, y1, x2, y2]``.
+    """
+    width, height = image.size
+    try:
+        rgb_array = np.array(image.convert("RGB"))
+        # DeepFace documents NumPy input as BGR (OpenCV convention), so flip
+        # the channel axis; ascontiguousarray avoids handing a negative-stride
+        # view to the detector.
+        bgr_array = np.ascontiguousarray(rgb_array[:, :, ::-1])
+        face_objs = DeepFace.extract_faces(
+            img_path=bgr_array,
+            detector_backend="retinaface",
+            align=False,  # only the bounding box is needed, no alignment
+        )
+        if not face_objs:
+            print("⚠️ Kein Gesicht erkannt - Fallback auf grobe Schätzung")
+            return _estimate_face_area(image)
+        # Do not rely on the detector's result order: pick the largest box
+        # explicitly.
+        facial_area = max(
+            (face["facial_area"] for face in face_objs),
+            key=lambda area: area["w"] * area["h"],
+        )
+        # Clamp to the image so the mask never extends past the borders.
+        x1 = max(0, int(facial_area["x"]))
+        y1 = max(0, int(facial_area["y"]))
+        x2 = min(width, int(facial_area["x"] + facial_area["w"]))
+        y2 = min(height, int(facial_area["y"] + facial_area["h"]))
+        if x2 <= x1 or y2 <= y1:
+            # A box that collapses after clamping is unusable as a mask.
+            print("⚠️ Kein Gesicht erkannt - Fallback auf grobe Schätzung")
+            return _estimate_face_area(image)
+        print(f"✅ Gesicht erkannt: [{x1}, {y1}, {x2}, {y2}]")
+        return [x1, y1, x2, y2]
+    except Exception as e:
+        # Deliberate best-effort boundary around the third-party detector:
+        # any failure (including "no face found" errors) degrades to the
+        # heuristic box instead of aborting the request.
+        print(f"❌ Fehler bei Gesichtsdetektion: {e}")
+        return _estimate_face_area(image)
+def _estimate_face_area(image):
+    """Return a heuristic face box: a square of 40% of the shorter side,
+    horizontally centred and placed one third of the free height from the top."""
+    width, height = image.size
+    face_size = min(width, height) * 0.4
+    x1 = (width - face_size) / 2
+    y1 = (height - face_size) / 3
+    return [int(x1), int(y1), int(x1 + face_size), int(y1 + face_size)]
 # === PIPELINES ===
 pipe_txt2img = None
         print("Loading Inpainting model...")
         try:
             pipe_img2img = StableDiffusionInpaintPipeline.from_pretrained(
+                "stabilityai/stable-diffusion-2-inpainting",
                 torch_dtype=torch_dtype,
+                use_safetensors=True,
+                allow_pickle=False,
                 safety_checker=None
             ).to(device)
         except Exception as e:
             print(f"❌ Fehler beim Laden des Modells: {e}")
             raise
         from diffusers import DPMSolverMultistepScheduler
         pipe_img2img.scheduler = DPMSolverMultistepScheduler.from_config(
             pipe_img2img.scheduler.config,
             prompt=prompt,
             negative_prompt=neg_prompt,
             image=img_resized,
+            mask_image=mask,
             strength=adj_strength,
             num_inference_steps=int(steps),
             guidance_scale=adj_guidance,