Spaces:

Astridkraft
/

Stable-ControlNet-GPU

Paused

App Files Files Community

Astridkraft committed on Nov 14, 2025

Commit

e8e2118

verified ·

1 Parent(s): 3371dca

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -14

app.py CHANGED Viewed

@@ -2,7 +2,7 @@
 #und deutlich besserem Prompt-Verständnis - (Änderung Architektur).
 #Eine deutsche Alternative zur Umsetzung von Text-Bild zu Bild ist Flux - mit einer völlig anderen Architektur als SD!
 import gradio as gr
-from diffusers import StableDiffusionPipeline, StableDiffusionImg2ImgPipeline
 from diffusers import StableDiffusionInpaintPipeline
 from controlnet_module import controlnet_processor
 import torch
@@ -17,7 +17,7 @@ import random
 # === OPTIMIERTE EINSTELLUNGEN ===
 device = "cuda" if torch.cuda.is_available() else "cpu"
 torch_dtype = torch.float16 if device == "cuda" else torch.float32
-IMG_SIZE = 512
 print(f"Running on: {device}")
@@ -65,18 +65,20 @@ pipe_img2img = None
 def load_txt2img():
     global pipe_txt2img
     if pipe_txt2img is None:
-        print("Loading Text-to-Image model...")
-        pipe_txt2img = StableDiffusionPipeline.from_pretrained(
-            "runwayml/stable-diffusion-v1-5",
             torch_dtype=torch_dtype,
             use_safetensors=True,
-            safety_checker=None,
-            requires_safety_checker=False,
-            #clean_up_tokenization_spaces=False #bei der neuen Version ändert sich die Architektur, Clip wird ersetzt/erweitert/integriert. Tokenizer nicht mehr nur auf englisch, kein 77-Token Limit!
         ).to(device)
         from diffusers import DPMSolverMultistepScheduler
-        pipe_txt2img.scheduler = DPMSolverMultistepScheduler.from_config(pipe_txt2img.scheduler.config)
         pipe_txt2img.enable_attention_slicing()
     return pipe_txt2img
@@ -331,7 +333,7 @@ def img_to_image(image, prompt, neg_prompt, strength, steps, guidance_scale,
         pipe = load_img2img()  # ← deine bestehende Funktion
         # inpaint_input ist IMMER das Originalbild (laut neuer ControlNet-Logik)
-        img_resized = inpaint_input.convert("RGB").resize((IMG_SIZE, IMG_SIZE))
         adj_guidance = min(guidance_scale, 12.0)
         seed = random.randint(0, 2**32 - 1)
@@ -344,7 +346,7 @@ def img_to_image(image, prompt, neg_prompt, strength, steps, guidance_scale,
         mask = None
         if bbox_x1 and bbox_y1 and bbox_x2 and bbox_y2:
             orig_w, orig_h = image.size
-            scale_x, scale_y = IMG_SIZE / orig_w, IMG_SIZE / orig_h
             bbox_coords = [
                 int(bbox_x1 * scale_x),
                 int(bbox_y1 * scale_y),
@@ -476,7 +478,7 @@ def main_ui():
         # --- Hauptanwendungsbereich (zunächst versteckt) ---
         with gr.Column(visible=True) as content_area:
             with gr.Tab("Text zu Bild"):
-                gr.Markdown("**Beschreibe dein gewünschtes Bild (maximal 77 Token):**")
                 with gr.Row():
                     txt_input = gr.Textbox(
@@ -580,14 +582,14 @@ def main_ui():
                         img_prompt = gr.Textbox(
                             placeholder="change background to beach with palm trees, keep person unchanged, sunny day",
                             lines=2,
-                            label="Transformations-Prompt (Englisch - maximal 77 Token)",
                             info="Was soll verändert werden? Sei spezifisch."
                         )
                     with gr.Column():
                         img_neg_prompt = gr.Textbox(
                             placeholder="blurry, deformed, ugly, bad anatomy, extra limbs, poorly drawn hands",
                             lines=2,
-                            label="Negativ-Prompt (Englisch - maximal 77 Token)",
                             info="Was soll vermieden werden? Unerwünschte Elemente auflisten."
                         )

 #und deutlich besserem Prompt-Verständnis - (Änderung Architektur).
 #Eine deutsche Alternative zur Umsetzung von Text-Bild zu Bild ist Flux - mit einer völlig anderen Architektur als SD!
 import gradio as gr
+from diffusers import StableDiffusionPipeline, StableDiffusionImg2ImgPipeline, StableDiffusionXLPipeline
 from diffusers import StableDiffusionInpaintPipeline
 from controlnet_module import controlnet_processor
 import torch
 # === OPTIMIERTE EINSTELLUNGEN ===
 device = "cuda" if torch.cuda.is_available() else "cpu"
 torch_dtype = torch.float16 if device == "cuda" else torch.float32
+IMG_SIZE = 1024  # SDXL verwendet 1024x1024 statt 512x512
 print(f"Running on: {device}")
 def load_txt2img():
     global pipe_txt2img
     if pipe_txt2img is None:
+        print("Loading SDXL Text-to-Image model...")
+        pipe_txt2img = StableDiffusionXLPipeline.from_pretrained(
+            "stabilityai/stable-diffusion-xl-base-1.0",
             torch_dtype=torch_dtype,
             use_safetensors=True,
+            add_watermarker=False,
         ).to(device)
         from diffusers import DPMSolverMultistepScheduler
+        pipe_txt2img.scheduler = DPMSolverMultistepScheduler.from_config(
+            pipe_txt2img.scheduler.config,
+            use_karras_sigmas=True,  # Noch bessere Qualität
+            algorithm_type="sde-dpmsolver++"
+        )
         pipe_txt2img.enable_attention_slicing()
     return pipe_txt2img
         pipe = load_img2img()  # ← deine bestehende Funktion
         # inpaint_input ist IMMER das Originalbild (laut neuer ControlNet-Logik)
+        img_resized = inpaint_input.convert("RGB").resize((512, 512))  # Bleibt bei 512 für Inpaint
         adj_guidance = min(guidance_scale, 12.0)
         seed = random.randint(0, 2**32 - 1)
         mask = None
         if bbox_x1 and bbox_y1 and bbox_x2 and bbox_y2:
             orig_w, orig_h = image.size
+            scale_x, scale_y = 512 / orig_w, 512 / orig_h  # Skalierung für Inpaint (512px)
             bbox_coords = [
                 int(bbox_x1 * scale_x),
                 int(bbox_y1 * scale_y),
         # --- Hauptanwendungsbereich (zunächst versteckt) ---
         with gr.Column(visible=True) as content_area:
             with gr.Tab("Text zu Bild"):
+                gr.Markdown("**Beschreibe dein gewünschtes Bild:**")
                 with gr.Row():
                     txt_input = gr.Textbox(
                         img_prompt = gr.Textbox(
                             placeholder="change background to beach with palm trees, keep person unchanged, sunny day",
                             lines=2,
+                            label="Transformations-Prompt (Englisch)",
                             info="Was soll verändert werden? Sei spezifisch."
                         )
                     with gr.Column():
                         img_neg_prompt = gr.Textbox(
                             placeholder="blurry, deformed, ugly, bad anatomy, extra limbs, poorly drawn hands",
                             lines=2,
+                            label="Negativ-Prompt (Englisch)",
                             info="Was soll vermieden werden? Unerwünschte Elemente auflisten."
                         )