X-HighVoltage-X committed on
Commit
4ad6fb2
·
verified ·
1 Parent(s): beb57ea

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +160 -104
app.py CHANGED
@@ -1,5 +1,4 @@
1
  import random
2
- from typing import List, Tuple
3
 
4
  import gradio as gr
5
  import numpy as np
@@ -7,6 +6,7 @@ import spaces
7
  import torch
8
  from diffusers import FluxFillPipeline
9
  from loras import LoRA, loras
 
10
 
11
  MAX_SEED = np.iinfo(np.int32).max
12
 
@@ -14,62 +14,129 @@ pipe = FluxFillPipeline.from_pretrained("black-forest-labs/FLUX.1-Fill-dev", tor
14
 
15
  flux_keywords_available = ["IMG_1025.HEIC", "Selfie"]
16
 
 
 
 
 
 
 
17
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
18
  def activate_loras(pipe: FluxFillPipeline, loras_with_weights: list[tuple[LoRA, float]]):
19
  adapter_names = []
20
  adapter_weights = []
21
-
22
  for lora, weight in loras_with_weights:
23
- print(f"Loading LoRA: {lora.name} with weight {weight}")
24
  pipe.load_lora_weights(lora.id, weight=weight, adapter_name=lora.name)
25
  adapter_names.append(lora.name)
26
  adapter_weights.append(weight)
27
-
28
- print(f"Activating adapters: {adapter_names} with weights {adapter_weights}")
29
  pipe.set_adapters(adapter_names, adapter_weights=adapter_weights)
30
-
31
  return pipe
32
 
33
 
34
- def get_loras() -> list[dict]:
35
- return loras
36
-
37
-
38
  def deactivate_loras(pipe):
39
- print("Unloading all LoRAs...")
40
  pipe.unload_lora_weights()
41
  return pipe
42
 
43
 
 
44
  def calculate_optimal_dimensions(image):
45
  original_width, original_height = image.size
46
- MIN_ASPECT_RATIO = 9 / 16
47
- MAX_ASPECT_RATIO = 16 / 9
48
  FIXED_DIMENSION = 1024
49
- original_aspect_ratio = original_width / original_height
50
- if original_aspect_ratio > 1:
51
- width = FIXED_DIMENSION
52
- height = round(FIXED_DIMENSION / original_aspect_ratio)
53
  else:
54
- height = FIXED_DIMENSION
55
- width = round(FIXED_DIMENSION * original_aspect_ratio)
56
- width = (width // 8) * 8
57
- height = (height // 8) * 8
58
- calculated_aspect_ratio = width / height
59
- if calculated_aspect_ratio > MAX_ASPECT_RATIO:
60
- width = int((height * MAX_ASPECT_RATIO // 8) * 8)
61
- elif calculated_aspect_ratio < MIN_ASPECT_RATIO:
62
- height = int((width / MIN_ASPECT_RATIO // 8) * 8)
63
- width = max(width, 576) if width == FIXED_DIMENSION else width
64
- height = max(height, 576) if height == FIXED_DIMENSION else height
65
-
66
- return width, height
67
-
68
-
69
- @spaces.GPU(duration=45)
70
  def inpaint(
71
  image,
72
  mask,
 
73
  prompt: str = "",
74
  seed: int = 0,
75
  num_inference_steps: int = 28,
@@ -80,10 +147,23 @@ def inpaint(
80
  mask = mask.convert("L")
81
  width, height = calculate_optimal_dimensions(image)
82
 
 
 
 
83
  pipe.to("cuda")
 
 
 
 
 
 
 
 
 
 
84
  result = pipe(
85
- image=image,
86
- mask_image=mask,
87
  prompt=prompt,
88
  width=width,
89
  height=height,
@@ -91,62 +171,50 @@ def inpaint(
91
  guidance_scale=guidance_scale,
92
  strength=strength,
93
  generator=torch.Generator().manual_seed(seed),
 
 
94
  ).images[0]
95
 
96
- return result.convert("RGBA"), prompt, seed
97
 
98
 
99
  def inpaint_api(
100
  image,
101
  mask,
102
- prompt: str,
103
- seed: int,
104
- num_inference_steps: int,
105
- guidance_scale: int,
106
- strength: float,
107
- flux_keywords: List[str] = None,
108
- loras_selected: List[Tuple[str, float]] = None,
 
109
  ):
110
- flux_keywords = flux_keywords or []
111
- loras_selected = loras_selected or []
112
-
113
- # Convertir nombres a objetos LoRA
114
  selected_loras_with_weights = []
115
 
116
- for name, weight_value in loras_selected:
117
- try:
118
- # Convierte explícitamente el peso (que viene como string) a float
119
- weight = float(weight_value)
120
- except (ValueError, TypeError):
121
- # Ignora si el valor no es un número válido (ej: None o string vacío)
122
- print(f"Valor de peso inválido '{weight_value}' para LoRA '{name}', omitiendo.")
123
- continue # Pasa al siguiente LoRA
124
-
125
- lora_obj = next((l for l in loras if l.display_name == name), None)
126
-
127
- # Ahora la comparación 'weight != 0.0' es segura (float con float)
128
- if lora_obj and weight != 0.0:
129
- selected_loras_with_weights.append((lora_obj, weight))
130
 
131
  deactivate_loras(pipe)
132
  if selected_loras_with_weights:
133
  activate_loras(pipe, selected_loras_with_weights)
134
 
135
- # Construir prompt final
136
  final_prompt = ""
137
-
138
  if flux_keywords:
139
  final_prompt += ", ".join(flux_keywords) + ", "
140
-
141
- for lora, _ in selected_loras_with_weights:
142
- if lora.keyword:
143
- if isinstance(lora.keyword, str):
144
- final_prompt += lora.keyword + ", "
145
- else:
146
- final_prompt += ", ".join(lora.keyword) + ", "
147
-
148
- if final_prompt:
149
- final_prompt += "\n\n"
150
  final_prompt += prompt
151
 
152
  if not isinstance(seed, int) or seed < 0:
@@ -155,6 +223,7 @@ def inpaint_api(
155
  return inpaint(
156
  image=image,
157
  mask=mask,
 
158
  prompt=final_prompt,
159
  seed=seed,
160
  num_inference_steps=num_inference_steps,
@@ -163,24 +232,14 @@ def inpaint_api(
163
  )
164
 
165
 
166
- # ========================
167
- # UI DIRECTA A inpaint_api
168
- # ========================
169
- with gr.Blocks(title="Flux.1 Fill dev Inpainting with LoRAs", theme=gr.themes.Soft()) as demo:
170
- gr.api(get_loras, api_name="get_loras")
171
  with gr.Row():
172
  with gr.Column(scale=2):
173
  prompt_input = gr.Text(label="Prompt", lines=4, value="a 25 years old woman")
174
-
175
- seed_slider = gr.Slider(
176
- label="Seed", minimum=-1, maximum=MAX_SEED, step=1, value=-1, info="(-1 = Random)", interactive=True
177
- )
178
-
179
- num_inference_steps_input = gr.Number(label="Inference steps", value=40, interactive=True)
180
-
181
- guidance_scale_input = gr.Number(label="Guidance scale", value=28, interactive=True)
182
-
183
- strength_input = gr.Number(label="Strength", value=1.0, interactive=True, maximum=1.0)
184
 
185
  gr.Markdown("### Flux Keywords")
186
  flux_keywords_input = gr.CheckboxGroup(choices=flux_keywords_available, label="Flux Keywords")
@@ -192,31 +251,29 @@ with gr.Blocks(title="Flux.1 Fill dev Inpainting with LoRAs", theme=gr.themes.So
192
  type="array",
193
  headers=["LoRA", "Weight"],
194
  value=[[name, 0.0] for name in lora_names],
195
- datatype=["str", "number"], # Primera columna string, segunda número
196
- interactive=[False, True], # Solo la segunda columna editable
197
- static_columns=[0],
198
- label="LoRA selection (Weight 0 = disable)",
199
  )
200
 
201
  with gr.Column(scale=3):
202
- image_input = gr.Image(label="Image", type="pil")
203
-
204
- mask_input = gr.Image(label="Mask", type="pil")
205
-
206
- run_btn = gr.Button("Run", variant="primary")
207
 
208
  with gr.Column(scale=3):
209
  result_image = gr.Image(label="Result")
210
-
211
- used_prompt_box = gr.Text(label="Used prompt", lines=4)
212
-
213
- used_seed_box = gr.Number(label="Used seed")
214
 
215
  run_btn.click(
216
  fn=inpaint_api,
217
  inputs=[
218
  image_input,
219
  mask_input,
 
220
  prompt_input,
221
  seed_slider,
222
  num_inference_steps_input,
@@ -225,9 +282,8 @@ with gr.Blocks(title="Flux.1 Fill dev Inpainting with LoRAs", theme=gr.themes.So
225
  flux_keywords_input,
226
  loras_selected_input,
227
  ],
228
- outputs=[result_image, used_prompt_box, used_seed_box],
229
- api_name="inpaint",
230
  )
231
 
232
  if __name__ == "__main__":
233
- demo.launch(share=False, show_error=True)
 
1
  import random
 
2
 
3
  import gradio as gr
4
  import numpy as np
 
6
  import torch
7
  from diffusers import FluxFillPipeline
8
  from loras import LoRA, loras
9
+ from PIL import Image
10
 
11
  MAX_SEED = np.iinfo(np.int32).max
12
 
 
14
 
15
  flux_keywords_available = ["IMG_1025.HEIC", "Selfie"]
16
 
17
# --- LATENT MANIPULATION FUNCTIONS ---
def pack_latents(latents, batch_size, num_channels, height, width):
    """Rearrange (B, C, H, W) latents into Flux's packed (B, H/2*W/2, C*4) layout.

    Each 2x2 spatial patch is folded into the channel dimension, producing the
    flat token sequence the Flux transformer consumes.
    """
    patched = latents.view(batch_size, num_channels, height // 2, 2, width // 2, 2)
    patched = patched.permute(0, 2, 4, 1, 3, 5)
    return patched.reshape(batch_size, (height // 2) * (width // 2), num_channels * 4)
23
 
24
+
25
def unpack_latents(latents, height, width, h_scale=2, w_scale=2):
    """Invert `pack_latents`: restore packed (B, seq, C*scale²) latents to (B, C, H, W).

    Args:
        latents: packed tensor of shape (batch, seq_len, channels).
        height: target latent height of the unpacked tensor.
        width: target latent width of the unpacked tensor.
        h_scale: vertical patch size used when packing (Flux uses 2).
        w_scale: horizontal patch size used when packing (Flux uses 2).

    Returns:
        Tensor of shape (batch, channels // (h_scale * w_scale), height, width).
    """
    # seq_len is implied by height/width, so discard it (was an unused local).
    batch_size, _, channels = latents.shape
    # Flux uses a 2x2 patch, so the factor is 2
    latents = latents.view(
        batch_size, height // h_scale, width // w_scale, channels // (h_scale * w_scale), h_scale, w_scale
    )
    latents = latents.permute(0, 3, 1, 4, 2, 5)
    latents = latents.reshape(batch_size, channels // (h_scale * w_scale), height, width)
    return latents
34
+
35
+
36
# --- CALLBACK (PRESERVED AREA + STEP CAPTURE) ---
def get_gradual_blend_callback(
    pipe,
    original_image,
    preserved_area_mask,
    total_steps,
    step_images_list,
    start_alpha=1.0,
    end_alpha=0.2,
):
    """Build a `callback_on_step_end` function that (a) gradually re-injects the
    original image's latents inside `preserved_area_mask`, fading the blend
    strength from `start_alpha` down to `end_alpha` over the run, and
    (b) decodes a preview image every 5 steps into `step_images_list`.

    Args:
        pipe: the Flux fill pipeline (used for its VAE, transformer dtype and
            image post-processor).
        original_image: PIL RGB image already resized to the generation size.
        preserved_area_mask: PIL mask of the region to keep (white = preserve),
            or None to disable blending.
        total_steps: number of inference steps (used to schedule the alpha ramp).
        step_images_list: mutable list the per-step preview PILs are appended to.
        start_alpha: blend strength at step 0 (1.0 = fully original).
        end_alpha: blend strength at the last step.

    Returns:
        A callback compatible with diffusers' `callback_on_step_end` signature.

    NOTE(review): the periodic decode below uses h_latent/w_latent, which stay
    None when `preserved_area_mask` is None — the factory appears to assume it
    is only called with a mask (as `inpaint` does); confirm before reusing.
    """
    device = pipe.device
    dtype = pipe.transformer.dtype

    # Precomputed packed tensors; remain None when no mask is supplied.
    packed_init_latents = None
    packed_preserved_mask = None
    h_latent = w_latent = None

    if preserved_area_mask is not None:
        with torch.no_grad():
            # Normalize the PIL image to [-1, 1] CHW and move to pipe device/dtype.
            img_tensor = (
                (torch.from_numpy(np.array(original_image).transpose(2, 0, 1)).float() / 127.5 - 1.0)
                .unsqueeze(0)
                .to(device, dtype)
            )
            # Encode to VAE latent space with Flux's shift/scale convention.
            init_latents = pipe.vae.encode(img_tensor).latent_dist.sample()
            init_latents = (init_latents - pipe.vae.config.shift_factor) * pipe.vae.config.scaling_factor

            _, _, h_latent, w_latent = init_latents.shape

            # Pack to the transformer's (B, seq, C*4) token layout.
            packed_init_latents = pack_latents(
                init_latents, batch_size=1, num_channels=16, height=h_latent, width=w_latent
            )

            # Mask → [0, 1] single-channel tensor, downsampled to latent resolution.
            mask_tensor = (
                (torch.from_numpy(np.array(preserved_area_mask.convert("L"))).float() / 255.0)
                .unsqueeze(0)
                .unsqueeze(0)
                .to(device, dtype)
            )
            latent_preserved_mask = torch.nn.functional.interpolate(
                mask_tensor, size=(h_latent, w_latent), mode="nearest"
            )
            packed_preserved_mask = pack_latents(
                latent_preserved_mask, batch_size=1, num_channels=1, height=h_latent, width=w_latent
            )

    def callback_fn(pipe, step, timestep, callback_kwargs):
        """Per-step hook: blend preserved-area latents, capture periodic previews."""
        latents = callback_kwargs["latents"]

        if packed_preserved_mask is not None:
            # Linear ramp: alpha goes start_alpha → end_alpha across the run.
            progress = step / max(1, total_steps - 1)
            current_alpha = start_alpha - (start_alpha - end_alpha) * progress

            # Mask is 1 channel per 2x2 patch position; repeat across the 16
            # latent channels folded into each packed token.
            effective_mask = (packed_preserved_mask * current_alpha).repeat(1, 1, 16)
            latents = (1 - effective_mask) * latents + effective_mask * packed_init_latents

        if step % 5 == 0 or step == total_steps - 1:
            with torch.no_grad():
                # Decode a preview: unpack, undo Flux scale/shift, VAE-decode.
                unpacked = unpack_latents(latents, h_latent, w_latent)
                unpacked = (unpacked / pipe.vae.config.scaling_factor) + pipe.vae.config.shift_factor
                decoded = pipe.vae.decode(unpacked.to(pipe.vae.dtype)).sample
                img_step = pipe.image_processor.postprocess(decoded, output_type="pil")[0]
                step_images_list.append(img_step)

        # Hand the (possibly blended) latents back to the pipeline.
        callback_kwargs["latents"] = latents
        return callback_kwargs

    return callback_fn
104
+
105
+
106
# --- LoRA's FUNCTIONS ---
def activate_loras(pipe: FluxFillPipeline, loras_with_weights: list[tuple[LoRA, float]]):
    """Load and enable the given LoRA adapters on *pipe*.

    Args:
        pipe: the Flux fill pipeline to attach adapters to.
        loras_with_weights: (LoRA, weight) pairs; each adapter is registered
            under its LoRA name and then activated with the paired weight.

    Returns:
        The same pipeline, with all listed adapters set active.
    """
    names = []
    weights = []
    for lora, lora_weight in loras_with_weights:
        pipe.load_lora_weights(lora.id, weight=lora_weight, adapter_name=lora.name)
        names.append(lora.name)
        weights.append(lora_weight)
    pipe.set_adapters(names, adapter_weights=weights)
    return pipe
116
 
117
 
 
 
 
 
118
def deactivate_loras(pipe):
    """Unload every currently loaded LoRA adapter from the pipeline.

    Returns the same pipeline object so calls can be chained.
    """
    pipe.unload_lora_weights()
    return pipe
121
 
122
 
123
# --- GENERATION
def calculate_optimal_dimensions(image):
    """Choose generation dimensions for *image*.

    The longer side is fixed at 1024 and the shorter side follows the original
    aspect ratio; both are then rounded down to a multiple of 8 (required by
    the diffusion model).

    Args:
        image: object exposing a PIL-style ``size`` tuple (width, height).

    Returns:
        (width, height) tuple of ints, each a multiple of 8.
    """
    FIXED_DIMENSION = 1024
    original_width, original_height = image.size
    ratio = original_width / original_height
    if ratio > 1:  # landscape: cap the width
        width = FIXED_DIMENSION
        height = round(FIXED_DIMENSION / ratio)
    else:  # portrait or square: cap the height
        height = FIXED_DIMENSION
        width = round(FIXED_DIMENSION * ratio)
    # Snap both sides down to the nearest multiple of 8.
    return (width // 8) * 8, (height // 8) * 8
133
+
134
+
135
+ @spaces.GPU(duration=60)
 
 
 
 
 
 
 
 
 
 
 
136
  def inpaint(
137
  image,
138
  mask,
139
+ preserved_area_mask=None,
140
  prompt: str = "",
141
  seed: int = 0,
142
  num_inference_steps: int = 28,
 
147
  mask = mask.convert("L")
148
  width, height = calculate_optimal_dimensions(image)
149
 
150
+ # Resize to match dimensions
151
+ image_resized = image.resize((width, height), Image.LANCZOS)
152
+
153
  pipe.to("cuda")
154
+
155
+ # Setup callback if a preserved area mask is provided
156
+ step_images = []
157
+ callback = None
158
+ if preserved_area_mask is not None:
159
+ preserved_area_resized = preserved_area_mask.resize((width, height), Image.NEAREST)
160
+ callback = get_gradual_blend_callback(
161
+ pipe, image_resized, preserved_area_resized, num_inference_steps, step_images
162
+ )
163
+
164
  result = pipe(
165
+ image=image_resized,
166
+ mask_image=mask.resize((width, height)),
167
  prompt=prompt,
168
  width=width,
169
  height=height,
 
171
  guidance_scale=guidance_scale,
172
  strength=strength,
173
  generator=torch.Generator().manual_seed(seed),
174
+ callback_on_step_end=callback,
175
+ callback_on_step_end_tensor_inputs=["latents"] if callback else None,
176
  ).images[0]
177
 
178
+ return result.convert("RGBA"), step_images, prompt, seed
179
 
180
 
181
  def inpaint_api(
182
  image,
183
  mask,
184
+ preserved_area_mask=None,
185
+ prompt: str = "",
186
+ seed: int = -1,
187
+ num_inference_steps: int = 40,
188
+ guidance_scale: float = 30.0,
189
+ strength: float = 1.0,
190
+ flux_keywords: list[str] = None,
191
+ loras_selected: list[tuple[str, float]] = None,
192
  ):
 
 
 
 
193
  selected_loras_with_weights = []
194
 
195
+ if loras_selected:
196
+ for name, weight_value in loras_selected:
197
+ try:
198
+ weight = float(weight_value)
199
+ except (ValueError, TypeError):
200
+ continue
201
+ lora_obj = next((l for l in loras if l.display_name == name), None)
202
+ if lora_obj and weight != 0.0:
203
+ selected_loras_with_weights.append((lora_obj, weight))
 
 
 
 
 
204
 
205
  deactivate_loras(pipe)
206
  if selected_loras_with_weights:
207
  activate_loras(pipe, selected_loras_with_weights)
208
 
 
209
  final_prompt = ""
 
210
  if flux_keywords:
211
  final_prompt += ", ".join(flux_keywords) + ", "
212
+
213
+ if selected_loras_with_weights:
214
+ for lora, _ in selected_loras_with_weights:
215
+ if lora.keyword:
216
+ final_prompt += (lora.keyword if isinstance(lora.keyword, str) else ", ".join(lora.keyword)) + ", "
217
+
 
 
 
 
218
  final_prompt += prompt
219
 
220
  if not isinstance(seed, int) or seed < 0:
 
223
  return inpaint(
224
  image=image,
225
  mask=mask,
226
+ preserved_area_mask=preserved_area_mask,
227
  prompt=final_prompt,
228
  seed=seed,
229
  num_inference_steps=num_inference_steps,
 
232
  )
233
 
234
 
235
+ with gr.Blocks(title="FLUX.1 Fill dev + Area Preservation", theme=gr.themes.Soft()) as demo:
 
 
 
 
236
  with gr.Row():
237
  with gr.Column(scale=2):
238
  prompt_input = gr.Text(label="Prompt", lines=4, value="a 25 years old woman")
239
+ seed_slider = gr.Slider(label="Seed", minimum=-1, maximum=MAX_SEED, step=1, value=-1)
240
+ num_inference_steps_input = gr.Number(label="Inference steps", value=40)
241
+ guidance_scale_input = gr.Number(label="Guidance scale", value=30)
242
+ strength_input = gr.Number(label="Strength", value=1.0, maximum=1.0)
 
 
 
 
 
 
243
 
244
  gr.Markdown("### Flux Keywords")
245
  flux_keywords_input = gr.CheckboxGroup(choices=flux_keywords_available, label="Flux Keywords")
 
251
  type="array",
252
  headers=["LoRA", "Weight"],
253
  value=[[name, 0.0] for name in lora_names],
254
+ datatype=["str", "number"],
255
+ interactive=[False, True],
256
+ label="LoRA selection",
 
257
  )
258
 
259
  with gr.Column(scale=3):
260
+ image_input = gr.Image(label="Original Image", type="pil")
261
+ mask_input = gr.Image(label="Inpaint Mask (Area to change)", type="pil")
262
+ preserved_area_input = gr.Image(label="Preserved Area Mask (Area to keep)", type="pil")
263
+ run_btn = gr.Button("Generate", variant="primary")
 
264
 
265
  with gr.Column(scale=3):
266
  result_image = gr.Image(label="Result")
267
+ used_prompt_box = gr.Text(label="Final Prompt")
268
+ used_seed_box = gr.Number(label="Used Seed")
269
+ steps_gallery = gr.Gallery(label="Evolution (Steps)", columns=3, preview=True)
 
270
 
271
  run_btn.click(
272
  fn=inpaint_api,
273
  inputs=[
274
  image_input,
275
  mask_input,
276
+ preserved_area_input,
277
  prompt_input,
278
  seed_slider,
279
  num_inference_steps_input,
 
282
  flux_keywords_input,
283
  loras_selected_input,
284
  ],
285
+ outputs=[result_image, steps_gallery, used_prompt_box, used_seed_box],
 
286
  )
287
 
288
  if __name__ == "__main__":
289
+ demo.launch()