FLUX.2-Test

Sleeping

App Files Files Community

jhh6576 committed on Jan 26

Commit

ca0ffa2

verified ·

1 Parent(s): 5b67c31

Update app.py

Browse files

Files changed (1) hide show

app.py +89 -115

app.py CHANGED Viewed

@@ -1,145 +1,119 @@
-import os
 import gradio as gr
-import numpy as np
-import random
-import spaces
 import torch
 from diffusers import FluxImg2ImgPipeline
-from PIL import Image, ImageOps
-import io
-import base64
 # --- CONFIGURATION ---
-# We use bfloat16 for speed/memory on CPU
-dtype = torch.bfloat16
-device = "cpu"
-# We use Schnell because it is 10x faster on CPU than Dev or 'Klein'
-# If you explicitly have access to Flux 2, change this ID.
 MODEL_ID = "black-forest-labs/FLUX.1-schnell"
-print(f"Loading Model: {MODEL_ID} on {device}...")
-# Load Pipeline
 pipe = FluxImg2ImgPipeline.from_pretrained(
     MODEL_ID,
-    torch_dtype=dtype
 )
-# CRITICAL CPU OPTIMIZATION
-# This replaces .to("cuda"). It loads the model in pieces so RAM doesn't crash.
-pipe.enable_model_cpu_offload()
-MAX_SEED = np.iinfo(np.int32).max
-# --- THE "INJECTION" LOGIC ---
-# This acts as a pre-processor injection. It forces the pixel data
-# to be symmetrical before the UNet even sees it.
-# This guarantees the "Face Lock".
-def inject_symmetry(image, side="Left"):
-    if image is None:
-        return None
-    img = image.convert("RGB")
-    w, h = img.size
-    mid = w // 2
-    arr = np.array(img)
-    # Mathematical locking of geometry
     if side == "Left":
-        target_half = arr[:, :mid, :] # Get Left
-        mirrored = np.fliplr(target_half) # Mirror it
-        locked_face = np.concatenate((target_half, mirrored), axis=1)
     else:
-        target_half = arr[:, mid:, :] # Get Right
-        mirrored = np.fliplr(target_half) # Mirror it
-        locked_face = np.concatenate((mirrored, target_half), axis=1)
-    return Image.fromarray(locked_face)
-# --- INFERENCE FUNCTION ---
-@spaces.GPU(duration=120) # Request GPU if available, falls back to CPU logic if not
-def infer(prompt, input_image, side_choice, strength, seed, randomize_seed, width, height, steps, guidance):
-    if input_image is None:
-        raise gr.Error("Please upload an image for face symmetry.")
-    if randomize_seed:
-        seed = random.randint(0, MAX_SEED)
-    # 1. INJECT SYMMETRY
-    # We process the image *before* the model touches it.
-    print("Injecting symmetry constraints...")
-    processed_image = inject_symmetry(input_image, side_choice)
-    # Resize to be compatible with Flux (multiples of 16)
-    w, h = processed_image.size
-    w = (w // 16) * 16
-    h = (h // 16) * 16
-    processed_image = processed_image.resize((w, h))
-    print("Running Flux to smooth seams...")
-    generator = torch.Generator(device="cpu").manual_seed(seed)
-    # 2. RUN DIFFUSION
-    # We use the processed image as the base.
-    # Strength is CRITICAL:
-    # 0.1 - 0.30 = Locks Identity (Only fixes the seam)
-    # 0.35+ = Starts changing the face
-    result = pipe(
-        prompt=prompt,
-        image=processed_image,
-        strength=strength,
-        num_inference_steps=steps,
-        guidance_scale=guidance,
-        generator=generator
-    ).images[0]
-    return result, seed
-# --- UI SETUP ---
 css = """
-#col-container { max-width: 1000px; margin: 0 auto; }
 """
 with gr.Blocks(css=css) as demo:
     with gr.Column(elem_id="col-container"):
-        gr.Markdown("# Flux Face Symmetry (Identity Lock)")
-        gr.Markdown("CPU-Optimized Mode. Uses Pixel Injection to lock face geometry.")
         with gr.Row():
-            with gr.Column():
-                input_img = gr.Image(label="Upload Face", type="pil")
-                with gr.Row():
-                    side = gr.Radio(["Left", "Right"], label="Keep Side", value="Left")
-                    # Strength default is 0.25 -> This ensures ID is locked
-                    strength = gr.Slider(0.1, 0.6, value=0.25, step=0.01, label="Denoise Strength (Keep <0.30 to lock ID)")
-                prompt = gr.Text(
-                    label="Prompt (Optional - usually leave empty or describe lighting)",
-                    value="high quality, realistic, smooth skin, 8k",
-                    lines=2
-                )
-                run_btn = gr.Button("Generate Symmetrical Face", variant="primary")
-                with gr.Accordion("Advanced", open=False):
-                    steps = gr.Slider(1, 50, value=4, step=1, label="Steps (Keep low for CPU)")
-                    guidance = gr.Slider(0, 10, value=1.0, step=0.1, label="Guidance")
-                    width = gr.Slider(256, 1024, value=1024, step=16, label="Width")
-                    height = gr.Slider(256, 1024, value=1024, step=16, label="Height")
-                    seed = gr.Slider(0, MAX_SEED, value=0, label="Seed")
-                    randomize_seed = gr.Checkbox(True, label="Randomize Seed")
-            with gr.Column():
-                output_img = gr.Image(label="Result")
-                seed_output = gr.Number(label="Used Seed")
-    run_btn.click(
-        infer,
-        inputs=[prompt, input_img, side, strength, seed, randomize_seed, width, height, steps, guidance],
-        outputs=[output_img, seed_output]
-    )
-demo.launch()

 import gradio as gr
 import torch
+import numpy as np
+import gc
 from diffusers import FluxImg2ImgPipeline
+from PIL import Image
 # --- CONFIGURATION ---
+# Checkpoint, target device and tensor dtype shared by every request.
+# FLUX.1-schnell is the fast, distilled FLUX checkpoint.
 MODEL_ID = "black-forest-labs/FLUX.1-schnell"
+DEVICE, DTYPE = "cpu", torch.bfloat16
+print(f"Loading {MODEL_ID} on {DEVICE}...")
+# The pipeline is built once at import time. No .to(...) or offload call is
+# made here, so the weights stay wherever from_pretrained places them.
+pipe = FluxImg2ImgPipeline.from_pretrained(MODEL_ID, torch_dtype=DTYPE)
+# --- THE INJECTION LOGIC ---
+# Symmetry is imposed on the input pixels *before* the diffusion pipeline
+# runs, so the model receives an already-mirrored face and only has to blend
+# the seam instead of inventing the symmetry itself.
+def inject_face_symmetry(image, side="Left"):
+    """Return a copy of ``image`` mirrored about its vertical centre line.
+
+    Args:
+        image: A PIL image (anything exposing ``convert("RGB")``), or ``None``.
+        side: ``"Left"`` keeps the left half and mirrors it onto the right.
+            Any other value keeps the right half and mirrors it onto the left.
+
+    Returns:
+        A new RGB PIL image with the same width and height as the input,
+        or ``None`` when ``image`` is ``None``.
+    """
+    if image is None:
+        return None
+    img_array = np.array(image.convert("RGB"))
+    width = img_array.shape[1]
+    midpoint = width // 2
+    # For odd widths the centre column sits exactly on the mirror axis: keep
+    # it once and do not duplicate it, so both branches return an image of
+    # the original width (previously "Left" lost a column and "Right" gained
+    # one). For even widths has_center is 0 and the result is unchanged.
+    has_center = width % 2
     if side == "Left":
+        # Keep Left (plus the centre column, if any), mirror to Right
+        kept = img_array[:, :midpoint + has_center, :]
+        mirrored = np.fliplr(img_array[:, :midpoint, :])
+        symmetrical_array = np.concatenate((kept, mirrored), axis=1)
     else:
+        # Keep Right (plus the centre column, if any), mirror to Left
+        kept = img_array[:, midpoint:, :]
+        mirrored = np.fliplr(img_array[:, midpoint + has_center:, :])
+        symmetrical_array = np.concatenate((mirrored, kept), axis=1)
+    return Image.fromarray(symmetrical_array)
+# --- INFERENCE ---
+def run_inference(prompt, image_input, side, strength, seed, steps):
+    """Mirror the uploaded face, then run one img2img pass over the result.
+
+    Args:
+        prompt: Text prompt forwarded to the pipeline.
+        image_input: Uploaded PIL image, or ``None`` if nothing was uploaded.
+        side: Which half to keep; passed to ``inject_face_symmetry``.
+        strength: Denoising strength forwarded to the pipeline.
+        seed: Seed for the random generator; coerced with ``int``.
+        steps: Number of inference steps; coerced with ``int``.
+
+    Returns:
+        The first image produced by the pipeline, or ``None`` when
+        ``image_input`` is ``None``.
+
+    Raises:
+        gr.Error: If the pipeline raises ``RuntimeError`` (for example when
+            it runs out of memory), so the failure is shown in the UI
+            instead of silently producing an empty output.
+    """
+    if image_input is None:
+        return None
+    # Clean RAM before starting
+    gc.collect()
+    # 1. INJECTION: make the input symmetrical before the model sees it.
+    print("Injecting Symmetry Code...")
+    locked_image = inject_face_symmetry(image_input, side)
+    # 2. RESIZE FOR CPU SAFETY
+    # A fixed 768x768 working size bounds memory use (the original author
+    # notes free CPU hosts have too little RAM for larger inputs).
+    # NOTE: the aspect ratio of the upload is not preserved by this resize.
+    locked_image = locked_image.resize((768, 768))
+    # 3. RUN FLUX (refining the seam)
+    # A low strength keeps the output close to the mirrored input.
+    print("Running Flux UNet...")
+    generator = torch.Generator(DEVICE).manual_seed(int(seed))
+    try:
+        result = pipe(
+            prompt=prompt,
+            image=locked_image,
+            strength=strength,
+            # UI sliders may deliver a float; the step count must be an int.
+            num_inference_steps=int(steps),
+            guidance_scale=0.0,  # Schnell uses 0 guidance usually
+            generator=generator,
+        ).images[0]
+    except RuntimeError as e:
+        # Log for the server console and surface the failure to the user
+        # rather than returning None with no explanation.
+        print(f"Flux inference failed: {e}")
+        raise gr.Error(f"Image generation failed: {e}") from e
+    return result
+# --- UI ---
+# Extra CSS: centre the main column and cap its width.
 css = """
+#col-container { max-width: 900px; margin: 0 auto; }
 """
 with gr.Blocks(css=css) as demo:
     with gr.Column(elem_id="col-container"):
+        # Page header.
+        gr.Markdown("# Flux Face Symmetry (Identity Lock)")
+        gr.Markdown(f"Running **{MODEL_ID}** on CPU. <br/>Method: Pre-UNet Symmetry Injection.")
+        # Upload on the left, generated result on the right.
         with gr.Row():
+            img_in = gr.Image(label="Upload Face", type="pil")
+            img_out = gr.Image(label="Symmetrical Result")
+        # Main controls: which half to keep and how strongly to denoise.
+        with gr.Row():
+            side = gr.Radio(["Left", "Right"], label="Good Side", value="Left")
+            strength = gr.Slider(
+                minimum=0.1,
+                maximum=0.45,
+                value=0.20,
+                step=0.01,
+                label="Denoise (Lower = Stronger Lock)",
+            )
+        # Rarely changed settings stay collapsed by default.
+        with gr.Accordion("Advanced Settings", open=False):
+            prompt = gr.Text(label="Prompt", value="high quality, realistic, smooth")
+            steps = gr.Slider(
+                minimum=1,
+                maximum=10,
+                value=2,
+                step=1,
+                label="Steps (Schnell only needs 2-4)",
+            )
+            seed = gr.Number(label="Seed", value=42)
+        btn = gr.Button("Generate", variant="primary")
+        # Input order must match run_inference's parameter order.
+        btn.click(
+            fn=run_inference,
+            inputs=[prompt, img_in, side, strength, seed, steps],
+            outputs=[img_out],
+        )
+demo.queue().launch()