Spaces:

beertoshi
/

Unthotifai

Sleeping

App Files Files Community

beertoshi committed on May 27, 2025

Commit

920f263

verified ·

1 Parent(s): da348cc

Update app.py

Browse files

Files changed (1) hide show

app.py +167 -115

app.py CHANGED Viewed

@@ -1,195 +1,247 @@
 import gradio as gr
 import torch
-from diffusers import StableDiffusionInpaintPipeline
-from PIL import Image, ImageDraw, ImageFilter
 import numpy as np
 import spaces
-# Initialize model globally (loaded on CPU first)
-print("Loading model on CPU first (ZeroGPU will move it to GPU when needed)...")
-pipe = StableDiffusionInpaintPipeline.from_pretrained(
     "stabilityai/stable-diffusion-2-inpainting",
     torch_dtype=torch.float16,
     safety_checker=None,
     requires_safety_checker=False
 )
-# Don't move to GPU yet - ZeroGPU will handle this
-pipe.enable_attention_slicing()
-print("✅ Model loaded! ZeroGPU will activate when generating.")
-# Clothing prompts
 CLOTHING_PROMPTS = {
-    "Indian Sari": "woman wearing beautiful red and gold silk sari, traditional Indian saree dress, intricate embroidery",
-    "Japanese Kimono": "person wearing elegant floral kimono with obi belt, traditional Japanese clothing, silk fabric",
-    "African Dashiki": "person wearing colorful African dashiki with geometric patterns, traditional clothing, vibrant",
-    "Chinese Qipao": "woman wearing elegant red qipao cheongsam dress, traditional Chinese dress, silk with gold patterns",
-    "Scottish Kilt": "man wearing traditional Scottish kilt with tartan pattern, highland dress, sporran",
-    "Middle Eastern Thobe": "person wearing white thobe robe, traditional Middle Eastern clothing, flowing fabric"
 }
-def create_body_mask(image):
-    """Create mask for clothing area"""
     width, height = image.size
     mask = Image.new('L', (width, height), 0)
     draw = ImageDraw.Draw(mask)
-    # Body area ellipse
-    left = width * 0.2
-    top = height * 0.25
-    right = width * 0.8
-    bottom = height * 0.95
-    draw.ellipse([left, top, right, bottom], fill=255)
-    mask = mask.filter(ImageFilter.GaussianBlur(radius=20))
     return mask
-@spaces.GPU(duration=60)  # Request GPU for 60 seconds
-def generate_clothing(input_image, clothing_type, num_steps=25, guidance_scale=7.5):
-    """Generate traditional clothing with ZeroGPU"""
     if input_image is None:
-        return None, "Please upload an image first"
     try:
-        # Move model to GPU (ZeroGPU allocates it now)
-        pipe.to("cuda")
-        # Convert to PIL if needed
         if isinstance(input_image, np.ndarray):
             image = Image.fromarray(input_image).convert("RGB")
         else:
             image = input_image.convert("RGB")
-        # Store original size
         original_size = image.size
         # Resize for processing
-        max_size = 512
-        if max(image.size) > max_size:
-            ratio = max_size / max(image.size)
             new_size = tuple(int(dim * ratio) for dim in image.size)
             image = image.resize(new_size, Image.Resampling.LANCZOS)
-        # Create mask
-        mask = create_body_mask(image)
-        # Get prompt
         prompt = CLOTHING_PROMPTS[clothing_type]
-        negative_prompt = "nude, naked, nsfw, bad quality, blurry, distorted"
-        # Generate with GPU
         with torch.autocast("cuda"):
-            result = pipe(
                 prompt=prompt,
                 negative_prompt=negative_prompt,
                 image=image,
                 mask_image=mask,
-                num_inference_steps=num_steps,
-                guidance_scale=guidance_scale,
-                strength=0.95
             ).images[0]
-        # Resize back
-        if result.size != original_size:
-            result = result.resize(original_size, Image.Resampling.LANCZOS)
-        # Move model back to CPU to free GPU
-        pipe.to("cpu")
         torch.cuda.empty_cache()
-        return result, f"✅ Successfully added {clothing_type}!"
     except Exception as e:
-        print(f"Generation error: {e}")
         return None, f"Error: {str(e)}"
-# Create interface
-with gr.Blocks(title="Traditional Clothing AI - ZeroGPU", theme=gr.themes.Soft()) as app:
     gr.Markdown("""
-    # 👘 Traditional Clothing Addition Tool
-    **Powered by ZeroGPU** 🚀 - Free GPU acceleration!
-    Add beautiful traditional clothing from various cultures to your photos.
-    Generation takes about 30-45 seconds per image.
     """)
     with gr.Row():
         with gr.Column():
-            input_image = gr.Image(
-                label="Upload Your Photo",
-                type="pil"
-            )
             clothing_type = gr.Dropdown(
                 choices=list(CLOTHING_PROMPTS.keys()),
                 value="Indian Sari",
-                label="Select Traditional Clothing"
             )
-            with gr.Accordion("Advanced Settings", open=False):
-                num_steps = gr.Slider(
-                    minimum=15,
-                    maximum=50,
-                    value=25,
-                    step=5,
-                    label="Quality Steps",
-                    info="More steps = better quality but slower"
                 )
-                guidance_scale = gr.Slider(
-                    minimum=5,
-                    maximum=15,
-                    value=7.5,
-                    step=0.5,
-                    label="Guidance Scale",
-                    info="Higher = more adherence to prompt"
                 )
-            generate_btn = gr.Button(
-                "🎨 Add Traditional Clothing",
-                variant="primary",
-                size="lg"
-            )
         with gr.Column():
-            output_image = gr.Image(
-                label="Result"
-            )
-            status_text = gr.Textbox(
-                label="Status",
-                placeholder="Upload an image and click generate..."
-            )
     gr.Markdown("""
-    ---
-    ### 💡 Tips for Best Results:
-    - Use clear, front-facing photos
-    - Good lighting improves results
-    - The person should be fully visible
-    - Processing uses free GPU via ZeroGPU
-    ### 🌍 Cultural Note:
-    This tool celebrates cultural diversity through traditional clothing.
-    AI-generated results are artistic interpretations.
-    Please use respectfully.
-    ### ⚡ About ZeroGPU:
-    This Space uses Hugging Face's free ZeroGPU feature.
-    GPU is allocated only during generation, which saves resources!
     """)
-    # Connect button
     generate_btn.click(
-        fn=generate_clothing,
-        inputs=[input_image, clothing_type, num_steps, guidance_scale],
-        outputs=[output_image, status_text]
     )
-if __name__ == "__main__":
-    app.launch()

 import gradio as gr
 import torch
+from diffusers import StableDiffusionInpaintPipeline, StableDiffusionImg2ImgPipeline
+from PIL import Image, ImageDraw, ImageFilter, ImageEnhance
 import numpy as np
 import spaces
+# Load models
+# Build the Stable Diffusion 2 inpainting pipeline once at import time, in
+# float16 and with the safety checker disabled. No device is chosen here;
+# generate_professional_quality() moves the pipeline to CUDA for each request.
+inpaint_pipe = StableDiffusionInpaintPipeline.from_pretrained(
     "stabilityai/stable-diffusion-2-inpainting",
     torch_dtype=torch.float16,
     safety_checker=None,
     requires_safety_checker=False
 )
+# Turn on the pipeline's attention-slicing, VAE-slicing and VAE-tiling options
+# (presumably to lower peak memory at larger resolutions - confirm against the
+# diffusers documentation).
+inpaint_pipe.enable_attention_slicing()
+inpaint_pipe.enable_vae_slicing()
+inpaint_pipe.enable_vae_tiling()  # For high-res
+print("✅ Model loaded with high-res support!")
+# Maps each clothing label to the text prompt handed to the inpainting pipeline.
+# The keys are also the choices of the "Traditional Clothing" dropdown, whose
+# default value is "Indian Sari", so that key must stay present.
 CLOTHING_PROMPTS = {
+    "Indian Sari": "woman wearing luxurious red and gold silk sari with intricate embroidery, traditional Indian saree, professional fashion photography, studio lighting, ultra detailed fabric texture, 8k quality",
+    "Japanese Kimono": "person wearing exquisite silk kimono with cherry blossom patterns, traditional Japanese formal wear, professional portrait, studio lighting, highly detailed fabric, photorealistic",
+    "African Dashiki": "person wearing vibrant African dashiki with authentic kente patterns, traditional clothing, professional photography, rich colors, detailed textile work, high resolution",
+    "Chinese Qipao": "elegant woman in traditional Chinese qipao cheongsam, silk dress with intricate patterns, professional fashion shoot, studio lighting, ultra high quality",
 }
+def create_professional_mask(image, face_margin=0.35):
+    """Build a soft-edged grayscale mask selecting the area to repaint.
+
+    A white ellipse is drawn over the lower part of the frame, a short stack
+    of progressively brighter horizontal bands is painted just above the
+    ellipse's top edge, and the result is blurred twice.
+
+    Args:
+        image: Image whose ``size`` determines the mask dimensions.
+        face_margin: Fraction of the image height, measured from the top, at
+            which the ellipse starts.
+
+    Returns:
+        A new mode ``'L'`` image with the same size as ``image``.
+    """
+    img_w, img_h = image.size
+    canvas = Image.new('L', (img_w, img_h), 0)
+    pen = ImageDraw.Draw(canvas)
+
+    # Ellipse bounds: 10%-90% of the width, from the face line down to 98% of the height.
+    top = img_h * face_margin
+    left, right, bottom = img_w * 0.1, img_w * 0.9, img_h * 0.98
+    pen.ellipse([left, top, right, bottom], fill=255)
+
+    # Fade-in bands: one band per pixel row for the 30 rows above the face
+    # line, darkest at the top; bands that would start above the image are skipped.
+    band_count = 30
+    for step, offset in enumerate(range(band_count, 0, -1)):
+        row = top - offset
+        if row < 0:
+            continue
+        shade = int(255 * (step / band_count))
+        pen.rectangle([left, row, right, row + 1], fill=shade)
+
+    # Two successive Gaussian blurs soften every edge of the mask.
+    for radius in (15, 25):
+        canvas = canvas.filter(ImageFilter.GaussianBlur(radius=radius))
+    return canvas
+def enhance_for_processing(image):
+    """Return ``image`` after a mild sharpness, color and contrast boost.
+
+    The three adjustments are applied in that order, each to the output of
+    the previous one.
+    """
+    adjustments = (
+        (ImageEnhance.Sharpness, 1.3),
+        (ImageEnhance.Color, 1.1),
+        (ImageEnhance.Contrast, 1.05),
+    )
+    for enhancer_cls, factor in adjustments:
+        image = enhancer_cls(image).enhance(factor)
+    return image
+def professional_blend(original, generated, mask, blend_mode="smooth"):
+    """Composite ``generated`` over ``original`` wherever ``mask`` is bright.
+
+    Args:
+        original: Image to keep where the mask is dark.
+        generated: Image to show where the mask is bright.
+        mask: Blend mask; brighter pixels favor ``generated``.
+        blend_mode: ``"smooth"`` runs two composite passes with extra-blurred
+            copies of the mask (radius 40, then 60); any other value does a
+            single composite with the mask as given.
+
+    Returns:
+        The blended image converted to ``"RGB"``, sized like ``original``.
+    """
+    # Image.composite() rejects inputs whose sizes differ, so bring the
+    # generated image and the mask onto the original's pixel grid first.
+    # When the sizes already agree these branches are skipped.
+    if generated.size != original.size:
+        generated = generated.resize(original.size, Image.Resampling.LANCZOS)
+    if mask.size != original.size:
+        mask = mask.resize(original.size, Image.Resampling.LANCZOS)
+
+    original_rgba = original.convert("RGBA")
+    generated_rgba = generated.convert("RGBA")
+
+    if blend_mode == "smooth":
+        # Progressively wider blurs give a softer hand-off between the images.
+        blend_mask1 = mask.filter(ImageFilter.GaussianBlur(radius=40))
+        blend_mask2 = mask.filter(ImageFilter.GaussianBlur(radius=60))
+        # First pass blends the generated pixels in.
+        result = Image.composite(generated_rgba, original_rgba, blend_mask1)
+        # Second pass pulls the outer fringe back toward the original.
+        result = Image.composite(result, original_rgba, blend_mask2)
+    else:
+        # Standard blend: one pass with the mask exactly as supplied.
+        result = Image.composite(generated_rgba, original_rgba, mask)
+    return result.convert("RGB")
+# NOTE(review): the UI text advertises 2-3 minutes for the "ultra" preset while
+# the GPU is requested for 120 seconds - confirm the duration is sufficient.
+@spaces.GPU(duration=120)
+def generate_professional_quality(
+    input_image,
+    clothing_type,
+    face_margin=0.35,
+    quality_preset="ultra",
+    blend_mode="smooth"
+):
+    """Repaint the body area of a photo using the selected clothing prompt.
+
+    Args:
+        input_image: Uploaded photo, either a PIL image or a NumPy array;
+            ``None`` when nothing was uploaded.
+        clothing_type: Key into ``CLOTHING_PROMPTS``.
+        face_margin: Forwarded to ``create_professional_mask``.
+        quality_preset: One of ``"fast"``, ``"balanced"`` or ``"ultra"``.
+        blend_mode: Forwarded to ``professional_blend``.
+
+    Returns:
+        A ``(image, status)`` tuple. ``image`` is the result at the upload's
+        original size, or ``None`` when nothing was generated; ``status`` is a
+        message for the status textbox.
+    """
+    if input_image is None:
+        return None, "Please upload an image"
+
+    # Longest-side working resolution, denoising steps and guidance per preset.
+    quality_settings = {
+        "fast": {"size": 512, "steps": 30, "guidance": 7.5},
+        "balanced": {"size": 768, "steps": 50, "guidance": 8.0},
+        "ultra": {"size": 1024, "steps": 75, "guidance": 8.5}
+    }
+    # Reject bad selections up front with a readable message instead of
+    # surfacing a bare KeyError text after the model was moved to the GPU.
+    if quality_preset not in quality_settings:
+        return None, f"Error: unknown quality preset {quality_preset!r}"
+    if clothing_type not in CLOTHING_PROMPTS:
+        return None, f"Error: unknown clothing type {clothing_type!r}"
+    settings = quality_settings[quality_preset]
+
+    try:
+        # Move to GPU
+        inpaint_pipe.to("cuda")
+
+        # Prepare image
+        if isinstance(input_image, np.ndarray):
+            image = Image.fromarray(input_image).convert("RGB")
+        else:
+            image = input_image.convert("RGB")
+        original_size = image.size
+
+        # Shrink so the longest side fits the preset (never upscale), then
+        # round each side down to a multiple of 8: the pipeline is called with
+        # explicit height/width and rejects values not divisible by 8.
+        scale = min(1.0, settings["size"] / max(image.size))
+        new_size = tuple(max(8, int(dim * scale) // 8 * 8) for dim in image.size)
+        if new_size != image.size:
+            image = image.resize(new_size, Image.Resampling.LANCZOS)
+
+        # Keep the un-enhanced working-size copy as the blend background.
+        original_resized = image
+        image = enhance_for_processing(original_resized)
+
+        # Create professional mask
+        mask = create_professional_mask(image, face_margin)
+
+        # Generate with the preset's settings
+        prompt = CLOTHING_PROMPTS[clothing_type]
+        negative_prompt = "blurry, low quality, distorted face, bad anatomy, ugly, amateur"
+        with torch.autocast("cuda"):
+            result = inpaint_pipe(
+                prompt=prompt,
+                negative_prompt=negative_prompt,
+                image=image,
+                mask_image=mask,
+                num_inference_steps=settings["steps"],
+                guidance_scale=settings["guidance"],
+                strength=0.88,
+                height=image.height,
+                width=image.width
+            ).images[0]
+
+        # Blend the generated pixels back over the untouched working copy,
+        # then apply the same enhancement pass to the final image.
+        final = professional_blend(original_resized, result, mask, blend_mode)
+        final = enhance_for_processing(final)
+
+        # Resize to original
+        if final.size != original_size:
+            final = final.resize(original_size, Image.Resampling.LANCZOS)
+        return final, f"✅ Professional quality {clothing_type} applied!"
+    except Exception as e:
+        # UI boundary: report the failure in the status box instead of raising.
+        return None, f"Error: {str(e)}"
+    finally:
+        # Cleanup runs on success and on failure so the model never stays on the GPU.
+        inpaint_pipe.to("cpu")
+        torch.cuda.empty_cache()
+# Professional UI
+# Two-column layout: inputs and settings on the left, result and status on the
+# right. The button click calls generate_professional_quality with the five
+# input components, in the same order as that function's parameters.
+with gr.Blocks(title="Professional Clothing AI", theme=gr.themes.Soft()) as app:
     gr.Markdown("""
+    # 👘 Professional Traditional Clothing AI
+    ### Maximum Quality • Perfect Face Preservation • Studio Results
     """)
     with gr.Row():
         with gr.Column():
+            input_image = gr.Image(type="pil", label="Upload High-Res Photo")
             clothing_type = gr.Dropdown(
                 choices=list(CLOTHING_PROMPTS.keys()),
                 value="Indian Sari",
+                label="Traditional Clothing"
             )
+            with gr.Accordion("Professional Settings", open=True):
+                # Keyword arguments: newer Gradio releases accept `step` only
+                # by keyword, and keywords work on older releases as well.
+                face_margin = gr.Slider(
+                    minimum=0.25, maximum=0.45, value=0.35, step=0.05,
+                    label="Face Safety Margin",
+                    info="Higher = more face protection"
+                )
+                quality_preset = gr.Radio(
+                    ["fast", "balanced", "ultra"],
+                    value="ultra",
+                    label="Quality Preset",
+                    info="Ultra = best quality (2-3 min)"
                 )
+                blend_mode = gr.Radio(
+                    ["smooth", "standard"],
+                    value="smooth",
+                    label="Blend Mode",
+                    info="Smooth = seamless transitions"
                 )
+            generate_btn = gr.Button("🎨 Generate Professional", variant="primary", size="lg")
         with gr.Column():
+            output_image = gr.Image(label="Result")
+            status = gr.Textbox(label="Status")
     gr.Markdown("""
+    ### 🏆 Professional Tips:
+    - Use photos 1000px+ for best results
+    - Face margin 0.35 preserves faces perfectly
+    - Ultra mode takes 2-3 minutes but worth it
+    - Smooth blending eliminates all artifacts
     """)
     generate_btn.click(
+        generate_professional_quality,
+        inputs=[input_image, clothing_type, face_margin, quality_preset, blend_mode],
+        outputs=[output_image, status]
     )
+# Launch only when run as a script, so importing this module does not start a server.
+if __name__ == "__main__":
+    app.launch()