Spaces:

VcRlAgent
/

FaceForgeAI_ZeroGPU

Sleeping

App Files Files Community

VcRlAgent committed on Oct 17, 2025

Commit

3c8b597

1 Parent(s): cc10554

Refactor to enable users to choose Avatar generation modes

Browse files

Files changed (4) hide show

app copy.py +226 -0
app.py +68 -27
app.py.orig +0 -14
requirement.txt.bk +0 -34

app copy.py ADDED Viewed

	@@ -0,0 +1,226 @@

+# ==========================================
+# FaceForge AI – ZeroGPU Gradio Version
+# Author: Vijay S. Chaudhari | 2025
+# ==========================================
+import gradio as gr
+import spaces
+import torch
+import cv2
+import numpy as np
+from PIL import Image, ImageEnhance, ImageOps
+from rembg import remove
+from diffusers import StableDiffusionImg2ImgPipeline
+import io
+import torchvision
+print("Printing Torch and TorchVision versions:")
+print(torch.__version__)
+print(torchvision.__version__)
+# GPU libraries
+from gfpgan import GFPGANer
+from basicsr.archs.rrdbnet_arch import RRDBNet
+from realesrgan import RealESRGANer
+# ------------------------------------------
+# Model Loading (Outside GPU decorator)
+# ------------------------------------------
+def load_models():
+    """Load models once at startup"""
+    device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+    # RealESRGAN upsampler
+    model = RRDBNet(num_in_ch=3, num_out_ch=3, num_feat=64, num_block=23, num_grow_ch=32, scale=2)
+    upsampler = RealESRGANer(
+        scale=2,
+        model_path='https://github.com/xinntao/Real-ESRGAN/releases/download/v0.2.1/RealESRGAN_x2plus.pth',
+        model=model,
+        tile=400,
+        tile_pad=10,
+        pre_pad=0,
+        half=True,
+        device=device
+    )
+    # GFPGAN enhancer
+    face_enhancer = GFPGANer(
+        model_path='https://github.com/TencentARC/GFPGAN/releases/download/v1.3.0/GFPGANv1.3.pth',
+        upscale=2,
+        arch='clean',
+        channel_multiplier=2,
+        bg_upsampler=upsampler,
+        device=device
+    )
+    # Stable Diffusion Img2Img pipeline (public model)
+    sd_pipe = StableDiffusionImg2ImgPipeline.from_pretrained(
+        "runwayml/stable-diffusion-v1-5",
+        torch_dtype=torch.float16
+    ).to(device)
+    # Optimize for ZeroGPU memory
+    sd_pipe.enable_attention_slicing()
+    sd_pipe.enable_model_cpu_offload()
+    return face_enhancer, sd_pipe
+# Load models globally
+face_enhancer, sd_pipe = load_models()
+# ------------------------------------------
+# GPU-Accelerated Functions
+# ------------------------------------------
+@spaces.GPU
+def enhance_face(img: Image.Image) -> Image.Image:
+    """Enhance face using GFPGAN (GPU)"""
+    img_cv = cv2.cvtColor(np.array(img.convert('RGB')), cv2.COLOR_RGB2BGR)
+    with torch.no_grad():
+        _, _, restored_img = face_enhancer.enhance(
+            img_cv,
+            has_aligned=False,
+            only_center_face=False,
+            paste_back=True,
+            weight=0.5
+        )
+    restored_img = cv2.cvtColor(restored_img, cv2.COLOR_BGR2RGB)
+    return Image.fromarray(restored_img)
+# ------------------------------------------
+# Image Processing Functions
+# ------------------------------------------
+def enhance_image(img: Image.Image) -> Image.Image:
+    """Basic enhancement"""
+    img = ImageEnhance.Contrast(img).enhance(1.15)
+    img = ImageEnhance.Sharpness(img).enhance(1.1)
+    return img
+@spaces.GPU
+def create_headshot(img: Image.Image) -> Image.Image:
+    """Professional headshot with gradient background"""
+    # Enhance face
+    img_enhanced = enhance_face(img)
+    # Remove background
+    img_no_bg = remove(img_enhanced)
+    # Gradient background
+    bg = Image.new("RGB", img_no_bg.size, (200, 210, 230))
+    if img_no_bg.mode == 'RGBA':
+        bg.paste(img_no_bg, mask=img_no_bg.split()[3])
+    return enhance_image(bg)
+@spaces.GPU
+def create_passport(img: Image.Image) -> Image.Image:
+    """Passport photo with white background"""
+    # Enhance face
+    img_enhanced = enhance_face(img)
+    # Remove background
+    img_no_bg = remove(img_enhanced)
+    # White background (600x600)
+    bg = Image.new("RGB", (600, 600), (255, 255, 255))
+    img_no_bg.thumbnail((550, 550), Image.Resampling.LANCZOS)
+    offset = ((600 - img_no_bg.width) // 2, (600 - img_no_bg.height) // 2)
+    if img_no_bg.mode == 'RGBA':
+        bg.paste(img_no_bg, offset, mask=img_no_bg.split()[3])
+    return bg
+@spaces.GPU
+def create_avatar(img: Image.Image) -> Image.Image:
+    """Stylized AI avatar"""
+    # Enhance face
+    img_enhanced = enhance_face(img)
+    # Resize for SD (512x512)
+    img_resized = img_enhanced.convert("RGB").resize((512, 512))
+    # Stylize with SD prompt
+    #prompt = "highly detailed, digital portrait, professional lighting, cinematic style, artistic AI avatar"
+    #prompt = "stylized yet realistic portrait, balanced lighting, subtle gradient background, sharp focus on face"
+    #prompt = "studio portrait, even lighting, neutral background, realistic skin, confident pose"
+    prompt = "realistic professional headshot, soft studio lighting, neutral background, crisp details, natural skin tone"
+    with torch.autocast("cuda"):
+        result = sd_pipe(prompt=prompt, image=img_resized, strength=0.4, guidance_scale=5.0)
+    avatar = result.images[0]
+    return avatar
+@spaces.GPU
+def process_all(img: Image.Image):
+    """Process all three types at once"""
+    headshot = create_headshot(img)
+    passport = create_passport(img)
+    avatar = create_avatar(img)
+    return headshot, passport, avatar
+# ------------------------------------------
+# Gradio Interface
+# ------------------------------------------
+with gr.Blocks(theme=gr.themes.Soft(), title="FaceForge AI") as demo:
+    # Page header: app title and a one-line description.
+    gr.Markdown(
+        """
+        # 🎨 FaceForge AI
+        ### GPU-Accelerated Professional Headshot & Avatar Generator
+        Upload your photo and generate professional headshots, passport photos, and AI avatars instantly!
+        """
+    )
+    # Input row: upload widget and trigger button on the left; the right
+    # column only holds the "Results" heading.
+    with gr.Row():
+        with gr.Column():
+            input_image = gr.Image(type="pil", label="📷 Upload Your Photo")
+            process_btn = gr.Button("✨ Generate All Images", variant="primary", size="lg")
+        with gr.Column():
+            gr.Markdown("### Results")
+    # Output row: one image slot per generated variant.
+    with gr.Row():
+        output_headshot = gr.Image(label="💼 Professional Headshot", type="pil")
+        output_passport = gr.Image(label="🛂 Passport Photo", type="pil")
+        output_avatar = gr.Image(label="🎭 AI Avatar", type="pil")
+    # Process button: one click runs process_all on the uploaded image and
+    # fills the three outputs in the order process_all returns them.
+    process_btn.click(
+        fn=process_all,
+        inputs=input_image,
+        outputs=[output_headshot, output_passport, output_avatar]
+    )
+    # Examples: the list is currently empty, so no sample inputs are offered.
+    gr.Examples(
+        examples=[],  # Add example image paths if available
+        inputs=input_image
+    )
+    # Footer: feature summary and credits.
+    gr.Markdown(
+        """
+        ---
+        ### Features
+        - 💼 **Professional Headshots**: Perfect for LinkedIn and business profiles
+        - 🛂 **Passport Photos**: Standard 600x600px with white background
+        - 🎭 **AI Avatars**: Stylized versions for social media
+        - ⚡ **GPU-Accelerated**: Fast processing with GFPGAN enhancement
+        © 2025 Vijay S. Chaudhari | Powered by ZeroGPU 🚀
+        """
+    )
+# Launch
+if __name__ == "__main__":
+    demo.queue(max_size=20)
+    demo.launch()

app.py CHANGED Viewed

@@ -138,23 +138,21 @@ def create_passport(img: Image.Image) -> Image.Image:
 @spaces.GPU
 def create_avatar(img: Image.Image) -> Image.Image:
-    """Stylized AI avatar"""
     # Enhance face
     img_enhanced = enhance_face(img)
     # Resize for SD (512x512)
     img_resized = img_enhanced.convert("RGB").resize((512, 512))
-    # Stylize with SD prompt
     #prompt = "highly detailed, digital portrait, professional lighting, cinematic style, artistic AI avatar"
     #prompt = "stylized yet realistic portrait, balanced lighting, subtle gradient background, sharp focus on face"
     #prompt = "studio portrait, even lighting, neutral background, realistic skin, confident pose"
-    prompt = "realistic professional headshot, soft studio lighting, neutral background, crisp details, natural skin tone"
     with torch.autocast("cuda"):
-        result = sd_pipe(prompt=prompt, image=img_resized, strength=0.4, guidance_scale=5.0)
     avatar = result.images[0]
@@ -176,37 +174,80 @@ with gr.Blocks(theme=gr.themes.Soft(), title="FaceForge AI") as demo:
     gr.Markdown(
         """
         # 🎨 FaceForge AI
-        ### GPU-Accelerated Professional Headshot & Avatar Generator
-        Upload your photo and generate professional headshots, passport photos, and AI avatars instantly!
         """
     )
     with gr.Row():
-        with gr.Column():
             input_image = gr.Image(type="pil", label="📷 Upload Your Photo")
             process_btn = gr.Button("✨ Generate All Images", variant="primary", size="lg")
-        with gr.Column():
             gr.Markdown("### Results")
-    with gr.Row():
-        output_headshot = gr.Image(label="💼 Professional Headshot", type="pil")
-        output_passport = gr.Image(label="🛂 Passport Photo", type="pil")
-        output_avatar = gr.Image(label="🎭 AI Avatar", type="pil")
-    # Process button
     process_btn.click(
-        fn=process_all,
-        inputs=input_image,
         outputs=[output_headshot, output_passport, output_avatar]
     )
-    # Examples
-    gr.Examples(
-        examples=[],  # Add example image paths if available
-        inputs=input_image
-    )
     gr.Markdown(
         """
         ---

 @spaces.GPU
 def create_avatar(img: Image.Image) -> Image.Image:
+    """Stylized AI avatar using Stable Diffusion Img2Img with user inputs"""
     # Enhance face
     img_enhanced = enhance_face(img)
     # Resize for SD (512x512)
     img_resized = img_enhanced.convert("RGB").resize((512, 512))
+    # Stylize with SD prompt. We are selecting these from UI now.
     #prompt = "highly detailed, digital portrait, professional lighting, cinematic style, artistic AI avatar"
     #prompt = "stylized yet realistic portrait, balanced lighting, subtle gradient background, sharp focus on face"
     #prompt = "studio portrait, even lighting, neutral background, realistic skin, confident pose"
+    #prompt = "realistic professional headshot, soft studio lighting, neutral background, crisp details, natural skin tone"
     with torch.autocast("cuda"):
+        result = sd_pipe(prompt=prompt, image=img_resized, strength=strength, guidance_scale=guidance_scale)
     avatar = result.images[0]
     gr.Markdown(
         """
         # 🎨 FaceForge AI
+        ### GPU-Accelerated Professional Headshot & Avatar Generator
+        Upload your photo and choose or customize how your AI avatar is generated.
         """
     )
+    # --- Define a mapping: Short Label -> Full Prompt Text ---
+    PROMPT_MAP = {
+        "🎬 Cinematic Portrait": "highly detailed, digital portrait, professional lighting, cinematic style, artistic AI avatar",
+        "🎨 Stylized Realism": "stylized yet realistic portrait, balanced lighting, subtle gradient background, sharp focus on face",
+        "🏢 Studio Professional": "studio portrait, even lighting, neutral background, realistic skin, confident pose",
+        "🤵 Natural Headshot": "realistic professional headshot, soft studio lighting, neutral background, crisp details, natural skin tone"
+    }
     with gr.Row():
+        with gr.Column(scale=1):
             input_image = gr.Image(type="pil", label="📷 Upload Your Photo")
+            gr.Markdown("### ⚙️ Avatar Generation Settings")
+            # Dropdown shows short labels only
+            preset_prompt = gr.Dropdown(
+                label="🎨 Choose Avatar Style Preset",
+                choices=list(PROMPT_MAP.keys()),
+                value="🤵 Natural Headshot"
+            )
+            # Optional custom prompt box for flexibility
+            custom_prompt = gr.Textbox(
+                label="✏️ Custom Prompt (optional)",
+                placeholder="Enter your own prompt or leave blank to use preset...",
+                lines=2
+            )
+            strength_slider = gr.Slider(
+                label="🎛️ Style Strength (0.0 = keep original, 1.0 = full restyle)",
+                minimum=0.1,
+                maximum=1.0,
+                value=0.45,
+                step=0.05
+            )
+            guidance_slider = gr.Slider(
+                label="🎯 Prompt Guidance Scale (higher = more prompt influence)",
+                minimum=1.0,
+                maximum=10.0,
+                value=5.5,
+                step=0.5
+            )
             process_btn = gr.Button("✨ Generate All Images", variant="primary", size="lg")
+        with gr.Column(scale=1):
             gr.Markdown("### Results")
+            output_headshot = gr.Image(label="💼 Professional Headshot", type="pil")
+            output_passport = gr.Image(label="🛂 Passport Photo", type="pil")
+            output_avatar = gr.Image(label="🎭 AI Avatar", type="pil")
+    # --- Updated process function mapping with label → full prompt translation ---
+    def process_all_with_params(img, preset_label, custom, strength, guidance):
+        # Map the selected label to its full prompt text
+        preset_prompt = PROMPT_MAP[preset_label]
+        # Use custom prompt if provided, otherwise fallback to preset
+        final_prompt = custom.strip() if custom and custom.strip() != "" else preset_prompt
+        headshot = create_headshot(img)
+        passport = create_passport(img)
+        avatar = create_avatar(img, final_prompt, strength, guidance)
+        return headshot, passport, avatar
     process_btn.click(
+        fn=process_all_with_params,
+        inputs=[input_image, preset_prompt, custom_prompt, strength_slider, guidance_slider],
         outputs=[output_headshot, output_passport, output_avatar]
     )
     gr.Markdown(
         """
         ---

app.py.orig DELETED Viewed

@@ -1,14 +0,0 @@
-import gradio as gr
-import spaces
-import torch
-zero = torch.Tensor([0]).cuda()
-print(zero.device) # <-- 'cpu' 🤔
-@spaces.GPU
-def greet(n):
-    print(zero.device) # <-- 'cuda:0' 🤗
-    return f"Hello {zero + n} Tensor"
-demo = gr.Interface(fn=greet, inputs=gr.Number(), outputs=gr.Text())
-demo.launch()

requirement.txt.bk DELETED Viewed

@@ -1,34 +0,0 @@
-# ---------- Core AI / Diffusion Stack ----------
-opencv-python-headless==4.9.0.80
-torch==2.2.1
-torchvision==0.17.1
-torchaudio==2.2.1
-diffusers==0.27.2
-transformers==4.39.0
-accelerate==0.28.0
-safetensors==0.4.2
-# ---------- Image Enhancement / Face Models ----------
-gfpgan==1.3.8
-realesrgan==0.3.0
-basicsr==1.4.2
-facexlib==0.3.0
-# ---------- Utility / Image Processing ----------
-opencv-python-headless==4.9.0.80
-rembg==2.0.57
-Pillow==10.2.0
-numpy==1.26.4
-torchvision==0.17.1
-torch==2.2.1
-torchaudio==2.2.1
-# ---------- Gradio / Hugging Face Runtime ----------
-gradio==4.39.0
-spaces==0.24.0
-huggingface-hub==0.24.0
-# ---------- Optional Stability / Safety ----------
-einops==0.7.0
-timm==0.9.12