pixagram-neo-backup

Runtime error

App Files Files Community

primerz committed on Nov 1

Commit

802a1b7

verified ·

1 Parent(s): a628de7

Update app.py

Browse files

Files changed (1) hide show

app.py +57 -63

app.py CHANGED Viewed

@@ -1,5 +1,6 @@
 """
 Pixagram AI Pixel Art Generator - Gradio Interface
 """
 import spaces
 import gradio as gr
@@ -10,7 +11,7 @@ from generator import RetroArtConverter
 # Initialize converter
-print("Initializing RetroArt Converter...")
 converter = RetroArtConverter()
@@ -98,16 +99,16 @@ def process_image(
         raise gr.Error(f"Generation failed: {str(e)}")
-# Build model status text
 def get_model_status():
     """Generate the model status Markdown shown in the UI.

     Reads ``converter.models_loaded`` from the module-level ``converter``
     and reports one bullet per component. Every flag is looked up with
     ``.get`` so that a key missing from the mapping is reported with that
     component's fallback label instead of raising ``KeyError``.

     Returns:
         str: Multi-line Markdown listing each component's state, or a
         placeholder message when ``converter.models_loaded`` is falsy.
     """
     loaded = converter.models_loaded
     if not loaded:
         return "**Model status unavailable**"

     # (label, flag key, text when truthy, text when falsy or missing)
     components = [
         ("Custom Checkpoint (Horizon)", "custom_checkpoint", "[OK] Loaded", "[OK] Using SDXL base"),
         ("LORA (RetroArt)", "lora", "[OK] Loaded", " Disabled"),
         ("InstantID", "instantid", "[OK] Loaded", " Disabled"),
         ("Zoe Depth", "zoe_depth", "[OK] Loaded", " Fallback"),
         ("IP-Adapter (Face Embeddings)", "ip_adapter", "[OK] Loaded", " Keypoints only"),
     ]
     lines = ["**[OK] Loaded Models:**\n"]
     lines.extend(
         f"- {label}: {on_text if loaded.get(key, False) else off_text}\n"
         for label, key, on_text, off_text in components
     )
     return "".join(lines)
@@ -169,22 +170,22 @@ with gr.Blocks(title="Pixagram - AI Pixel Art Generator", theme=gr.themes.Soft()
     # Model status
     gr.Markdown(get_model_status())
-    # Scheduler info
     scheduler_info = f"""
     **[CONFIG] Advanced Configuration:**
-    - Pipeline: **Img2Img** (structure preservation)
-    - Face System: **CLIP + InsightFace** (dual embeddings)
-    - **[ADVANCED] Enhanced Resampler:** 10 layers, 20 heads (+3-5% quality)
-    - **[ADVANCED] Adaptive Attention:** Context-aware scaling (+2-3% quality)
-    - **[ADVANCED] Multi-Scale Processing:** 3-scale face analysis (+1-2% quality)
-    - **[ADVANCED] Adaptive Parameters:** Auto-adjust for face quality (+2-3% consistency)
-    - **[ADVANCED] Face-Aware Color Matching:** LAB space with saturation preservation (+1-2% quality)
     - Scheduler: **LCM** (12 steps, fast generation)
     - Recommended CFG: **1.15-1.5** (optimized for LCM)
     - Identity Boost: **1.15x** (for maximum face fidelity)
     - CLIP Skip: **2** (enhanced style control)
     - LORA Trigger: `{TRIGGER_WORD}` (auto-added)
-    - **Total Improvement:** +10-15% over base = **96-99% face similarity**
     """
     gr.Markdown(scheduler_info)
@@ -205,43 +206,51 @@ with gr.Blocks(title="Pixagram - AI Pixel Art Generator", theme=gr.themes.Soft()
                 lines=2
             )
-            with gr.Accordion(f" LCM Settings", open=True):
-                # Preset selector
                 with gr.Row():
-                    gr.Markdown("### Quick Presets (Click to apply)")
                 with gr.Row():
-                    preset_btn_1 = gr.Button("Ultra\nFidelity", size="sm", variant="secondary")
-                    preset_btn_2 = gr.Button("Premium\nPortrait", size="sm", variant="primary")
-                    preset_btn_3 = gr.Button("Balanced\nPortrait [DEFAULT]", size="sm", variant="secondary")
-                    preset_btn_4 = gr.Button("Artistic\nExcellence", size="sm", variant="secondary")
-                    preset_btn_5 = gr.Button("Style\nFocus", size="sm", variant="secondary")
-                    preset_btn_6 = gr.Button("Subtle\nEnhancement", size="sm", variant="secondary")
                 preset_status = gr.Textbox(
-                    label="Current Configuration",
-                    value="Default: Balanced Portrait",
-                    interactive=False,
-                    lines=2
                 )
                 gr.Markdown("### Core Parameters")
-                steps = gr.Slider(
-                    minimum=4,
-                    maximum=50,
-                    value=DEFAULT_PARAMS['num_inference_steps'],
-                    step=1,
-                    label=f" Inference Steps (LCM optimized for 12)"
-                )
                 with gr.Row():
-                    guidance_scale = gr.Slider(
-                        minimum=0.5,
                         maximum=2.0,
-                        value=DEFAULT_PARAMS['guidance_scale'],
                         step=0.05,
-                        label="Guidance Scale (CFG)\nHigher = stronger adherence to prompt"
                     )
                     strength = gr.Slider(
@@ -280,14 +289,6 @@ with gr.Blocks(title="Pixagram - AI Pixel Art Generator", theme=gr.themes.Soft()
                     label="InstantID ControlNet Scale (facial keypoints structure)"
                 )
-                identity_preservation = gr.Slider(
-                    minimum=0.3,
-                    maximum=2.0,
-                    value=DEFAULT_PARAMS['identity_preservation'],
-                    step=0.05,
-                    label="Identity Preservation (IP-Adapter scale)\nHigher = stronger face preservation"
-                )
                 enable_color_matching = gr.Checkbox(
                     value=DEFAULT_PARAMS['enable_color_matching'],
                     label="[OPTIONAL] Enable Color Matching (gentle skin tone adjustment)",
@@ -328,17 +329,11 @@ with gr.Blocks(title="Pixagram - AI Pixel Art Generator", theme=gr.themes.Soft()
             gr.Markdown(f"""
             ### Tips for Maximum Quality Results:
-            **[OPTIMIZATIONS] Advanced Optimizations Active:**
-            - **Enhanced Resampler:** 10 layers, 20 heads (+3-5% quality)
-            - **Adaptive Attention:** Context-aware scaling (+2-3% quality)
-            - **Multi-Scale Processing:** 3-scale face analysis (+1-2% quality)
-            - **Adaptive Parameters:** Auto-adjust based on face quality (+2-3% consistency)
-            - **Enhanced Color Matching:** Face-aware LAB color space (+1-2% quality)
-            **Expected Quality:**
-            - Base system: 90-93% face similarity
-            - With optimizations: 96-99% face similarity
-            - Ultra Fidelity preset: 97-99%+ face similarity
             **[PRESETS] Optimized Preset Guide:**
             - **Ultra Fidelity:** 96-98% similarity, minimal transformation
@@ -359,7 +354,7 @@ with gr.Blocks(title="Pixagram - AI Pixel Art Generator", theme=gr.themes.Soft()
               - `0.38-0.45`: Maximum fidelity (Ultra/Subtle presets)
               - `0.48-0.55`: Balanced quality (Premium/Balanced presets)
               - `0.58-0.68`: Artistic freedom (Artistic/Style presets)
-            - **Identity Preservation**: Face embedding strength (auto-boosted 1.15x)
             - **Guidance Scale (CFG)**: LCM-optimized range 1.1-1.5
             - **LORA Scale**: Pixel art intensity (inverse to identity)
@@ -383,10 +378,9 @@ with gr.Blocks(title="Pixagram - AI Pixel Art Generator", theme=gr.themes.Soft()
             6. Fix seed for consistent testing
             **[TECHNICAL] System Details:**
-            - Enhanced Resampler: 10 layers, 20 heads, 1280 dim
-            - Attention: Adaptive per-layer scaling
-            - Face Processing: Multi-scale (0.75x, 1x, 1.25x)
-            - Color Matching: LAB space, face-aware masking
             - Resolution: Auto-optimized to 896x1152 or 832x1216
             """)
@@ -452,4 +446,4 @@ if __name__ == "__main__":
         server_port=7860,
         share=True,
         show_api=True
-    )

 """
 Pixagram AI Pixel Art Generator - Gradio Interface
+UPDATED VERSION with InstantID pipeline status
 """
 import spaces
 import gradio as gr
 # Initialize converter
+print("Initializing RetroArt Converter with InstantID...")
 converter = RetroArtConverter()
         raise gr.Error(f"Generation failed: {str(e)}")
+# UPDATED: Build model status text with InstantID info
 def get_model_status():
     """Generate the model status Markdown shown in the UI.

     Reads ``converter.models_loaded`` from the module-level ``converter``
     and reports one bullet per component, followed by a fixed line
     stating that the IP-Adapter is built into the InstantID pipeline.
     Flags are looked up with ``.get`` so that a key missing from the
     mapping is reported with that component's fallback label instead of
     raising ``KeyError``.

     Returns:
         str: Multi-line Markdown listing each component's state, or a
         placeholder message when ``converter.models_loaded`` is falsy.
     """
     loaded = converter.models_loaded
     if not loaded:
         return "**Model status unavailable**"

     # (label, flag key, text when truthy, text when falsy or missing)
     components = [
         ("Custom Checkpoint (Horizon)", "custom_checkpoint", "[OK] Loaded", "[OK] Using SDXL base"),
         ("LORA (RetroArt)", "lora", "[OK] Loaded", " Disabled"),
         ("InstantID Pipeline", "instantid", "[OK] Loaded with Face + Depth", " Disabled"),
         ("Zoe Depth", "zoe_depth", "[OK] Loaded", " Fallback"),
     ]
     lines = ["**[OK] Loaded Models:**\n"]
     lines.extend(
         f"- {label}: {on_text if loaded.get(key, False) else off_text}\n"
         for label, key, on_text, off_text in components
     )
     # Not driven by a flag: this line is emitted unconditionally.
     lines.append("- IP-Adapter: [OK] Built into InstantID pipeline\n")
     return "".join(lines)
     # Model status
     gr.Markdown(get_model_status())
+    # UPDATED: Scheduler info with InstantID details
     scheduler_info = f"""
     **[CONFIG] Advanced Configuration:**
+    - Pipeline: **InstantID Img2Img** (native face preservation)
+    - Face System: **InstantID + InsightFace** (512D embeddings)
+    - **[INSTANTID] Built-in Resampler:** 8 layers, 16 heads (official)
+    - **[INSTANTID] IP-Adapter:** Native attention processors
+    - **[INSTANTID] Dual ControlNets:** Face keypoints + Depth
+    - **[ADVANCED] Adaptive Parameters:** Auto-adjust for face quality
+    - **[ADVANCED] Face-Aware Color Matching:** LAB space with saturation preservation
     - Scheduler: **LCM** (12 steps, fast generation)
     - Recommended CFG: **1.15-1.5** (optimized for LCM)
     - Identity Boost: **1.15x** (for maximum face fidelity)
     - CLIP Skip: **2** (enhanced style control)
     - LORA Trigger: `{TRIGGER_WORD}` (auto-added)
+    - **Expected Quality:** 95-98% face similarity
     """
     gr.Markdown(scheduler_info)
                 lines=2
             )
+            with gr.Accordion(" Presets", open=True):
                 with gr.Row():
+                    preset_btn_1 = gr.Button("Ultra Fidelity (96-98%)", variant="secondary", size="sm")
+                    preset_btn_2 = gr.Button("Premium Portrait", variant="primary", size="sm")
+                    preset_btn_3 = gr.Button("Balanced Portrait", variant="secondary", size="sm")
                 with gr.Row():
+                    preset_btn_4 = gr.Button("Artistic Excellence", variant="secondary", size="sm")
+                    preset_btn_5 = gr.Button("Style Focus", variant="secondary", size="sm")
+                    preset_btn_6 = gr.Button("Subtle Enhancement", variant="secondary", size="sm")
                 preset_status = gr.Textbox(
+                    label="",
+                    value="Select a preset above or adjust parameters manually",
+                    lines=2,
+                    interactive=False
                 )
+            with gr.Accordion(" Generation Parameters", open=True):
+                with gr.Row():
+                    steps = gr.Slider(
+                        minimum=4,
+                        maximum=25,
+                        value=DEFAULT_PARAMS['num_inference_steps'],
+                        step=1,
+                        label="Inference Steps\nLCM works best at 8-14 steps"
+                    )
+                    guidance_scale = gr.Slider(
+                        minimum=1.0,
+                        maximum=2.0,
+                        value=DEFAULT_PARAMS['guidance_scale'],
+                        step=0.05,
+                        label="Guidance Scale (CFG)\nLower for LCM (1.1-1.5)"
+                    )
                 gr.Markdown("### Core Parameters")
                 with gr.Row():
+                    identity_preservation = gr.Slider(
+                        minimum=0.3,
                         maximum=2.0,
+                        value=DEFAULT_PARAMS['identity_preservation'],
                         step=0.05,
+                        label="Identity Preservation (IP-Adapter)\nHigher = stronger face"
                     )
                     strength = gr.Slider(
                     label="InstantID ControlNet Scale (facial keypoints structure)"
                 )
                 enable_color_matching = gr.Checkbox(
                     value=DEFAULT_PARAMS['enable_color_matching'],
                     label="[OPTIONAL] Enable Color Matching (gentle skin tone adjustment)",
             gr.Markdown(f"""
             ### Tips for Maximum Quality Results:
+            **[INSTANTID] InstantID Pipeline Active:**
+            - Built-in Resampler: 8 layers, 16 query tokens
+            - IP-Adapter: Native face preservation
+            - Dual ControlNets: Keypoints + Depth
+            - Expected quality: 95-98% face similarity
             **[PRESETS] Optimized Preset Guide:**
             - **Ultra Fidelity:** 96-98% similarity, minimal transformation
               - `0.38-0.45`: Maximum fidelity (Ultra/Subtle presets)
               - `0.48-0.55`: Balanced quality (Premium/Balanced presets)
               - `0.58-0.68`: Artistic freedom (Artistic/Style presets)
+            - **Identity Preservation**: IP-Adapter face embedding strength (auto-boosted 1.15x)
             - **Guidance Scale (CFG)**: LCM-optimized range 1.1-1.5
             - **LORA Scale**: Pixel art intensity (inverse to identity)
             6. Fix seed for consistent testing
             **[TECHNICAL] System Details:**
+            - InstantID Pipeline: Official implementation
+            - Face embeddings: InsightFace 512D → 16×2048D tokens
+            - ControlNets: Dual (Identity + Depth)
             - Resolution: Auto-optimized to 896x1152 or 832x1216
             """)
         server_port=7860,
         share=True,
         show_api=True
+    )