Spaces:

00Boobs00
/

anycoder-2fc97463

Sleeping

App Files Files Community

00Boobs00 committed on Jan 17

Commit

aab6df4

verified ·

1 Parent(s): 6bc490c

Upload folder using huggingface_hub

Browse files

Files changed (2) hide show

app.py +331 -0
requirements.txt +4 -0

app.py ADDED Viewed

	@@ -0,0 +1,331 @@

+import gradio as gr
+from typing import Optional, List, Dict, Any
+import numpy as np
+import time
+from utils import WANVideoGenerator, LoRAManager, NSFWChecker
+from config import MODEL_CONFIGS, AVAILABLE_LORAS, NSFW_CONFIG
+# Initialize core components once at module level; generate_video() below
+# uses these shared instances (generator, lora_manager, nsfw_checker).
+generator = WANVideoGenerator()
+lora_manager = LoRAManager()
+nsfw_checker = NSFWChecker()
+def generate_video(
+    image: np.ndarray,
+    prompt: str,
+    selected_model: str,
+    enabled_loras: List[str],
+    enable_nsfw: bool,
+    video_length: int,
+    resolution: str,
+    progress=gr.Progress()
+) -> tuple[str, str, Dict[str, Any]]:
+    """
+    Main video generation function with WAN-scale processing
+    Args:
+        image: Input image as numpy array
+        prompt: Optional text prompt for video generation
+        selected_model: Selected WAN model variant
+        enabled_loras: List of active LoRA adapters
+        enable_nsfw: Whether to allow NSFW content generation
+        video_length: Target video length in frames
+        resolution: Output resolution preset
+        progress: Gradio progress tracker
+    Returns:
+        Tuple of (video_path, status_message, generation_metadata)
+    """
+    try:
+        # Step 1: Validate inputs
+        progress(0.1, desc="🔍 Validating inputs...")
+        if image is None:
+            raise gr.Error("No image provided. Please upload an image to generate video.")
+        # Step 2: NSFW check if enabled
+        if enable_nsfw and NSFW_CONFIG["require_confirmation"]:
+            progress(0.15, desc="⚠️ NSFW mode active - bypassing standard filters")
+        elif not enable_nsfw:
+            progress(0.15, desc="🛡️ Running safety checks...")
+            if nsfw_checker.check_image(image):
+                raise gr.Error("Input image flagged by safety filter. Enable NSFW mode to bypass.")
+        # Step 3: Load selected model and LoRAs
+        progress(0.2, desc=f"📦 Loading {selected_model} model...")
+        generator.load_model(selected_model)
+        progress(0.3, desc=f"🔌 Activating {len(enabled_loras)} LoRA adapters...")
+        active_loras = lora_manager.load_loras(enabled_loras)
+        # Step 4: Generate video frames
+        progress(0.4, desc="🎬 Generating video frames...")
+        frames = []
+        for i in range(video_length):
+            progress(0.4 + (i / video_length) * 0.5,
+                    desc=f"Rendering frame {i+1}/{video_length}...")
+            frame = generator.generate_frame(
+                image=image,
+                prompt=prompt,
+                frame_index=i,
+                total_frames=video_length,
+                active_loras=active_loras
+            )
+            frames.append(frame)
+            time.sleep(0.1)  # Simulate processing time
+        # Step 5: Compile video
+        progress(0.95, desc="🎥 Compiling final video...")
+        output_path = generator.compile_video(
+            frames=frames,
+            resolution=resolution,
+            fps=30
+        )
+        # Step 6: Prepare metadata
+        metadata = {
+            "model": selected_model,
+            "loras": enabled_loras,
+            "nsfw_mode": enable_nsfw,
+            "resolution": resolution,
+            "frames": video_length,
+            "prompt": prompt or "No prompt provided",
+            "status": "✅ Generation complete"
+        }
+        progress(1.0, desc="✅ Done!")
+        return output_path, "Video generated successfully!", metadata
+    except Exception as e:
+        raise gr.Error(f"Generation failed: {str(e)}")
+def update_lora_visibility(enable_nsfw: bool) -> Dict[str, Any]:
+    """Update LoRA options based on NSFW mode"""
+    if enable_nsfw:
+        return gr.Dropdown(
+            choices=list(AVAILABLE_LORAS.keys()),
+            value=[],
+            multiselect=True,
+            label="🎨 Active LoRA Adapters (NSFW options unlocked)"
+        )
+    else:
+        safe_loras = {k: v for k, v in AVAILABLE_LORAS.items() if not v.get("nsfw", False)}
+        return gr.Dropdown(
+            choices=list(safe_loras.keys()),
+            value=[],
+            multiselect=True,
+            label="🎨 Active LoRA Adapters (Safe mode)"
+        )
+def create_interface():
+    """Create the main Gradio interface.
+
+    Builds a ``gr.Blocks`` app with a left sidebar of generation settings and
+    a main column holding the image input, prompt box, action buttons, status
+    text, output video and metadata viewer, then registers the event handlers.
+
+    Returns:
+        The constructed ``gr.Blocks`` instance; launching is left to the caller.
+    """
+    with gr.Blocks() as demo:
+        gr.HTML("""
+        <div style='text-align: center; padding: 20px;'>
+            <h1>🥊 WAN-Scale Image-to-Video Architecture 🥊</h1>
+            <p>Built with anycoder - <a href='https://huggingface.co/spaces/akhaliq/anycoder' target='_blank'>View on Hugging Face</a></p>
+            <p style='font-size: 1.2em; color: #666;'>Turn static images into dynamic videos with WAN foundation models</p>
+        </div>
+        """)
+        # Global state
+        # NOTE(review): generation_state is not passed to any handler below.
+        generation_state = gr.State({"session_id": None})
+        with gr.Row():
+            # Sidebar for controls
+            with gr.Sidebar(position="left", width=320):
+                gr.Markdown("### ⚙️ Generation Settings")
+                # NOTE(review): the default value is hard-coded; confirm it is
+                # one of the MODEL_CONFIGS keys.
+                model_selector = gr.Dropdown(
+                    choices=list(MODEL_CONFIGS.keys()),
+                    value="wan-2.1-14b",
+                    label="🤖 WAN Model",
+                    info="Select foundation model variant"
+                )
+                nsfw_toggle = gr.Checkbox(
+                    value=False,
+                    label="🔞 Enable NSFW Content",
+                    info="Bypass safety filters (requires confirmation)"
+                )
+                # Starts with only the adapters not flagged "nsfw", matching
+                # the unchecked default of nsfw_toggle.
+                lora_selector = gr.Dropdown(
+                    choices=[k for k, v in AVAILABLE_LORAS.items() if not v.get("nsfw", False)],
+                    value=[],
+                    multiselect=True,
+                    label="🎨 Active LoRA Adapters",
+                    info="Select style and domain adapters"
+                )
+                with gr.Accordion("📐 Video Settings", open=False):
+                    video_length = gr.Slider(
+                        minimum=16,
+                        maximum=128,
+                        value=32,
+                        step=8,
+                        label="Video Length (frames)"
+                    )
+                    resolution = gr.Radio(
+                        choices=["512x512", "768x768", "1024x576", "1920x1080"],
+                        value="768x768",
+                        label="Resolution"
+                    )
+                # NOTE(review): inference_steps and cfg_scale are not listed in
+                # generate_btn's inputs, so their values never reach
+                # generate_video.
+                with gr.Accordion("🚀 Advanced Options", open=False):
+                    inference_steps = gr.Slider(
+                        minimum=10,
+                        maximum=100,
+                        value=50,
+                        label="Inference Steps"
+                    )
+                    cfg_scale = gr.Slider(
+                        minimum=1.0,
+                        maximum=20.0,
+                        value=7.5,
+                        step=0.5,
+                        label="CFG Scale"
+                    )
+                # Status indicators
+                # The values shown here are literal strings set in this file.
+                model_status = gr.Label(
+                    value={"Status": "Ready", "VRAM": "24GB Available"},
+                    label="System Status"
+                )
+            # Main content area
+            with gr.Column():
+                gr.Markdown("### 📤 Input Image")
+                input_image = gr.Image(
+                    label="Upload Starting Frame",
+                    type="numpy",
+                    height=400,
+                    sources=["upload", "webcam", "clipboard"]
+                )
+                gr.Markdown("### 📝 Optional Text Prompt")
+                prompt_box = gr.Textbox(
+                    placeholder="Describe the motion, style, or scene...",
+                    label="Prompt (optional)",
+                    lines=2,
+                    max_lines=4
+                )
+                with gr.Row():
+                    generate_btn = gr.Button(
+                        "🎬 Generate Video",
+                        variant="primary",
+                        scale=2
+                    )
+                    clear_btn = gr.ClearButton(
+                        components=[input_image, prompt_box],
+                        value="🗑️ Clear"
+                    )
+                # Progress tracking
+                # NOTE(review): progress_bar is not referenced again in this
+                # function; generate_video takes its tracker from its own
+                # default argument.
+                progress_bar = gr.Progress()
+                status_text = gr.Textbox(
+                    label="Status",
+                    interactive=False,
+                    show_copy_button=True
+                )
+                gr.Markdown("### 📼 Output Video")
+                output_video = gr.Video(
+                    label="Generated Video",
+                    height=400,
+                    autoplay=True,
+                    show_download_button=True
+                )
+                # Generation metadata
+                with gr.Accordion("📊 Generation Details", open=False):
+                    metadata_json = gr.JSON(
+                        label="Metadata",
+                        open=False
+                    )
+        # Event handlers
+        # Rebuild the LoRA dropdown whenever the NSFW checkbox changes.
+        nsfw_toggle.change(
+            fn=update_lora_visibility,
+            inputs=nsfw_toggle,
+            outputs=lora_selector,
+            api_visibility="private"
+        )
+        # The order of inputs matches generate_video's positional parameters;
+        # the three outputs match its returned (path, status, metadata) tuple.
+        generate_btn.click(
+            fn=generate_video,
+            inputs=[
+                input_image,
+                prompt_box,
+                model_selector,
+                lora_selector,
+                nsfw_toggle,
+                video_length,
+                resolution
+            ],
+            outputs=[
+                output_video,
+                status_text,
+                metadata_json
+            ],
+            api_visibility="public",
+            concurrency_limit=2  # Limit concurrent generations
+        )
+        # Update model status on selection
+        # This only rewrites the label text; the lambda does not call the generator.
+        model_selector.change(
+            fn=lambda x: {"Status": f"Loaded {x}", "VRAM": "24GB Used"},
+            inputs=model_selector,
+            outputs=model_status,
+            api_visibility="private"
+        )
+        # Demo load event
+        demo.load(
+            fn=lambda: "System initialized and ready",
+            outputs=status_text,
+            api_visibility="private"
+        )
+    return demo
+# Create and launch the application
+if __name__ == "__main__":
+    demo = create_interface()
+    demo.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        share=False,
+        debug=False,
+        show_error=True,
+        max_threads=4,
+        theme=gr.themes.Soft(
+            primary_hue="purple",
+            secondary_hue="indigo",
+            neutral_hue="slate",
+            font=gr.themes.GoogleFont("Inter"),
+            text_size="lg",
+            spacing_size="lg",
+            radius_size="md"
+        ).set(
+            button_primary_background_fill="*primary_600",
+            button_primary_background_fill_hover="*primary_700",
+            block_title_text_weight="600",
+            block_background_fill="*neutral_50"
+        ),
+        footer_links=[
+            {"label": "Built with anycoder", "url": "https://huggingface.co/spaces/akhaliq/anycoder"},
+            {"label": "Model Docs", "url": "https://huggingface.co/docs"},
+            {"label": "API Reference", "url": "/docs"}
+        ],
+        css="""
+        .gradio-container { max-width: 1400px; margin: auto; }
+        .contain { display: flex; flex-direction: column; height: 100vh; }
+        #component-0 { height: 100%; }
+        .gr-button { font-weight: 600; }
+        .gr-markdown { text-align: center; }
+        """
+    )

requirements.txt ADDED Viewed

	@@ -0,0 +1,4 @@

+# NOTE(review): app.py imports WANVideoGenerator/LoRAManager/NSFWChecker from `utils` and MODEL_CONFIGS/AVAILABLE_LORAS/NSFW_CONFIG from `config`; confirm whether these are local modules rather than the PyPI packages named below.
+config
+gradio
+numpy
+utils