ltx-2-TURBO

Running on Zero

App Files Files Community

Opera8 committed on Feb 21

Commit

e9ca807

verified ·

1 Parent(s): 7de629a

Update app.py

Browse files

Files changed (1) hide show

app.py +111 -400

app.py CHANGED Viewed

@@ -2319,7 +2319,7 @@ def apply_example(idx: str):
 ####################################################################################################
-### PART 20: Gradio UI Layout & Launch
 ####################################################################################################
 # JS Function to handle download request via PostMessage
@@ -2329,30 +2329,11 @@ async (video) => {
         alert("لطفاً ابتدا ویدیو را تولید کنید.");
         return;
     }
-    // Gradio Video component passes an object or string
-    let fileUrl = "";
-    if (typeof video === 'string') {
-        fileUrl = video;
-    } else if (video && video.url) {
-        fileUrl = video.url;
-    } else if (video && video.path) {
-        fileUrl = video.path;
-    }
-    // Fix relative paths to absolute URLs for the parent iframe
     if (fileUrl && !fileUrl.startsWith('http')) {
-        // Remove leading slash if exists to prevent double slash with origin
         let cleanPath = fileUrl.startsWith('/') ? fileUrl.substring(1) : fileUrl;
-        // Check if it's already a file route
-        if (cleanPath.startsWith('file=')) {
-             fileUrl = window.location.origin + "/" + cleanPath;
-        } else {
-             fileUrl = window.location.origin + "/file=" + cleanPath;
-        }
     }
     if (fileUrl) {
         console.log("Sending download request for:", fileUrl);
         window.parent.postMessage({ type: 'DOWNLOAD_REQUEST', url: fileUrl }, '*');
@@ -2360,125 +2341,75 @@ async (video) => {
 }
 """
-# این تابع جاوااسکریپت جدید برای بهینه سازی پرامپت است
-# این کد در مرورگر کاربر اجرا می شود
-js_enhancer_and_trigger = """
 async (firstFrame, promptText, mode) => {
-    // گرفتن دکمه ها و جعبه متن از طریق DOM
-    const enhancerBtn = document.querySelector("#enhancer_btn button");
-    const realGenerateBtn = document.querySelector("#real_generate_btn button");
-    const promptTextarea = document.querySelector("#prompt_ui textarea");
-    // اگر حالت انتخابی نیازی به بهینه سازی ندارد، مستقیما ویدیو را بساز
     if (mode !== 'تبدیل تصویر به ویدیو' && mode !== 'تکمیل فریم‌های میانی') {
-        realGenerateBtn.click();
-        return [firstFrame, promptText, mode]; // بازگشت مقادیر بدون تغییر
     }
     // API بهینه ساز به تصویر نیاز دارد
     if (!firstFrame) {
-        alert("برای بهینه سازی پرامپت، لطفاً ابتدا یک تصویر در قسمت 'تصویر اول' آپلود کنید.");
-        return [firstFrame, promptText, mode];
     }
-    const originalButtonText = enhancerBtn.textContent;
-    enhancerBtn.disabled = true;
-    enhancerBtn.textContent = "⏳ در حال بهینه سازی پرامپت...";
     try {
-        // داده های تصویر را از URL آن دریافت می کنیم
         const response = await fetch(firstFrame.url);
         const imageBlob = await response.blob();
-        // آماده سازی FormData برای ارسال به API
         const formData = new FormData();
-        // نام فایل را برای سازگاری با API تنظیم می کنیم
         const imageFile = new File([imageBlob], "image.jpg", { type: "image/jpeg" });
         formData.append('image', imageFile);
         formData.append('prompt', promptText);
         formData.append('is_extension', 'false');
-        // ارسال درخواست به API بهینه ساز
         const apiResponse = await fetch('https://ezmarynoori-vidtolani.hf.space/api/enhance-animation-prompt', {
             method: 'POST',
             body: formData
         });
-        const data = await apiResponse.json();
         if (!apiResponse.ok) {
-            throw new Error(data.error || 'خطا در بهینه سازی پرامپت از سمت سرور.');
         }
-        const enhancedPrompt = data.animation_prompt;
-        console.log("Original Prompt:", promptText);
-        console.log("Enhanced Prompt:", enhancedPrompt);
-        // پرامپت جدید را در جعبه متن قرار می دهیم
-        promptTextarea.value = enhancedPrompt;
-        // یک رویداد input ایجاد می کنیم تا Gradio متوجه تغییر شود
-        promptTextarea.dispatchEvent(new Event('input', { bubbles: true }));
-        // حالا دکمه پنهان ساخت ویدیو را کلیک می کنیم
-        realGenerateBtn.click();
     } catch (error) {
-        console.error("Enhancement Error:", error);
-        alert(`خطایی در بهینه سازی پرامپت رخ داد: ${error.message}`);
-    } finally {
-        // دکمه را به حالت اولیه برمی گردانیم
-        enhancerBtn.disabled = false;
-        enhancerBtn.textContent = originalButtonText;
     }
-    // مقادیر ورودی را برمیگردانیم تا زنجیره گرادیو قطع نشود
-    // گرچه پرامپت اصلی دیگر استفاده نمی شود چون ما آن را مستقیما در DOM تغییر دادیم
-    return [firstFrame, promptText, mode];
 }
 """
 def apply_example(idx: str):
     idx = int(idx)
-    # Read the example row from your list
     img, prompt_txt, cam, res, mode, vid, aud, end_img = examples_list[idx]
-    img_path = img if img else None
-    vid_path = vid if vid else None
-    aud_path = aud if aud else None
-    input_image_update = img_path
-    prompt_update = prompt_txt
-    camera_update = cam
-    resolution_update = res
-    mode_update = mode
-    video_update = gr.update(value=vid_path, visible=(mode == "Motion Control"))
-    audio_update = aud_path
-    end_image = end_img
-    # Clear the output video AND Hide download button when loading a new example
-    output_video_update = gr.update(value=None)
-    download_btn_update = gr.update(visible=False)
     return (
-        input_image_update,
-        prompt_update,
-        camera_update,
-        resolution_update,
-        mode_update,
-        video_update,
-        audio_update,
-        audio_update,
-        end_image,
-        output_video_update,
-        download_btn_update
     )
 with gr.Blocks(title="LTX-2 Video Distilled 🎥🔈") as demo:
-    # Updated Header to Persian
     gr.HTML(
         """
         <div style="text-align: center; padding: 20px;">
@@ -2492,9 +2423,12 @@ with gr.Blocks(title="LTX-2 Video Distilled 🎥🔈") as demo:
         """
     )
     with gr.Column(elem_id="col-container"):
         with gr.Row(elem_id="mode-row"):
-            # Updated choices to Persian
             radioanimated_mode = RadioAnimated(
                 choices=["تبدیل تصویر به ویدیو", "تکمیل فریم‌های میانی"],
                 value="تبدیل تصویر به ویدیو",
@@ -2502,335 +2436,134 @@ with gr.Blocks(title="LTX-2 Video Distilled 🎥🔈") as demo:
             )
         with gr.Row():
             with gr.Column(elem_id="step-column"):
                 with gr.Row():
                     first_frame = gr.Image(
                         label="تصویر اول (برای بهینه‌سازی پرامپت الزامی است)",
                         type="filepath",
                         height=256
                     )
                     end_frame = gr.Image(
                         label="تصویر آخر (اختیاری)",
                         type="filepath",
                         height=256,
                         visible=False,
                     )
-                    # input_video is defined but hidden
-                    input_video = gr.Video(
-                        label="Motion Reference Video",
-                        height=256,
-                        visible=False,
-                    )
-                relocate = gr.HTML(
-                    value="",
-                    html_template="<div></div>",
-                    js_on_load=r"""
                 (() => {
                   function moveIntoFooter() {
-                    const promptRoot = document.querySelector("#prompt_ui");
-                    if (!promptRoot) return false;
-                    const footer = promptRoot.querySelector(".ds-footer");
-                    if (!footer) return false;
                     const dur = document.querySelector("#duration_ui .cd-wrap");
                     const res = document.querySelector("#resolution_ui .cd-wrap");
                     const cam = document.querySelector("#camera_ui .cd-wrap");
                     if (!dur || !res || !cam) return false;
-                    footer.appendChild(dur);
-                    footer.appendChild(res);
-                    footer.appendChild(cam);
                     return true;
                   }
-                  const tick = () => {
-                    if (!moveIntoFooter()) requestAnimationFrame(tick);
-                  };
                   requestAnimationFrame(tick);
                 })();
-                """
-                )
-                prompt_ui = PromptBox(
-                    value="این تصویر را با حرکت سینمایی و انیمیشن روان زنده کن",
-                    elem_id="prompt_ui",
-                )
-                # Hidden real audio input (backend value)
-                audio_input = gr.File(
-                    label="Audio (Optional)",
-                    file_types=["audio"],
-                    type="filepath",
-                    elem_id="audio_input_hidden",
-                )
-                # Custom UI that feeds the hidden gr.Audio above
-                audio_ui = AudioDropUpload(
-                    target_audio_elem_id="audio_input_hidden",
-                    elem_id="audio_ui",
-                )
-                prompt = gr.Textbox(
-                    label="Prompt",
-                    value="این تصویر را با حرکت سینمایی و انیمیشن روان زنده کن",
-                    lines=3,
-                    max_lines=3,
-                    placeholder="حرکت و انیمیشن مورد نظر خود را توصیف کنید...",
-                    visible=False
-                )
-                enhance_prompt = gr.Checkbox(
-                        label="Enhance Prompt",
-                        value=True,
-                        visible=False
-                    )
                 with gr.Accordion("تنظیمات پیشرفته", open=False, visible=False):
-                    seed = gr.Slider(
-                        label="سید (Seed)",
-                        minimum=0,
-                        maximum=MAX_SEED,
-                        value=DEFAULT_SEED,
-                        step=1
-                    )
                     randomize_seed = gr.Checkbox(label="استفاده از سید تصادفی", value=True)
             with gr.Column(elem_id="step-column"):
                 output_video = gr.Video(label="ویدیوی ساخته شده", autoplay=True, height=512)
                 with gr.Row():
-                    download_btn = gr.Button(
-                        "📥 دانلود ویدیو",
-                        variant="secondary",
-                        size="sm",
-                        scale=0,
-                        visible=False
-                    )
                 with gr.Row(elem_id="controls-row"):
-                        duration_ui = CameraDropdown(
-                            choices=["3s", "5s", "10s"],
-                            value="5s",
-                            title="مدت زمان ویدیو",
-                            elem_id="duration_ui"
-                        )
-                        duration = gr.Slider(
-                            label="Duration (seconds)",
-                            minimum=1.0,
-                            maximum=10.0,
-                            value=5.0,
-                            step=0.1,
-                            visible=False
-                        )
-                        ICON_16_9 = """<svg viewBox="0 0 24 24" fill="none" aria-hidden="true">
-                          <rect x="3" y="7" width="18" height="10" rx="2" stroke="currentColor" stroke-width="2"/>
-                        </svg>"""
-                        ICON_1_1 = """<svg viewBox="0 0 24 24" fill="none" aria-hidden="true">
-                          <rect x="6" y="6" width="12" height="12" rx="2" stroke="currentColor" stroke-width="2"/>
-                        </svg>"""
-                        ICON_9_16 = """<svg viewBox="0 0 24 24" fill="none" aria-hidden="true">
-                          <rect x="7" y="3" width="10" height="18" rx="2" stroke="currentColor" stroke-width="2"/>
-                        </svg>"""
                         resolution_ui = CameraDropdown(
-                            choices=[
-                                {"label": "16:9", "value": "16:9", "icon": ICON_16_9},
-                                {"label": "1:1",  "value": "1:1",  "icon": ICON_1_1},
-                                {"label": "9:16", "value": "9:16", "icon": ICON_9_16},
-                            ],
-                            value="16:9",
-                            title="ابعاد تصویر",
-                            elem_id="resolution_ui"
                         )
                         width = gr.Number(label="Width", value=DEFAULT_1_STAGE_WIDTH, precision=0, visible=False)
                         height = gr.Number(label="Height", value=DEFAULT_1_STAGE_HEIGHT, precision=0, visible=False)
-                        camera_ui = CameraDropdown(
-                            choices=[name for name, _ in VISIBLE_RUNTIME_LORA_CHOICES],
-                            value="No LoRA",
-                            title="افکت دوربین (LoRA)",
-                            elem_id="camera_ui",
-                        )
-                        # Hidden real dropdown (backend value)
-                        camera_lora = gr.Dropdown(
-                            label="Camera Control LoRA",
-                            choices=[name for name, _ in VISIBLE_RUNTIME_LORA_CHOICES],
-                            value="No LoRA",
-                            visible=False
-                        )
-                # دکمه اصلی که کاربر می بیند و فرآیند بهینه سازی را شروع می کند
-                enhancer_btn = gr.Button("🤩 ساخت ویدیو", variant="primary", elem_classes="button-gradient", elem_id="enhancer_btn")
-                # دکمه پنهان که پس از بهینه سازی توسط جاوااسکریپت کلیک می شود
-                real_generate_btn = gr.Button("Hidden Generate", visible=False, elem_id="real_generate_btn")
-    camera_ui.change(
-        fn=lambda x: x,
-        inputs=camera_ui,
-        outputs=camera_lora,
-        api_visibility="private"
-    )
-    radioanimated_mode.change(
-    fn=on_mode_change,
-        inputs=radioanimated_mode,
-        outputs=[input_video, end_frame],
-        api_visibility="private",
-    )
-    duration_ui.change(
-        fn=apply_duration,
-        inputs=duration_ui,
-        outputs=[duration],
-        api_visibility="private"
-    )
-    resolution_ui.change(
-        fn=apply_resolution,
-        inputs=resolution_ui,
-        outputs=[width, height],
-        api_visibility="private"
-    )
-    prompt_ui.change(
-        fn=lambda x: x,
-        inputs=prompt_ui,
-        outputs=prompt,
-        api_visibility="private"
-    )
-    # مرحله 1: دکمه قابل مشاهده، جاوا اسکریپت بهینه ساز را اجرا می کند
-    enhancer_btn.click(
-        fn=None, # هیچ تابع پایتونی اجرا نمی شود
-        inputs=[first_frame, prompt, radioanimated_mode],
-        js=js_enhancer_and_trigger # فقط جاوااسکریپت اجرا می شود
-    )
-    # مرحله 2: دکمه پنهان، تابع اصلی ساخت ویدیو در پایتون را اجرا می کند
-    real_generate_btn.click(
         fn=generate_video,
         inputs=[
-            first_frame,
-            end_frame,
-            prompt, # این prompt حالا توسط جاوااسکریپت بهینه شده است
-            duration,
-            input_video,
-            radioanimated_mode,
-            enhance_prompt, # این گزینه دیگر استفاده نمی شود چون بهینه سازی سمت مرورگر است
-            seed,
-            randomize_seed,
-            height,
-            width,
-            camera_lora,
-            audio_input
         ],
         outputs=[output_video]
-    ).then(
-        fn=lambda: gr.update(visible=True), # بعد از اتمام ساخت، دکمه دانلود ظاهر می شود
         outputs=[download_btn]
     )
-    # اتصال دکمه دانلود به جاوا اسکریپت
-    download_btn.click(
-        fn=None,
-        inputs=[output_video],
-        js=js_download_video
-    )
-    # Updated Examples to use Persian modes
     examples_list = [
-        [
-            "examples/supergirl-2.png",
-            "A fuzzy puppet superhero character resembling a female puppet with blonde hair and a blue superhero suit sleeping in bed and just waking up, she gradually gets up, rubbing her eyes and looking at her dog that just popped on the bed. the scene feels chaotic, comedic, and emotional with expressive puppet reactions, cinematic lighting, smooth camera motion, shallow depth of field, and high-quality puppet-style animation",
-            "Static",
-            "16:9",
-            "تبدیل تصویر به ویدیو",
-            None,
-            "examples/supergirl.m4a",
-            None,
-        ],
-        [
-            "examples/frame3.png",
-            "a woman in a white dress standing in a supermarket, looking at a stack of pomegranates, she picks one and takes a bite, the camera zooms in to a close up of the pomegranate seeds. A calm music is playing in the supermarket and you can hear her taking a bite.",
-            "Zoom In",
-            "16:9",
-            "تکمیل فریم‌های میانی",
-            None,
-            None,
-            "examples/frame4.png",
-        ],
-        [
-            "examples/supergirl.png",
-            "A fuzzy puppet superhero character resembling a female puppet with blonde hair and a blue superhero suit stands inside an icy cave made of frozen walls and icicles, she looks panicked and frantic, rapidly turning her head left and right and scanning the cave while waving her arms and shouting angrily and desperately, mouthing the words “where the hell is my dog,” her movements exaggerated and puppet-like with high energy and urgency, suddenly a second puppet dog bursts into frame from the side, jumping up excitedly and tackling her affectionately while licking her face repeatedly, she freezes in surprise and then breaks into relief and laughter as the dog continues licking her, the scene feels chaotic, comedic, and emotional with expressive puppet reactions, cinematic lighting, smooth camera motion, shallow depth of field, and high-quality puppet-style animation",
-            "No LoRA",
-            "16:9",
-            "تبدیل تصویر به ویدیو",
-            None,
-            None,
-            None,
-        ],
-        [
-            "examples/highland.png",
-            "Realistic POV selfie-style video in a snowy, foggy field. Two shaggy Highland cows with long curved horns stand ahead. The camera is handheld and slightly shaky. The woman filming talks nervously and excitedly in a vlog tone: \"Oh my god guys… look how big those horns are… I’m kinda scared.\" The cow on the left walks toward the camera in a cute, bouncy, hopping way, curious and gentle. Snow crunches under its hooves, breath visible in the cold air. The horns look massive from the POV. As the cow gets very close, its wet nose with slight dripping fills part of the frame. She laughs nervously but reaches out and pets the cow. The cow makes deep, soft, interesting mooing and snorting sounds, calm and friendly. Ultra-realistic, natural lighting, immersive audio, documentary-style realism.",
-            "No LoRA",
-            "16:9",
-            "تبدیل تصویر به ویدیو",
-            None,
-            None,
-            None,
-        ],
-        [
-            "examples/wednesday.png",
-            "A cinematic dolly out of Wednesday Addams frozen mid-dance on a dark, blue-lit ballroom floor as students move indistinctly behind her, their footsteps and muffled music reduced to a distant, underwater thrum; the audio foregrounds her steady breathing and the faint rustle of fabric as she slowly raises one arm, never breaking eye contact with the camera, then after a deliberately long silence she speaks in a flat, dry, perfectly controlled voice, “I don’t dance… I vibe code,” each word crisp and unemotional, followed by an abrupt cutoff of her voice as the background sound swells slightly, reinforcing the deadpan humor, with precise lip sync, minimal facial movement, stark gothic lighting, and cinematic realism.",
-             "Zoom Out",
-            "16:9",
-            "تبدیل تصویر به ویدیو",
-            None,
-            None,
-            None,
-        ],
-        [
-            "examples/astronaut.png",
-            "An astronaut hatches from a fragile egg on the surface of the Moon, the shell cracking and peeling apart in gentle low-gravity motion. Fine lunar dust lifts and drifts outward with each movement, floating in slow arcs before settling back onto the ground. The astronaut pushes free in a deliberate, weightless motion, small fragments of the egg tumbling and spinning through the air. In the background, the deep darkness of space subtly shifts as stars glide with the camera's movement, emphasizing vast depth and scale. The camera performs a smooth, cinematic slow push-in, with natural parallax between the foreground dust, the astronaut, and the distant starfield. Ultra-realistic detail, physically accurate low-gravity motion, cinematic lighting, and a breath-taking, movie-like shot.",
-            "Static",
-            "1:1",
-            "تبدیل تصویر به ویدیو",
-            None,
-            None,
-            None,
-        ],
     ]
-    examples_obj = create_examples(
-        examples=examples_list,
-        fn=generate_video_example,
-        inputs=[first_frame, prompt_ui, camera_ui, resolution_ui, radioanimated_mode, input_video, audio_input, end_frame],
-        outputs = [output_video],
-        label="نمونه‌ها",
-        cache_examples=True,
-        visible=False
-    )
     preset_gallery = PresetGallery(
         items=[
             {"thumb": "examples/supergirl-2.png", "label": "تصویر و صدا به ویدیو"},
@@ -2843,35 +2576,13 @@ with gr.Blocks(title="LTX-2 Video Distilled 🎥🔈") as demo:
         title="برای شروع روی یکی از نمونه‌ها کلیک کنید",
     )
-    def on_audio_ui_change(v):
-        # Our JS sends "__CLEAR__" when the user presses the X
-        if v == "__CLEAR__" or v is None or v == "":
-            return None
-        # For normal events (uploads), do nothing (keep whatever gr.File already has)
-        return gr.update()
-    audio_ui.change(
-        fn=on_audio_ui_change,
-        inputs=audio_ui,
-        outputs=audio_input,
-        api_visibility="private",
-    )
     preset_gallery.change(
         fn=apply_example,
         inputs=preset_gallery,
         outputs=[
-            first_frame,
-            prompt_ui,
-            camera_ui,
-            resolution_ui,
-            radioanimated_mode,
-            input_video,
-            audio_input,
-            audio_ui,
-            end_frame,
-            output_video, # Clears the output video
-            download_btn  # Hides the download button
         ],
         api_visibility="private",
     )

 ####################################################################################################
+### PART 20: Gradio UI Layout & Launch (REVISED & FIXED)
 ####################################################################################################
 # JS Function to handle download request via PostMessage
         alert("لطفاً ابتدا ویدیو را تولید کنید.");
         return;
     }
+    let fileUrl = typeof video === 'string' ? video : (video && (video.url || video.path));
     if (fileUrl && !fileUrl.startsWith('http')) {
         let cleanPath = fileUrl.startsWith('/') ? fileUrl.substring(1) : fileUrl;
+        fileUrl = window.location.origin + (cleanPath.startsWith('file=') ? "/" + cleanPath : "/file=" + cleanPath);
     }
     if (fileUrl) {
         console.log("Sending download request for:", fileUrl);
         window.parent.postMessage({ type: 'DOWNLOAD_REQUEST', url: fileUrl }, '*');
 }
 """
+# This JavaScript function is solely responsible for calling the prompt-enhancer API.
+# It receives its inputs from Python and returns its output (the enhanced prompt) to Python.
+js_enhancer_api_call = """
 async (firstFrame, promptText, mode) => {
+    // اگر حالت انتخابی نیازی به بهینه سازی ندارد، پرامپت اصلی را برگردان
     if (mode !== 'تبدیل تصویر به ویدیو' && mode !== 'تکمیل فریم‌های میانی') {
+        return promptText;
     }
     // API بهینه ساز به تصویر نیاز دارد
     if (!firstFrame) {
+        // چون این مرحله در میانه راه است، به کاربر اطلاع داده و با پرامپت اصلی ادامه می دهیم
+        console.warn("Enhancement skipped: First frame image is required.");
+        return promptText;
     }
     try {
         const response = await fetch(firstFrame.url);
         const imageBlob = await response.blob();
         const formData = new FormData();
         const imageFile = new File([imageBlob], "image.jpg", { type: "image/jpeg" });
         formData.append('image', imageFile);
         formData.append('prompt', promptText);
         formData.append('is_extension', 'false');
         const apiResponse = await fetch('https://ezmarynoori-vidtolani.hf.space/api/enhance-animation-prompt', {
             method: 'POST',
             body: formData
         });
         if (!apiResponse.ok) {
+            const errorData = await apiResponse.json();
+            throw new Error(errorData.error || 'خطای ناشناخته از سرور بهینه ساز.');
         }
+        const data = await apiResponse.json();
+        console.log("Enhanced Prompt received:", data.animation_prompt);
+        // پرامپت بهینه شده را برای مرحله بعد در گرادیو برگردان
+        return data.animation_prompt;
     } catch (error) {
+        console.error("Enhancement API Error:", error);
+        // در صورت خطا، پرامپت اصلی را برگردان تا فرآیند ساخت ویدیو متوقف نشود
+        return promptText;
     }
 }
 """
 def apply_example(idx: str):
     idx = int(idx)
     img, prompt_txt, cam, res, mode, vid, aud, end_img = examples_list[idx]
     return (
+        img or None,
+        prompt_txt,
+        cam,
+        res,
+        mode,
+        gr.update(value=vid or None, visible=(mode == "Motion Control")),
+        aud or None,
+        aud or None,
+        end_img or None,
+        gr.update(value=None),
+        gr.update(visible=False)
     )
 with gr.Blocks(title="LTX-2 Video Distilled 🎥🔈") as demo:
     gr.HTML(
         """
         <div style="text-align: center; padding: 20px;">
         """
     )
+    # State components to pass data between Python and JS.
+    # These components are not visible to the user.
+    enhanced_prompt_state = gr.State("")
     with gr.Column(elem_id="col-container"):
         with gr.Row(elem_id="mode-row"):
             radioanimated_mode = RadioAnimated(
                 choices=["تبدیل تصویر به ویدیو", "تکمیل فریم‌های میانی"],
                 value="تبدیل تصویر به ویدیو",
             )
         with gr.Row():
             with gr.Column(elem_id="step-column"):
                 with gr.Row():
                     first_frame = gr.Image(
                         label="تصویر اول (برای بهینه‌سازی پرامپت الزامی است)",
                         type="filepath",
                         height=256
                     )
                     end_frame = gr.Image(
                         label="تصویر آخر (اختیاری)",
                         type="filepath",
                         height=256,
                         visible=False,
                     )
+                    input_video = gr.Video(label="Motion Reference Video", height=256, visible=False)
+                relocate = gr.HTML(value="", html_template="<div></div>", js_on_load=r"""
                 (() => {
                   function moveIntoFooter() {
+                    const promptRoot = document.querySelector("#prompt_ui"); if (!promptRoot) return false;
+                    const footer = promptRoot.querySelector(".ds-footer"); if (!footer) return false;
                     const dur = document.querySelector("#duration_ui .cd-wrap");
                     const res = document.querySelector("#resolution_ui .cd-wrap");
                     const cam = document.querySelector("#camera_ui .cd-wrap");
                     if (!dur || !res || !cam) return false;
+                    footer.appendChild(dur); footer.appendChild(res); footer.appendChild(cam);
                     return true;
                   }
+                  const tick = () => { if (!moveIntoFooter()) requestAnimationFrame(tick); };
                   requestAnimationFrame(tick);
                 })();
+                """)
+                prompt_ui = PromptBox(value="این تصویر را با حرکت سینمایی و انیمیشن روان زنده کن", elem_id="prompt_ui")
+                audio_input = gr.File(label="Audio (Optional)", file_types=["audio"], type="filepath", elem_id="audio_input_hidden")
+                audio_ui = AudioDropUpload(target_audio_elem_id="audio_input_hidden", elem_id="audio_ui")
+                prompt = gr.Textbox(label="Prompt", value="این تصویر را با حرکت سینمایی و انیمیشن روان زنده کن", lines=3, max_lines=3, placeholder="حرکت و انیمیشن مورد نظر خود را توصیف کنید...", visible=False)
+                enhance_prompt = gr.Checkbox(label="Enhance Prompt", value=True, visible=False)
                 with gr.Accordion("تنظیمات پیشرفته", open=False, visible=False):
+                    seed = gr.Slider(label="سید (Seed)", minimum=0, maximum=MAX_SEED, value=DEFAULT_SEED, step=1)
                     randomize_seed = gr.Checkbox(label="استفاده از سید تصادفی", value=True)
             with gr.Column(elem_id="step-column"):
                 output_video = gr.Video(label="ویدیوی ساخته شده", autoplay=True, height=512)
                 with gr.Row():
+                    download_btn = gr.Button("📥 دانلود ویدیو", variant="secondary", size="sm", scale=0, visible=False)
                 with gr.Row(elem_id="controls-row"):
+                        duration_ui = CameraDropdown(choices=["3s", "5s", "10s"], value="5s", title="مدت زمان ویدیو", elem_id="duration_ui")
+                        duration = gr.Slider(label="Duration (seconds)", minimum=1.0, maximum=10.0, value=5.0, step=0.1, visible=False)
+                        ICON_16_9 = """<svg viewBox="0 0 24 24" fill="none" aria-hidden="true"><rect x="3" y="7" width="18" height="10" rx="2" stroke="currentColor" stroke-width="2"/></svg>"""
+                        ICON_1_1 = """<svg viewBox="0 0 24 24" fill="none" aria-hidden="true"><rect x="6" y="6" width="12" height="12" rx="2" stroke="currentColor" stroke-width="2"/></svg>"""
+                        ICON_9_16 = """<svg viewBox="0 0 24 24" fill="none" aria-hidden="true"><rect x="7" y="3" width="10" height="18" rx="2" stroke="currentColor" stroke-width="2"/></svg>"""
                         resolution_ui = CameraDropdown(
+                            choices=[{"label": "16:9", "value": "16:9", "icon": ICON_16_9}, {"label": "1:1",  "value": "1:1",  "icon": ICON_1_1}, {"label": "9:16", "value": "9:16", "icon": ICON_9_16}],
+                            value="16:9", title="ابعاد تصویر", elem_id="resolution_ui"
                         )
                         width = gr.Number(label="Width", value=DEFAULT_1_STAGE_WIDTH, precision=0, visible=False)
                         height = gr.Number(label="Height", value=DEFAULT_1_STAGE_HEIGHT, precision=0, visible=False)
+                        camera_ui = CameraDropdown(choices=[name for name, _ in VISIBLE_RUNTIME_LORA_CHOICES], value="No LoRA", title="افکت دوربین (LoRA)", elem_id="camera_ui")
+                        camera_lora = gr.Dropdown(label="Camera Control LoRA", choices=[name for name, _ in VISIBLE_RUNTIME_LORA_CHOICES], value="No LoRA", visible=False)
+                generate_btn = gr.Button("🤩 ساخت ویدیو", variant="primary", elem_classes="button-gradient")
+    # Helper functions for updating the UI
+    def lock_ui():
+        return gr.Button(value="⏳ در حال بهینه سازی پرامپت...", interactive=False)
+    def re_enable_ui():
+        return gr.Button(value="🤩 ساخت ویدیو", interactive=True)
+    # Event wiring
+    camera_ui.change(fn=lambda x: x, inputs=camera_ui, outputs=camera_lora, api_visibility="private")
+    radioanimated_mode.change(fn=on_mode_change, inputs=radioanimated_mode, outputs=[input_video, end_frame], api_visibility="private")
+    duration_ui.change(fn=apply_duration, inputs=duration_ui, outputs=[duration], api_visibility="private")
+    resolution_ui.change(fn=apply_resolution, inputs=resolution_ui, outputs=[width, height], api_visibility="private")
+    prompt_ui.change(fn=lambda x: x, inputs=prompt_ui, outputs=prompt, api_visibility="private")
+    audio_ui.change(fn=lambda v: None if v == "__CLEAR__" or not v else gr.update(), inputs=audio_ui, outputs=audio_input, api_visibility="private")
+    download_btn.click(fn=None, inputs=[output_video], js=js_download_video)
+    # --- Main video-generation event chain ---
+    # 1. When the user clicks the button, first lock the UI and change the button text.
+    # This Python function does nothing except prepare the UI.
+    generate_btn.click(
+        fn=lock_ui,
+        outputs=[generate_btn]
+    ) \
+    .then(
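+        # 2. Next, call the JavaScript function that enhances the prompt.
+        # Its inputs come from Gradio components and its output is stored in a State.
+        # NOTE(review): gr.State is normally held server-side — confirm a JS-only step (fn=None) can actually write to it.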
+        fn=None,
+        inputs=[first_frame, prompt, radioanimated_mode],
+        outputs=[enhanced_prompt_state],
+        js=js_enhancer_api_call
+    ) \
+    .then(
+        # 3. Now run the main video-generation function with the enhanced prompt (read from the State).
         fn=generate_video,
         inputs=[
+            first_frame, end_frame, enhanced_prompt_state, duration, input_video,
+            radioanimated_mode, enhance_prompt, seed, randomize_seed,
+            height, width, camera_lora, audio_input
         ],
         outputs=[output_video]
+    ) \
+    .then(
+        # 4. After video generation finishes, show the download button.
+        fn=lambda: gr.update(visible=True),
         outputs=[download_btn]
+    ) \
+    .then(
+        # 5. Finally, re-enable the UI.
+        fn=re_enable_ui,
+        outputs=[generate_btn]
     )
+    # Examples logic
     examples_list = [
+        ["examples/supergirl-2.png", "A fuzzy puppet superhero...", "Static", "16:9", "تبدیل تصویر به ویدیو", None, "examples/supergirl.m4a", None],
+        ["examples/frame3.png", "a woman in a white dress...", "Zoom In", "16:9", "تکمیل فریم‌های میانی", None, None, "examples/frame4.png"],
+        ["examples/supergirl.png", "A fuzzy puppet superhero character...", "No LoRA", "16:9", "تبدیل تصویر به ویدیو", None, None, None],
+        ["examples/highland.png", "Realistic POV selfie-style video...", "No LoRA", "16:9", "تبدیل تصویر به ویدیو", None, None, None],
+        ["examples/wednesday.png", "A cinematic dolly out of Wednesday Addams...", "Zoom Out", "16:9", "تبدیل تصویر به ویدیو", None, None, None],
+        ["examples/astronaut.png", "An astronaut hatches from a fragile egg...", "Static", "1:1", "تبدیل تصویر به ویدیو", None, None, None],
     ]
     preset_gallery = PresetGallery(
         items=[
             {"thumb": "examples/supergirl-2.png", "label": "تصویر و صدا به ویدیو"},
         title="برای شروع روی یکی از نمونه‌ها کلیک کنید",
     )
     preset_gallery.change(
         fn=apply_example,
         inputs=preset_gallery,
         outputs=[
+            first_frame, prompt_ui, camera_ui, resolution_ui, radioanimated_mode,
+            input_video, audio_input, audio_ui, end_frame,
+            output_video, download_btn
         ],
         api_visibility="private",
     )