Spaces:

lulavc
/

AnimaStudio

Running on Zero

App Files Community

lulavc committed on Mar 4

Commit

ca047eb

1 Parent(s): a628050

fix: Gradio 6.x compat — remove info= from Image/Audio/Video, show_download_button→buttons

Browse files

Files changed (1) hide show

app.py +12 -17

app.py CHANGED Viewed

@@ -357,13 +357,13 @@ def switch_language(lang: str):
     # 26 outputs — must match _lang_out list order below
     return (
         # Phase 1 (16)
-        gr.update(label=t["portrait_label"],   info=t["portrait_info"]),
         gr.update(label=t["input_mode_label"], choices=mode_choices, value="text"),
         gr.update(label=t["text_label"],        placeholder=t["text_ph"]),
         gr.update(label=t["tts_lang_label"]),
-        gr.update(label=t["voice_ref_label"],   info=t["voice_ref_info"]),
         gr.update(label=t["emotion_label"],     info=t["emotion_info"]),
-        gr.update(label=t["audio_label"],       info=t["audio_info"]),
         gr.update(label=t["aspect_label"]),
         gr.update(label=t["advanced"]),
         gr.update(label=t["steps_label"],       info=t["steps_info"]),
@@ -374,9 +374,9 @@ def switch_language(lang: str):
         gr.update(visible=False),   # audio_group
         gr.update(label=t["output_label"]),
         # Phase 2 (10)
-        gr.update(label=t["dub_video_label"],   info=t["dub_video_info"]),
         gr.update(label=t["dub_target_label"]),
-        gr.update(label=t["dub_voice_label"],   info=t["dub_voice_info"]),
         gr.update(label=t["dub_emotion_label"]),
         gr.update(value=t["dub_btn"]),
         gr.update(label=t["dub_output_label"]),
@@ -426,8 +426,7 @@ with gr.Blocks(title="AnimaStudio 🎬") as demo:
             with gr.Row(equal_height=False):
                 with gr.Column(scale=1, min_width=360):
                     portrait = gr.Image(
-                        label="Portrait Photo",
-                        info="Upload a clear, front-facing face photo",
                         type="pil",
                         sources=["upload", "webcam"],
                     )
@@ -446,16 +445,14 @@ with gr.Blocks(title="AnimaStudio 🎬") as demo:
                         tts_language = gr.Dropdown(choices=TTS_LANGUAGES, value="English", label="Speech Language")
                         with gr.Row():
                             voice_ref = gr.Audio(
-                                label="Voice Reference",
-                                info="Optional: upload audio to clone the voice style",
                                 type="filepath", sources=["upload"],
                             )
                         emotion = gr.Slider(0.0, 1.0, value=0.5, step=0.05,
                                             label="Emotion Intensity", info="0 = neutral · 1 = very expressive")
                     with gr.Group(visible=False) as audio_group:
                         audio_upload = gr.Audio(
-                            label="Audio File",
-                            info="Upload WAV, MP3, or FLAC · max 30 seconds",
                             type="filepath", sources=["upload", "microphone"],
                         )
                     aspect_ratio = gr.Dropdown(choices=list(ASPECT_PRESETS.keys()),
@@ -471,18 +468,16 @@ with gr.Blocks(title="AnimaStudio 🎬") as demo:
                 with gr.Column(scale=1, min_width=440):
                     output_video = gr.Video(label="Generated Video", format="mp4", autoplay=True,
-                                            height=640, elem_id="output-video", show_download_button=True)
         # ══ Tab 2: Dub Video ═══════════════════════════════════════════════════
         with gr.Tab("🎙️ Dub Video", id="tab-dub"):
             with gr.Row(equal_height=False):
                 with gr.Column(scale=1, min_width=360):
-                    dub_video_input = gr.Video(label="Input Video",
-                                               info="Upload a video to dub (max 60 seconds)",
                                                sources=["upload"])
                     dub_target_lang = gr.Dropdown(choices=TTS_LANGUAGES, value="English", label="Target Language")
-                    dub_voice_ref = gr.Audio(label="Voice Reference",
-                                             info="Optional: upload audio to clone voice style for dubbing",
                                              type="filepath", sources=["upload"])
                     dub_emotion = gr.Slider(0.0, 1.0, value=0.5, step=0.05, label="Emotion Intensity")
                     dub_btn = gr.Button("🎙️  Dub Video", variant="primary", elem_id="dub-btn", size="lg")
@@ -497,7 +492,7 @@ with gr.Blocks(title="AnimaStudio 🎬") as demo:
                 with gr.Column(scale=1, min_width=440):
                     dub_output_video = gr.Video(label="Dubbed Video", format="mp4", autoplay=True,
-                                                height=480, elem_id="dub-output-video", show_download_button=True)
                     with gr.Accordion("Details", open=False) as dub_details_acc:
                         dub_transcript_box = gr.Textbox(label="Detected Transcript", interactive=False, lines=4)
                         dub_translation_box = gr.Textbox(label="Translation", interactive=False, lines=4)

     # 26 outputs — must match _lang_out list order below
     return (
         # Phase 1 (16)
+        gr.update(label=t["portrait_label"]),
         gr.update(label=t["input_mode_label"], choices=mode_choices, value="text"),
         gr.update(label=t["text_label"],        placeholder=t["text_ph"]),
         gr.update(label=t["tts_lang_label"]),
+        gr.update(label=t["voice_ref_label"]),
         gr.update(label=t["emotion_label"],     info=t["emotion_info"]),
+        gr.update(label=t["audio_label"]),
         gr.update(label=t["aspect_label"]),
         gr.update(label=t["advanced"]),
         gr.update(label=t["steps_label"],       info=t["steps_info"]),
         gr.update(visible=False),   # audio_group
         gr.update(label=t["output_label"]),
         # Phase 2 (10)
+        gr.update(label=t["dub_video_label"]),
         gr.update(label=t["dub_target_label"]),
+        gr.update(label=t["dub_voice_label"]),
         gr.update(label=t["dub_emotion_label"]),
         gr.update(value=t["dub_btn"]),
         gr.update(label=t["dub_output_label"]),
             with gr.Row(equal_height=False):
                 with gr.Column(scale=1, min_width=360):
                     portrait = gr.Image(
+                        label="Portrait Photo · front-facing face",
                         type="pil",
                         sources=["upload", "webcam"],
                     )
                         tts_language = gr.Dropdown(choices=TTS_LANGUAGES, value="English", label="Speech Language")
                         with gr.Row():
                             voice_ref = gr.Audio(
+                                label="Voice Reference (optional — clone voice style)",
                                 type="filepath", sources=["upload"],
                             )
                         emotion = gr.Slider(0.0, 1.0, value=0.5, step=0.05,
                                             label="Emotion Intensity", info="0 = neutral · 1 = very expressive")
                     with gr.Group(visible=False) as audio_group:
                         audio_upload = gr.Audio(
+                            label="Audio File · WAV/MP3/FLAC · max 30 s",
                             type="filepath", sources=["upload", "microphone"],
                         )
                     aspect_ratio = gr.Dropdown(choices=list(ASPECT_PRESETS.keys()),
                 with gr.Column(scale=1, min_width=440):
                     output_video = gr.Video(label="Generated Video", format="mp4", autoplay=True,
+                                            height=640, elem_id="output-video", buttons=["download"])
         # ══ Tab 2: Dub Video ═══════════════════════════════════════════════════
         with gr.Tab("🎙️ Dub Video", id="tab-dub"):
             with gr.Row(equal_height=False):
                 with gr.Column(scale=1, min_width=360):
+                    dub_video_input = gr.Video(label="Input Video · max 60 seconds",
                                                sources=["upload"])
                     dub_target_lang = gr.Dropdown(choices=TTS_LANGUAGES, value="English", label="Target Language")
+                    dub_voice_ref = gr.Audio(label="Voice Reference (optional — clone voice style)",
                                              type="filepath", sources=["upload"])
                     dub_emotion = gr.Slider(0.0, 1.0, value=0.5, step=0.05, label="Emotion Intensity")
                     dub_btn = gr.Button("🎙️  Dub Video", variant="primary", elem_id="dub-btn", size="lg")
                 with gr.Column(scale=1, min_width=440):
                     dub_output_video = gr.Video(label="Dubbed Video", format="mp4", autoplay=True,
+                                                height=480, elem_id="dub-output-video", buttons=["download"])
                     with gr.Accordion("Details", open=False) as dub_details_acc:
                         dub_transcript_box = gr.Textbox(label="Detected Transcript", interactive=False, lines=4)
                         dub_translation_box = gr.Textbox(label="Translation", interactive=False, lines=4)