Spaces:

lulavc
/

AnimaStudio

Running on Zero

App Files Community

lulavc committed on Mar 4

Commit

673f772

1 Parent(s): 34fc3ab

fix: force wav format on audio inputs to fix recording on Linux/webm browsers

Browse files

Files changed (1) hide show

app.py +4 -1

app.py CHANGED Viewed

@@ -447,6 +447,7 @@ with gr.Blocks(title="AnimaStudio 🎬") as demo:
                             voice_ref = gr.Audio(
                                 label="Voice Reference (optional — clone voice style)",
                                 type="filepath", sources=["upload", "microphone"],
                             )
                         emotion = gr.Slider(0.0, 1.0, value=0.5, step=0.05,
                                             label="Emotion Intensity", info="0 = neutral · 1 = very expressive")
@@ -454,6 +455,7 @@ with gr.Blocks(title="AnimaStudio 🎬") as demo:
                         audio_upload = gr.Audio(
                             label="Audio File · WAV/MP3/FLAC · max 30 s",
                             type="filepath", sources=["upload", "microphone"],
                         )
                     aspect_ratio = gr.Dropdown(choices=list(ASPECT_PRESETS.keys()),
                                                value="◻ 1:1  · 512×512", label="Format")
@@ -478,7 +480,8 @@ with gr.Blocks(title="AnimaStudio 🎬") as demo:
                                                sources=["upload"])
                     dub_target_lang = gr.Dropdown(choices=TTS_LANGUAGES, value="English", label="Target Language")
                     dub_voice_ref = gr.Audio(label="Voice Reference (optional — clone voice style)",
-                                             type="filepath", sources=["upload", "microphone"])
                     dub_emotion = gr.Slider(0.0, 1.0, value=0.5, step=0.05, label="Emotion Intensity")
                     dub_btn = gr.Button("🎙️  Dub Video", variant="primary", elem_id="dub-btn", size="lg")
                     gr.HTML("""

                             voice_ref = gr.Audio(
                                 label="Voice Reference (optional — clone voice style)",
                                 type="filepath", sources=["upload", "microphone"],
+                                format="wav",
                             )
                         emotion = gr.Slider(0.0, 1.0, value=0.5, step=0.05,
                                             label="Emotion Intensity", info="0 = neutral · 1 = very expressive")
                         audio_upload = gr.Audio(
                             label="Audio File · WAV/MP3/FLAC · max 30 s",
                             type="filepath", sources=["upload", "microphone"],
+                            format="wav",
                         )
                     aspect_ratio = gr.Dropdown(choices=list(ASPECT_PRESETS.keys()),
                                                value="◻ 1:1  · 512×512", label="Format")
                                                sources=["upload"])
                     dub_target_lang = gr.Dropdown(choices=TTS_LANGUAGES, value="English", label="Target Language")
                     dub_voice_ref = gr.Audio(label="Voice Reference (optional — clone voice style)",
+                                             type="filepath", sources=["upload", "microphone"],
+                                             format="wav")
                     dub_emotion = gr.Slider(0.0, 1.0, value=0.5, step=0.05, label="Emotion Intensity")
                     dub_btn = gr.Button("🎙️  Dub Video", variant="primary", elem_id="dub-btn", size="lg")
                     gr.HTML("""