Spaces:
Build error
Build error
积极的屁孩 committed on
Commit ·
fbb3473
1
Parent(s): b4485a3
adjustments
Browse files
app.py
CHANGED
|
@@ -628,24 +628,34 @@ def vevo_tts(text, ref_wav, timbre_ref_wav=None, src_language="en", ref_language
|
|
| 628 |
# 创建Gradio界面
|
| 629 |
with gr.Blocks(title="VEVO DEMO") as demo:
|
| 630 |
gr.Markdown("# VEVO DEMO")
|
| 631 |
-
gr.Markdown("## Controllable Zero-Shot Voice Conversion and Style Transfer")
|
| 632 |
|
| 633 |
with gr.Tab("Vevo-Timbre"):
|
| 634 |
gr.Markdown("### Vevo-Timbre: Maintain style but transfer timbre")
|
| 635 |
with gr.Row():
|
| 636 |
with gr.Column():
|
| 637 |
-
timbre_content = gr.Audio(label="Content Audio", type="numpy")
|
| 638 |
timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
| 639 |
timbre_button = gr.Button("Generate")
|
| 640 |
with gr.Column():
|
| 641 |
timbre_output = gr.Audio(label="Result")
|
| 642 |
timbre_button.click(vevo_timbre, inputs=[timbre_content, timbre_reference], outputs=timbre_output)
|
| 643 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 644 |
with gr.Tab("Vevo-Voice"):
|
| 645 |
gr.Markdown("### Vevo-Voice: Transfers both style and timbre with separate references")
|
| 646 |
with gr.Row():
|
| 647 |
with gr.Column():
|
| 648 |
-
voice_content = gr.Audio(label="Content Audio", type="numpy")
|
| 649 |
voice_style_reference = gr.Audio(label="Style Reference", type="numpy")
|
| 650 |
voice_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
| 651 |
voice_button = gr.Button("Generate")
|
|
@@ -653,16 +663,7 @@ with gr.Blocks(title="VEVO DEMO") as demo:
|
|
| 653 |
voice_output = gr.Audio(label="Result")
|
| 654 |
voice_button.click(vevo_voice, inputs=[voice_content, voice_style_reference, voice_timbre_reference], outputs=voice_output)
|
| 655 |
|
| 656 |
-
|
| 657 |
-
gr.Markdown("### Vevo-Style: Maintain timbre but transfer style (accent, emotion, etc.)")
|
| 658 |
-
with gr.Row():
|
| 659 |
-
with gr.Column():
|
| 660 |
-
style_content = gr.Audio(label="Content Audio", type="numpy")
|
| 661 |
-
style_reference = gr.Audio(label="Style Reference", type="numpy")
|
| 662 |
-
style_button = gr.Button("Generate")
|
| 663 |
-
with gr.Column():
|
| 664 |
-
style_output = gr.Audio(label="Result")
|
| 665 |
-
style_button.click(vevo_style, inputs=[style_content, style_reference], outputs=style_output)
|
| 666 |
|
| 667 |
with gr.Tab("Vevo-TTS"):
|
| 668 |
gr.Markdown("### Vevo-TTS: Text-to-speech with separate style and timbre references")
|
|
|
|
| 628 |
# 创建Gradio界面
|
| 629 |
with gr.Blocks(title="VEVO DEMO") as demo:
|
| 630 |
gr.Markdown("# VEVO DEMO")
|
|
|
|
| 631 |
|
| 632 |
with gr.Tab("Vevo-Timbre"):
|
| 633 |
gr.Markdown("### Vevo-Timbre: Maintain style but transfer timbre")
|
| 634 |
with gr.Row():
|
| 635 |
with gr.Column():
|
| 636 |
+
timbre_content = gr.Audio(label="Source Audio", type="numpy")
|
| 637 |
timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
| 638 |
timbre_button = gr.Button("Generate")
|
| 639 |
with gr.Column():
|
| 640 |
timbre_output = gr.Audio(label="Result")
|
| 641 |
timbre_button.click(vevo_timbre, inputs=[timbre_content, timbre_reference], outputs=timbre_output)
|
| 642 |
+
|
| 643 |
+
with gr.Tab("Vevo-Style"):
|
| 644 |
+
gr.Markdown("### Vevo-Style: Maintain timbre but transfer style (accent, emotion, etc.)")
|
| 645 |
+
with gr.Row():
|
| 646 |
+
with gr.Column():
|
| 647 |
+
style_content = gr.Audio(label="Source Audio", type="numpy")
|
| 648 |
+
style_reference = gr.Audio(label="Style Reference", type="numpy")
|
| 649 |
+
style_button = gr.Button("Generate")
|
| 650 |
+
with gr.Column():
|
| 651 |
+
style_output = gr.Audio(label="Result")
|
| 652 |
+
style_button.click(vevo_style, inputs=[style_content, style_reference], outputs=style_output)
|
| 653 |
+
|
| 654 |
with gr.Tab("Vevo-Voice"):
|
| 655 |
gr.Markdown("### Vevo-Voice: Transfers both style and timbre with separate references")
|
| 656 |
with gr.Row():
|
| 657 |
with gr.Column():
|
| 658 |
+
voice_content = gr.Audio(label="Source Audio", type="numpy")
|
| 659 |
voice_style_reference = gr.Audio(label="Style Reference", type="numpy")
|
| 660 |
voice_timbre_reference = gr.Audio(label="Timbre Reference", type="numpy")
|
| 661 |
voice_button = gr.Button("Generate")
|
|
|
|
| 663 |
voice_output = gr.Audio(label="Result")
|
| 664 |
voice_button.click(vevo_voice, inputs=[voice_content, voice_style_reference, voice_timbre_reference], outputs=voice_output)
|
| 665 |
|
| 666 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 667 |
|
| 668 |
with gr.Tab("Vevo-TTS"):
|
| 669 |
gr.Markdown("### Vevo-TTS: Text-to-speech with separate style and timbre references")
|