Update Modules/Generate_Speech.py
Browse files
Modules/Generate_Speech.py
CHANGED
|
@@ -651,18 +651,18 @@ def build_interface() -> gr.Interface:
|
|
| 651 |
return gr.Interface(
|
| 652 |
fn=Generate_Speech,
|
| 653 |
inputs=[
|
| 654 |
-
gr.Textbox(label="Text", placeholder="Type text to synthesize…", lines=4),
|
| 655 |
-
gr.Dropdown(label="Model", choices=["Supertonic", "Kokoro"], value="Supertonic"),
|
| 656 |
-
gr.Slider(minimum=0.5, maximum=2.0, value=1.3, step=0.1, label="Speed"),
|
| 657 |
-
gr.Slider(minimum=1, maximum=50, value=5, step=1, label="Steps", info="Supertonic only"),
|
| 658 |
gr.Dropdown(
|
| 659 |
label="Voice",
|
| 660 |
choices=all_voices,
|
| 661 |
value="F1",
|
| 662 |
info="Select voice (F1/F2/M1/M2 for Supertonic, others for Kokoro)",
|
| 663 |
),
|
| 664 |
-
gr.Slider(minimum=0.0, maximum=2.0, value=0.3, step=0.1, label="Silence Duration", info="Supertonic only"),
|
| 665 |
-
gr.Slider(minimum=50, maximum=1000, value=300, step=10, label="Max Chunk Size", info="Supertonic only"),
|
| 666 |
],
|
| 667 |
outputs=gr.Audio(label="Audio", type="filepath", format="wav"),
|
| 668 |
title="Generate Speech",
|
|
|
|
| 651 |
return gr.Interface(
|
| 652 |
fn=Generate_Speech,
|
| 653 |
inputs=[
|
| 654 |
+
gr.Textbox(label="Text", placeholder="Type text to synthesize…", lines=4, info="The text to synthesize (English)"),
|
| 655 |
+
gr.Dropdown(label="Model", choices=["Supertonic", "Kokoro"], value="Supertonic", info="The TTS model to use"),
|
| 656 |
+
gr.Slider(minimum=0.5, maximum=2.0, value=1.3, step=0.1, label="Speed", info="Speech speed multiplier (1.0 = normal)"),
|
| 657 |
+
gr.Slider(minimum=1, maximum=50, value=5, step=1, label="Steps", info="Supertonic only: Diffusion steps (1-50)"),
|
| 658 |
gr.Dropdown(
|
| 659 |
label="Voice",
|
| 660 |
choices=all_voices,
|
| 661 |
value="F1",
|
| 662 |
info="Select voice (F1/F2/M1/M2 for Supertonic, others for Kokoro)",
|
| 663 |
),
|
| 664 |
+
gr.Slider(minimum=0.0, maximum=2.0, value=0.3, step=0.1, label="Silence Duration", info="Supertonic only: Silence duration between chunks"),
|
| 665 |
+
gr.Slider(minimum=50, maximum=1000, value=300, step=10, label="Max Chunk Size", info="Supertonic only: Max text chunk length"),
|
| 666 |
],
|
| 667 |
outputs=gr.Audio(label="Audio", type="filepath", format="wav"),
|
| 668 |
title="Generate Speech",
|