Nymbo committed on
Commit
36c9a15
·
verified ·
1 Parent(s): 3d1f292

Update Modules/Generate_Speech.py

Browse files
Files changed (1) hide show
  1. Modules/Generate_Speech.py +6 -6
Modules/Generate_Speech.py CHANGED
@@ -651,18 +651,18 @@ def build_interface() -> gr.Interface:
651
  return gr.Interface(
652
  fn=Generate_Speech,
653
  inputs=[
654
- gr.Textbox(label="Text", placeholder="Type text to synthesize…", lines=4),
655
- gr.Dropdown(label="Model", choices=["Supertonic", "Kokoro"], value="Supertonic"),
656
- gr.Slider(minimum=0.5, maximum=2.0, value=1.3, step=0.1, label="Speed"),
657
- gr.Slider(minimum=1, maximum=50, value=5, step=1, label="Steps", info="Supertonic only"),
658
  gr.Dropdown(
659
  label="Voice",
660
  choices=all_voices,
661
  value="F1",
662
  info="Select voice (F1/F2/M1/M2 for Supertonic, others for Kokoro)",
663
  ),
664
- gr.Slider(minimum=0.0, maximum=2.0, value=0.3, step=0.1, label="Silence Duration", info="Supertonic only"),
665
- gr.Slider(minimum=50, maximum=1000, value=300, step=10, label="Max Chunk Size", info="Supertonic only"),
666
  ],
667
  outputs=gr.Audio(label="Audio", type="filepath", format="wav"),
668
  title="Generate Speech",
 
651
  return gr.Interface(
652
  fn=Generate_Speech,
653
  inputs=[
654
+ gr.Textbox(label="Text", placeholder="Type text to synthesize…", lines=4, info="The text to synthesize (English)"),
655
+ gr.Dropdown(label="Model", choices=["Supertonic", "Kokoro"], value="Supertonic", info="The TTS model to use"),
656
+ gr.Slider(minimum=0.5, maximum=2.0, value=1.3, step=0.1, label="Speed", info="Speech speed multiplier (1.0 = normal)"),
657
+ gr.Slider(minimum=1, maximum=50, value=5, step=1, label="Steps", info="Supertonic only: Diffusion steps (1-50)"),
658
  gr.Dropdown(
659
  label="Voice",
660
  choices=all_voices,
661
  value="F1",
662
  info="Select voice (F1/F2/M1/M2 for Supertonic, others for Kokoro)",
663
  ),
664
+ gr.Slider(minimum=0.0, maximum=2.0, value=0.3, step=0.1, label="Silence Duration", info="Supertonic only: Silence duration between chunks"),
665
+ gr.Slider(minimum=50, maximum=1000, value=300, step=10, label="Max Chunk Size", info="Supertonic only: Max text chunk length"),
666
  ],
667
  outputs=gr.Audio(label="Audio", type="filepath", format="wav"),
668
  title="Generate Speech",