Spaces:

Nymbo
/

Tools

Running

Nymbo committed 16 days ago

Commit

9f7596f

verified ·

1 Parent(s): 379c8b8

Update Modules/Generate_Speech.py

Files changed (1) hide show

Modules/Generate_Speech.py CHANGED Viewed

@@ -507,9 +507,9 @@ def List_Supertonic_Voices() -> list[str]:
 # Single source of truth for the LLM-facing tool description
 TOOL_SUMMARY = (
-    "Synthesize speech from text using Supertonic (default) or Kokoro-82M. "
-    "Supertonic: high quality, slower, supports steps/silence/chunking. Default voice 'F1'. "
-    "Kokoro: faster, supports many languages/accents. Default voice 'af_heart'. "
     "Return the generated media to the user in this format `![Alt text](URL)`."
 )
@@ -648,7 +648,8 @@ def build_interface() -> gr.Blocks:
     supertonic_voices = get_supertonic_voices()
     with gr.Blocks(title="Generate Speech") as demo:
-        gr.Markdown("<div style=\"text-align:center\">Generate speech with Supertonic (default) or Kokoro-82M.</div>")
         with gr.Row():
             with gr.Column():
@@ -667,9 +668,9 @@ def build_interface() -> gr.Blocks:
                 # Supertonic specific
                 with gr.Group() as supertonic_params:
-                    steps_slider = gr.Slider(minimum=1, maximum=50, value=5, step=1, label="Steps (Supertonic only)")
-                    silence_slider = gr.Slider(minimum=0.0, maximum=2.0, value=0.3, step=0.1, label="Silence Duration (Supertonic only)")
-                    chunk_slider = gr.Slider(minimum=50, maximum=1000, value=300, step=10, label="Max Chunk Size (Supertonic only)")
                 with gr.Row():
                     clear_btn = gr.Button("Clear")

 # Single source of truth for the LLM-facing tool description
 TOOL_SUMMARY = (
+    "Synthesize speech from text using Supertonic-66M (default) or Kokoro-82M. "
+    "Supertonic: faster, supports steps/silence/chunking. Default voice 'F1'. "
+    "Kokoro: slower, supports many languages/accents. Default voice 'af_heart'. "
     "Return the generated media to the user in this format `![Alt text](URL)`."
 )
     supertonic_voices = get_supertonic_voices()
     with gr.Blocks(title="Generate Speech") as demo:
+        gr.Markdown("<h1 style='text-align: center; margin-bottom: 1rem'>Generate Speech</h1>")
+        gr.Markdown("<div style=\"text-align:center\">Generate speech with Supertonic-66M or Kokoro-82M. Runs on CPU.</div>")
         with gr.Row():
             with gr.Column():
                 # Supertonic specific
                 with gr.Group() as supertonic_params:
+                    steps_slider = gr.Slider(minimum=1, maximum=50, value=5, step=1, label="Steps", info="Supertonic only")
+                    silence_slider = gr.Slider(minimum=0.0, maximum=2.0, value=0.3, step=0.1, label="Silence Duration", info="Supertonic only")
+                    chunk_slider = gr.Slider(minimum=50, maximum=1000, value=300, step=10, label="Max Chunk Size", info="Supertonic only")
                 with gr.Row():
                     clear_btn = gr.Button("Clear")