Spaces:

backtracking
/

tiny-tts-demo

Running

App Files Community

backtracking committed on about 22 hours ago

Commit

a74b4e6

verified ·

1 Parent(s): 18a8b23

Upload app.py with huggingface_hub

Browse files

Files changed (1) hide show

app.py +30 -26

app.py CHANGED Viewed

@@ -4,65 +4,69 @@ from tiny_tts import TinyTTS
 # Download required NLTK data for g2p-en
 try:
-    nltk.download('averaged_perceptron_tagger_eng')
-    nltk.download('averaged_perceptron_tagger')
-    nltk.download('cmudict')
 except Exception as e:
     print(f"NLTK download warning: {e}")
-# Initialize the model (auto-downloads if needed)
 print("Initializing TinyTTS...")
 tts = TinyTTS()
 print("Model loaded successfully!")
-def synthesize_audio(text, speaker):
     output_path = "output.wav"
     try:
-        tts.speak(text, output_path=output_path, speaker=speaker)
         return output_path
     except Exception as e:
         return f"Error: {e}"
-# Define available speakers
-# Define available speakers
-available_speakers = list(tts.model.SPK2ID.keys()) if hasattr(tts.model, "SPK2ID") else ["female"]
 # Create Gradio interface
 with gr.Blocks(title="TinyTTS Demo", theme=gr.themes.Soft()) as app:
     gr.Markdown("# 🗣️ TinyTTS")
-    gr.Markdown("**Ultra-lightweight English Text-to-Speech (~9M parameters, ~20MB on disk)**")
-    gr.Markdown("This space runs on CPU efficiently and synthesizes high-quality audio faster than real-time.")
     with gr.Row():
         with gr.Column():
             text_input = gr.Textbox(
-                label="Input Text",
-                placeholder="Enter English text here...",
                 value="The weather is nice today, and I feel very relaxed.",
                 lines=4
             )
-            speaker_dropdown = gr.Dropdown(
-                choices=available_speakers,
-                value="female" if "female" in available_speakers else available_speakers[0],
-                label="Speaker"
             )
-            submit_btn = gr.Button("Synthesize Speech", variant="primary")
         with gr.Column():
             audio_output = gr.Audio(label="Output Audio", type="filepath")
     # Example prompts
     gr.Examples(
         examples=[
-            ["The weather is nice today, and I feel very relaxed.", "female"],
-            ["TinyTTS has only nine million parameters, making it extremely fast on CPUs.", "female"],
         ],
-        inputs=[text_input, speaker_dropdown],
     )
     submit_btn.click(
         fn=synthesize_audio,
-        inputs=[text_input, speaker_dropdown],
         outputs=audio_output
     )

 # Download required NLTK data for g2p-en
 try:
+    nltk.download('averaged_perceptron_tagger_eng', quiet=True)
+    nltk.download('averaged_perceptron_tagger', quiet=True)
+    nltk.download('cmudict', quiet=True)
 except Exception as e:
     print(f"NLTK download warning: {e}")
+# Initialize the model (auto-downloads from HF Hub if needed)
 print("Initializing TinyTTS...")
 tts = TinyTTS()
 print("Model loaded successfully!")
+def synthesize_audio(text, speed):
     output_path = "output.wav"
     try:
+        tts.speak(text, output_path=output_path, speaker="MALE", speed=speed)
         return output_path
     except Exception as e:
         return f"Error: {e}"
 # Create Gradio interface
 with gr.Blocks(title="TinyTTS Demo", theme=gr.themes.Soft()) as app:
     gr.Markdown("# 🗣️ TinyTTS")
+    gr.Markdown(
+        "**Ultra-lightweight English Text-to-Speech — only 1.6M parameters, ~3.4 MB ONNX**\n\n"
+        "Synthesizes high-quality 44.1kHz audio **~53× faster** than real-time on CPU."
+    )
     with gr.Row():
         with gr.Column():
             text_input = gr.Textbox(
+                label="Input Text",
+                placeholder="Enter English text here...",
                 value="The weather is nice today, and I feel very relaxed.",
                 lines=4
             )
+            speed_slider = gr.Slider(
+                minimum=0.5,
+                maximum=2.0,
+                value=1.0,
+                step=0.1,
+                label="Speed (1.0 = normal, >1 = faster, <1 = slower)"
             )
+            submit_btn = gr.Button("🔊 Synthesize Speech", variant="primary")
         with gr.Column():
             audio_output = gr.Audio(label="Output Audio", type="filepath")
     # Example prompts
     gr.Examples(
         examples=[
+            ["The weather is nice today, and I feel very relaxed.", 1.0],
+            ["TinyTTS has only one point six million parameters, making it extremely fast on CPUs.", 1.0],
+            ["This is a speed test. Speaking at one and a half times the normal rate.", 1.5],
+            ["Slow and steady wins the race. Let me speak more carefully.", 0.7],
         ],
+        inputs=[text_input, speed_slider],
     )
     submit_btn.click(
         fn=synthesize_audio,
+        inputs=[text_input, speed_slider],
         outputs=audio_output
     )