Spaces:

DhanuakaDev
/

Sin-Tts-v01

Runtime error

DhanuakaDev committed on Nov 27, 2025

Commit

ceb6264

1 Parent(s): 63ef4fe

changed3 app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,36 +1,38 @@
 import json
-import os
 import numpy as np
 import gradio as gr
-from TTS.utils.synthesizer import Synthesizer
 # ---------- Paths ----------
-MODEL_PATH = "checkpoint_80000.pth"   # or "best_model_23206.pth"
 CONFIG_PATH = "config.json"
-# ---------- Load config to get sample rate ----------
-with open(CONFIG_PATH, "r", encoding="utf-8") as f:
-    cfg = json.load(f)
-SAMPLE_RATE = cfg.get("audio", {}).get("sample_rate", 24000)
-# ---------- Load Coqui TTS Synthesizer ----------
-synthesizer = Synthesizer(
-    tts_checkpoint=MODEL_PATH,
-    tts_config_path=CONFIG_PATH,
-    use_cuda=False,   # Set True only if you enable GPU in the Space
 )
 # ---------- Inference function ----------
 def tts_generate(text: str):
-    if not text.strip():
         return None
-    # Whatever Coqui returns (list, numpy array, etc.)
-    wav = synthesizer.tts(text)
-    # Convert to a 1D numpy array for Gradio
     wav = np.asarray(wav, dtype="float32").flatten()
     # Gradio Audio(type="numpy") expects (sample_rate, np.ndarray)
@@ -41,15 +43,15 @@ demo = gr.Interface(
     fn=tts_generate,
     inputs=gr.Textbox(
         label="Input text",
-        placeholder="Type Sinhala text here…(use Sinhala script, max 120 characters)",
         lines=3,
     ),
     outputs=gr.Audio(
         label="Generated speech",
         type="numpy",
     ),
-    title="Sinhala TTS",
-    description="Sinhala TTS model- Research-stage model",
 )
 if __name__ == "__main__":

 import json
+from pathlib import Path
 import numpy as np
 import gradio as gr
+from TTS.api import TTS
 # ---------- Paths ----------
+MODEL_PATH = "checkpoint_80000.pth"     # or checkpoint_70000.pth if that's the good one
 CONFIG_PATH = "config.json"
+run_dir = Path(".")
+# ---------- Load model ----------
+# In Spaces we will force CPU (gpu=False)
+tts = TTS(
+    model_path=str(run_dir / MODEL_PATH),
+    config_path=str(run_dir / CONFIG_PATH),
+    progress_bar=False,
+    gpu=False,
 )
+# Sample rate from the loaded synthesizer
+SAMPLE_RATE = tts.synthesizer.output_sample_rate
 # ---------- Inference function ----------
 def tts_generate(text: str):
+    text = text.strip()
+    if not text:
         return None
+    # This is the same as your local script
+    wav = tts.tts(text)
+    # Ensure numpy array (1D) for Gradio
     wav = np.asarray(wav, dtype="float32").flatten()
     # Gradio Audio(type="numpy") expects (sample_rate, np.ndarray)
     fn=tts_generate,
     inputs=gr.Textbox(
         label="Input text",
+        placeholder="Type Sinhala text here…",
         lines=3,
     ),
     outputs=gr.Audio(
         label="Generated speech",
         type="numpy",
     ),
+    title="Sinhala TTS ",
+    description="Sinhala TTS model research-stage model.",
 )
 if __name__ == "__main__":