Spaces:

SAD43W
/

speech

Sleeping

SAD43W committed on Jul 26, 2025

Commit

3c08b54

verified ·

1 Parent(s): 44c4441

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,49 +1,24 @@
-import os
-os.environ["COQUI_TOS_AGREED"] = "1"
-import torch
-from torch.serialization import add_safe_globals
-from TTS.tts.configs.xtts_config import XttsConfig
-from TTS.tts.models.xtts import XttsAudioConfig
-from TTS.config.shared_configs import BaseDatasetConfig  # NEW ADD
-add_safe_globals([XttsConfig, XttsAudioConfig, BaseDatasetConfig])
 from TTS.api import TTS
 import gradio as gr
-tts = TTS(model_name="tts_models/multilingual/multi-dataset/xtts_v2")
 tts.to("cuda" if torch.cuda.is_available() else "cpu")
-def synthesize(text, speaker_wav):
     output_path = "output.wav"
-    if speaker_wav is None:
-        return "No voice sample uploaded.", None
-    speaker_path = "temp_speaker.wav"
-    speaker_wav.save(speaker_path)
-    tts.tts_to_file(
-        text=text,
-        speaker_wav=speaker_path,
-        language="en",
-        file_path=output_path
-    )
-    return "Done. Listen below.", output_path
 iface = gr.Interface(
     fn=synthesize,
-    inputs=[
-        gr.Textbox(label="Text to Speak", placeholder="Come closer... I've been waiting in the dark."),
-        gr.Audio(source="upload", type="file", label="Creepy Voice Sample")
-    ],
-    outputs=[
-        gr.Textbox(label="Status"),
-        gr.Audio(label="Result Audio")
-    ],
-    title="XTTS‑V2 Horror Whisperer 👻",
-    description="Upload a voice and make it say creepy stuff. XTTS‑v2 powered, GPU-juiced. 🧟‍♂️💀"
 )
 if __name__ == "__main__":

 from TTS.api import TTS
 import gradio as gr
+import torch
+import os
+os.environ["CUDA_VISIBLE_DEVICES"] = "0"  # Use GPU if available
+tts = TTS(model_name="tts_models/en/ljspeech/tacotron2-DDC")
 tts.to("cuda" if torch.cuda.is_available() else "cpu")
+def synthesize(text):
     output_path = "output.wav"
+    tts.tts_to_file(text=text, file_path=output_path)
+    return output_path
 iface = gr.Interface(
     fn=synthesize,
+    inputs=gr.Textbox(lines=3, label="Enter text to synthesize"),
+    outputs=gr.Audio(type="filepath", label="Generated Speech"),
+    title="Mozilla Tacotron2 TTS - Smooth & Clean",
+    description="Simple text-to-speech using Mozilla's Tacotron2-DDC model. No voice samples required."
 )
 if __name__ == "__main__":