Spaces:

Timemaster
/

multilingual-tts-v2

Running

App Files Files Community

Timemaster committed on Oct 26, 2025

Commit

b0f6a83

verified ·

1 Parent(s): 4ed7f20

Update app.py

Browse files

Files changed (1) hide show

app.py +41 -20

app.py CHANGED Viewed

@@ -1,49 +1,70 @@
-from tts_voice import tts_order_voice
-import edge_tts
 import gradio as gr
 import tempfile
-import anyio
 language_dict = tts_order_voice
 async def text_to_speech_edge(text, language_code):
-    voice = language_dict[language_code]
-    communicate = edge_tts.Communicate(text, voice)
-    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
-        tmp_path = tmp_file.name
-    await communicate.save(tmp_path)
-    # Translated output message
-    return "Speech synthesis complete: {}".format(text), tmp_path
-# --- UI TRANSLATION AND MODERN GRADIO SYNTAX ---
-# Input Component: Textbox label translated
 input_text = gr.Textbox(lines=5, label="Input Text")
-# Output Component: Textbox label translated
 output_text = gr.Textbox(label="Output Text")
-# Output Component: Audio label translated
 output_audio = gr.Audio(type="filepath", label="Generated Audio File")
 default_language = list(language_dict.keys())[0]
-# Input Component: Dropdown label translated
 language = gr.Dropdown(
     choices=list(language_dict.keys()),
     value=default_language,
     label="Language / Voice"
 )
-# Interface Translation: Title and Description translated
 interface = gr.Interface(
     fn=text_to_speech_edge,
     inputs=[input_text, language],
     outputs=[output_text, output_audio],
-    title="Edge TTS Text-to-Speech", # Translated title
-    description="Convert text into high-quality audio using various Edge TTS voices." # Added description in English
 )
 if __name__ == "__main__":
     interface.launch()

+# WARNING: This file assumes you have a tts_voice.py file with English-translated keys.
 import gradio as gr
 import tempfile
+import edge_tts
+import anyio
+# Voice mapping from the local tts_voice module: dropdown label -> Edge TTS voice name
+from tts_voice import tts_order_voice
 language_dict = tts_order_voice  # keys populate the voice dropdown; values are the voice names handed to edge_tts
+# Pinned WebSocket URL of the Bing speech "readaloud" synthesis service.
+VOICE_SERVICE_ENDPOINT = "wss://speech.platform.bing.com/consumer/speech/synthesize/readaloud/v1"  # NOTE(review): confirm edge_tts.Communicate supports an endpoint override before relying on this value
 async def text_to_speech_edge(text, language_code):
     """Synthesize ``text`` to an MP3 file using the voice mapped to ``language_code``.
 
     Args:
         text: Text to speak. Empty or whitespace-only input is rejected.
         language_code: Key into ``language_dict`` selecting the Edge TTS voice.
 
     Returns:
         A ``(message, path)`` tuple matching the two Gradio outputs. ``path`` is
         the generated MP3 file on success and ``None`` on any failure, in which
         case ``message`` describes the problem. Errors are reported through the
         message rather than raised.
     """
     import os  # local import: the file's top-level imports do not include os
 
     if not text or not text.strip():
         return "ERROR: Input text cannot be empty. Please enter text.", None
 
     try:
         voice = language_dict[language_code]
     except (KeyError, TypeError):
         # Unknown (or unhashable) selection: say so instead of echoing a bare key repr.
         return f"ERROR: Unknown language/voice selection: {language_code!r}", None
 
     tmp_path = None
     succeeded = False
     try:
         # Only the path is needed; the handle is closed before edge_tts writes to it.
         with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
             tmp_path = tmp_file.name
         # No endpoint override is passed: Communicate has no ``websocket_url``
         # parameter, so supplying one raised TypeError on every request.
         communicate = edge_tts.Communicate(text, voice)
         await communicate.save(tmp_path)
         succeeded = True
         return "Speech synthesis complete: {}".format(text), tmp_path
     except edge_tts.exceptions.NoAudioReceived:
         return "ERROR: Failed to generate audio. The TTS service is rejecting the request. Check your text length or try a different voice.", None
     except Exception as e:
         # UI boundary: surface the failure in the output box instead of raising.
         return f"An unexpected error occurred: {str(e)}", None
     finally:
         # delete=False means nothing else removes the file, so drop it whenever
         # synthesis did not complete (including task cancellation).
         if not succeeded and tmp_path is not None:
             try:
                 os.remove(tmp_path)
             except OSError:
                 pass  # best-effort cleanup; the original error message matters more
+# --- Gradio components: text input, status message output, audio output, voice dropdown ---
 input_text = gr.Textbox(lines=5, label="Input Text")
 output_text = gr.Textbox(label="Output Text")  # shows the status / error message returned by the handler
 output_audio = gr.Audio(type="filepath", label="Generated Audio File")  # fed the MP3 path (None on failure)
 default_language = list(language_dict.keys())[0]  # first mapping key is preselected; raises IndexError if the mapping is empty
 language = gr.Dropdown(
     choices=list(language_dict.keys()),
     value=default_language,
     label="Language / Voice"
 )
+# --- Interface: binds text_to_speech_edge to the components defined above ---
 interface = gr.Interface(
     fn=text_to_speech_edge,
     inputs=[input_text, language],  # order matches the handler's (text, language_code) parameters
     outputs=[output_text, output_audio],  # order matches the handler's (message, path) return tuple
+    title="Edge TTS Text-to-Speech",
+    description="Convert text into high-quality audio using various Edge TTS voices."
 )
+# --- Launch the app only when executed as a script, not on import ---
 if __name__ == "__main__":
     interface.launch()