Spaces:

Nick021402
/

Text2speech

Sleeping

App Files Files Community

Nick021402 committed on May 23, 2025

Commit

f8bacea

verified ·

1 Parent(s): 892b3a1

Update app.py

Browse files

Files changed (1) hide show

app.py +11 -11

app.py CHANGED Viewed

@@ -34,8 +34,8 @@ except Exception as e:
 class LongFormTTS:
     def __init__(self):
         self.tts = tts
-        self.speakers = speakers  # Store available speakers
-        self.sample_rate = 22050  # Coqui default sample rate
     def preprocess_text(self, text):
         """Clean and prepare text for TTS"""
@@ -54,7 +54,6 @@ class LongFormTTS:
         text = re.sub(r'\b(\d{1,4})\b', lambda m: self.number_to_words(int(m.group())), text)
         text = re.sub(r'\b(1[0-9]{3}|20[0-9]{2}|2100)\b', lambda m: m.group(), text)
         text = re.sub(r'[^\w\s\.,!?;:\-\(\)\'"]', ' ', text)
-        text = re.sub(r'\s+', ' ', text)
         return text.strip()
     def number_to_words(self, num):
@@ -158,7 +157,7 @@ def text_to_speech_interface(text, speaker="p225", progress=gr.Progress()):
         if audio is None:
             return None, "❌ Failed to generate audio."
         progress(0.9, desc="💾 Saving audio file...")
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
             sf.write(tmp_file.name, audio, sample_rate)
             audio_path = tmp_file.name
         progress(1.0, desc="✅ Complete!")
@@ -211,13 +210,13 @@ def create_interface():
                     placeholder="Type or paste your text here... (Max 50,000 characters)",
                     lines=10,
                     max_lines=20,
-                    info="Supports any length text with automatic chunking for optimal quality"
                 )
                 char_count = gr.HTML("<span style='color: #666;'>Character count: 0 / 50,000</span>")
                 speaker_dropdown = gr.Dropdown(
                     choices=tts_system.speakers if tts_system else [],
-                    value=tts_system.speakers[0] if tts_system else None,
-                    label="🗣️ Choose Voice"
                 )
                 generate_btn = gr.Button("🎯 Generate Speech", variant="primary", size="lg", scale=1)
             with gr.Column(scale=1):
@@ -230,6 +229,7 @@ def create_interface():
                         <li>⚡ Smart text processing</li>
                         <li>🔧 Auto chunking</li>
                         <li>🎵 Natural-sounding speech</li>
                     </ul>
                 </div>
                 """)
@@ -240,7 +240,7 @@ def create_interface():
             count = len(text) if text else 0
             color = "#28a745" if count <= 50000 else "#dc3545"
             return f'<span style="color: {color};">Character count: {count:,} / 50,000</span>'
         text_input.change(fn=update_char_count, inputs=[text_input], outputs=[char_count])
         generate_btn.click(
@@ -252,9 +252,9 @@ def create_interface():
         gr.Examples(
             examples=[
-                ["Hello! Welcome to our advanced text-to-speech system. This technology can convert any written text into natural-sounding human speech.", "p225"],
-                ["The quick brown fox jumps over the lazy dog. This pangram contains every letter of the English alphabet and is perfect for testing speech synthesis.", "p226"],
-                ["Artificial intelligence has revolutionized many aspects of our daily lives.", "p227"],
             ],
             inputs=[text_input, speaker_dropdown],
             label="📚 Try These Examples"

 class LongFormTTS:
     def __init__(self):
         self.tts = tts
+        self.speakers = speakers or ["p225", "p226", "p227", "p228"]  # fallback static list
+        self.sample_rate = 22050  # Default sample rate for Coqui TTS
     def preprocess_text(self, text):
         """Clean and prepare text for TTS"""
         text = re.sub(r'\b(\d{1,4})\b', lambda m: self.number_to_words(int(m.group())), text)
         text = re.sub(r'\b(1[0-9]{3}|20[0-9]{2}|2100)\b', lambda m: m.group(), text)
         text = re.sub(r'[^\w\s\.,!?;:\-\(\)\'"]', ' ', text)
         return text.strip()
     def number_to_words(self, num):
         if audio is None:
             return None, "❌ Failed to generate audio."
         progress(0.9, desc="💾 Saving audio file...")
+        with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
             sf.write(tmp_file.name, audio, sample_rate)
             audio_path = tmp_file.name
         progress(1.0, desc="✅ Complete!")
                     placeholder="Type or paste your text here... (Max 50,000 characters)",
                     lines=10,
                     max_lines=20,
+                    info="Supports any length text with automatic chunking"
                 )
                 char_count = gr.HTML("<span style='color: #666;'>Character count: 0 / 50,000</span>")
                 speaker_dropdown = gr.Dropdown(
                     choices=tts_system.speakers if tts_system else [],
+                    value=tts_system.speakers[0] if tts_system and tts_system.speakers else None,
+                    label="🗣️ Select Voice"
                 )
                 generate_btn = gr.Button("🎯 Generate Speech", variant="primary", size="lg", scale=1)
             with gr.Column(scale=1):
                         <li>⚡ Smart text processing</li>
                         <li>🔧 Auto chunking</li>
                         <li>🎵 Natural-sounding speech</li>
+                        <li>🔊 MP3 audio output</li>
                     </ul>
                 </div>
                 """)
             count = len(text) if text else 0
             color = "#28a745" if count <= 50000 else "#dc3545"
             return f'<span style="color: {color};">Character count: {count:,} / 50,000</span>'
         text_input.change(fn=update_char_count, inputs=[text_input], outputs=[char_count])
         generate_btn.click(
         gr.Examples(
             examples=[
+                ["Hello! Welcome to our advanced text-to-speech system.", "p225"],
+                ["The quick brown fox jumps over the lazy dog.", "p226"],
+                ["Artificial intelligence has revolutionized many aspects of our lives.", "p227"],
             ],
             inputs=[text_input, speaker_dropdown],
             label="📚 Try These Examples"