Spaces:

sreepathi-ravikumar
/

backendprocess

Sleeping

App Files Files Community

sreepathi-ravikumar committed on May 8, 2025

Commit

bbec22f

verified ·

1 Parent(s): ef53bee

Rename AudioGeneration.py to tts_engine.py

Browse files

Files changed (2) hide show

AudioGeneration.py +0 -10
tts_engine.py +59 -0

AudioGeneration.py DELETED Viewed

@@ -1,10 +0,0 @@
-from TTS.api import TTS
-import os
-# Initialize the TTS model (use a lightweight but high-quality model)
-tts = TTS(model_name="tts_models/en/ljspeech/tacotron2-DDC", progress_bar=False, gpu=False)
-def generate_audio(text):  # Write speech for `text` via the module-level `tts` object and return the output path.
-    output_path = "output.wav"  # constant relative path, so every call targets the same file
-    tts.tts_to_file(text=text, file_path=output_path)
-    return output_path

tts_engine.py ADDED Viewed

	@@ -0,0 +1,59 @@

+import edge_tts
+import asyncio
+import os
+from pydub import AudioSegment
+from langdetect import detect, LangDetectException
+import logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(_name_)
+class BilingualTTS:
+    def _init_(self):
+        self.voices = {
+            'ta': 'ta-IN-PallaviNeural',  # Tamil voice
+            'en': 'en-US-AriaNeural'     # English voice
+        }
+        self.temp_dir = "/app/temp"
+        os.makedirs(self.temp_dir, exist_ok=True)
+    async def _generate_segment(self, text, voice, idx):
+        output_file = os.path.join(self.temp_dir, f"segment_{idx}.mp3")
+        communicate = edge_tts.Communicate(text, voice)
+        await communicate.save(output_file)
+        return output_file
+    async def generate_audio(self, text):
+        try:
+            # Split text into sentences
+            sentences = [s.strip() for s in text.split('.') if s.strip()]
+            # Generate audio segments
+            tasks = []
+            for idx, sentence in enumerate(sentences):
+                try:
+                    lang = detect(sentence)
+                    voice = self.voices['en'] if lang not in ['ta', 'en'] else self.voices[lang]
+                except LangDetectException:
+                    voice = self.voices['en']
+                tasks.append(self._generate_segment(sentence, voice, idx))
+            # Process all segments concurrently
+            segment_files = await asyncio.gather(*tasks)
+            # Combine audio segments
+            combined = AudioSegment.empty()
+            for sf in segment_files:
+                combined += AudioSegment.from_mp3(sf)
+                os.remove(sf)  # Cleanup
+            # Save final output
+            output_path = os.path.join(self.temp_dir, "final_output.mp3")
+            combined.export(output_path, format="mp3")
+            return output_path
+        except Exception as e:
+            logger.error(f"TTS Generation Error: {str(e)}")
+            raise RuntimeError(f"TTS Failed: {str(e)}")