Spaces:

umarabbas890
/

AIVoiceoverGeneratorwithEmotionControl

Build error

App Files Community

umarabbas890 committed on Jun 18, 2025

Commit

a2ae3c3

verified ·

1 Parent(s): 2acb2e9

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -31

app.py CHANGED Viewed

@@ -1,9 +1,7 @@
 import os
-os.environ["COQUI_TOS_AGREED"] = "1"  # Automatically accept Coqui ToS
 import torch.serialization
-# Add required Coqui XTTS classes to the trusted list
 torch.serialization.add_safe_globals([
     __import__("TTS.tts.configs.xtts_config").tts.configs.xtts_config.XttsConfig,
     __import__("TTS.tts.models.xtts").tts.models.xtts.XttsAudioConfig,
@@ -11,59 +9,53 @@ torch.serialization.add_safe_globals([
     __import__("TTS.config.shared_configs").config.shared_configs.BaseDatasetConfig
 ])
 import gradio as gr
 import torch
 import torchaudio
 from TTS.api import TTS
 import uuid
-# 🛠️ PyTorch 2.6+ fix for loading XTTS
-import torch.serialization
-torch.serialization.add_safe_globals([__import__("TTS.tts.configs.xtts_config").tts.configs.xtts_config.XttsConfig])
-# Load the XTTS model
 model_name = "tts_models/multilingual/multi-dataset/xtts_v2"
 tts = TTS(model_name=model_name, progress_bar=False, gpu=False)
-# Emotions mapped to style embeddings
-emotion_styles = {
-    "Neutral": "neutral",
-    "Sad": "sad",
-    "Happy": "happy",
-    "Angry": "angry",
-    "Excited": "excited"
 }
-# Generate voice and save as MP3
-import os
-def generate_voice(text, speaker_audio_path):
     if not os.path.isfile(speaker_audio_path):
         raise FileNotFoundError(f"Speaker audio file not found: {speaker_audio_path}")
     tts.tts_to_file(
         text=text,
         speaker_wav=speaker_audio_path,
         language="en",
-        file_path="output.wav"
     )
-    return "output.wav"
-    # Convert to MP3 using pydub
-    mp3_path = output_path.replace(".wav", ".mp3")
-    sound = AudioSegment.from_wav(output_path)
     sound.export(mp3_path, format="mp3")
     return mp3_path, mp3_path
-# Gradio Interface
 with gr.Blocks() as demo:
-    gr.Markdown("## 🎙️ AI Voiceover Generator with Emotion Control\nConvert your script into a voiceover with the tone you choose!")
     with gr.Row():
         script_input = gr.Textbox(label="Enter Your Script", lines=5, placeholder="Type your video script here...")

 import os
+os.environ["COQUI_TOS_AGREED"] = "1"
 import torch.serialization
 torch.serialization.add_safe_globals([
     __import__("TTS.tts.configs.xtts_config").tts.configs.xtts_config.XttsConfig,
     __import__("TTS.tts.models.xtts").tts.models.xtts.XttsAudioConfig,
     __import__("TTS.config.shared_configs").config.shared_configs.BaseDatasetConfig
 ])
 import gradio as gr
 import torch
 import torchaudio
 from TTS.api import TTS
+from pydub import AudioSegment
 import uuid
+# Load XTTS model
 model_name = "tts_models/multilingual/multi-dataset/xtts_v2"
 tts = TTS(model_name=model_name, progress_bar=False, gpu=False)
+# Map emotions to file paths
+emotion_to_file = {
+    "Neutral": "samples/neutral.wav",
+    "Sad": "samples/sad.wav",
+    "Happy": "samples/happy.wav",
+    "Angry": "samples/angry.wav",
+    "Excited": "samples/excited.wav"
 }
+# Voice generator
+def generate_voice(text, emotion):
+    speaker_audio_path = emotion_to_file.get(emotion)
     if not os.path.isfile(speaker_audio_path):
         raise FileNotFoundError(f"Speaker audio file not found: {speaker_audio_path}")
+    # Generate unique filenames to avoid overwrites
+    uid = uuid.uuid4().hex
+    wav_path = f"output_{uid}.wav"
+    mp3_path = f"output_{uid}.mp3"
     tts.tts_to_file(
         text=text,
         speaker_wav=speaker_audio_path,
         language="en",
+        file_path=wav_path
     )
+    # Convert to MP3
+    sound = AudioSegment.from_wav(wav_path)
     sound.export(mp3_path, format="mp3")
     return mp3_path, mp3_path
+# Gradio UI
 with gr.Blocks() as demo:
+    gr.Markdown("## 🎙️ AI Voiceover Generator with Emotion Control")
     with gr.Row():
         script_input = gr.Textbox(label="Enter Your Script", lines=5, placeholder="Type your video script here...")