Spaces:

Amir20255
/

Text_To_Speech

Runtime error

Amir20255 committed on May 16, 2025

Commit

f4a1d9e

verified ·

1 Parent(s): fcf61f9

Upload 2 files

Files changed (2) hide show

app.py CHANGED Viewed

@@ -1,39 +1,31 @@
 import gradio as gr
-from TTS.api import TTS
-import os
-# تحميل نموذج FastSpeech 2 (أو نموذج أسرع)
-tts = TTS(model_name="fastspeech2-en-ljspeech", progress_bar=True)
-# دالة لتحويل النص إلى جمل صغيرة بحيث لا تتجاوز 50 كلمة
-def split_text_into_chunks(text, max_words=50):
-    words = text.split()
-    chunks = [words[i:i + max_words] for i in range(0, len(words), max_words)]
-    return [" ".join(chunk) for chunk in chunks]
 # دالة لتحويل النص إلى صوت
 def text_to_speech(text):
-    # تقسيم النص إلى جمل أو مقاطع
-    chunks = split_text_into_chunks(text)
-    # توليد الصوت لكل جزء
-    audio_paths = []
-    for i, chunk in enumerate(chunks):
-        output_file = f"output_{i}.wav"
-        tts.tts_to_file(text=chunk, file_path=output_file)
-        audio_paths.append(output_file)
-    # دمج المقاطع الصوتية معًا
-    final_output = "final_output.wav"
-    with open(final_output, 'wb') as f:
-        for audio_path in audio_paths:
-            with open(audio_path, 'rb') as audio_file:
-                f.write(audio_file.read())
-            os.remove(audio_path)  # حذف الملفات المؤقتة بعد الدمج
-    return final_output
-# واجهة المستخدم مع Gradio
 iface = gr.Interface(fn=text_to_speech, inputs="text", outputs="audio", live=True)
 # تشغيل التطبيق

 import gradio as gr
+import torchaudio
+from speechbrain.pretrained import FastSpeech2
+from speechbrain.pretrained import HIFIGAN
+# تحميل النموذج الصوتي
+fastspeech2 = FastSpeech2.from_hparams(
+    source="speechbrain/tts-fastspeech2-ljspeech",
+    savedir="tmpdir_tts"
+)
+hifi_gan = HIFIGAN.from_hparams(
+    source="speechbrain/tts-hifigan-ljspeech",
+    savedir="tmpdir_vocoder"
+)
 # دالة لتحويل النص إلى صوت
 def text_to_speech(text):
+    mel_output, durations, pitch, energy = fastspeech2.encode_text(
+        [text],
+        pace=1.0,
+        pitch_rate=1.0,
+        energy_rate=1.0
+    )
+    waveform = hifi_gan.decode_batch(mel_output)
+    torchaudio.save("output.wav", waveform.squeeze(1), 22050)
+    return "output.wav"
+# واجهة المستخدم باستخدام Gradio
 iface = gr.Interface(fn=text_to_speech, inputs="text", outputs="audio", live=True)
 # تشغيل التطبيق

requirements.txt CHANGED Viewed

@@ -1,8 +1,4 @@
-TTS
-numpy<=1.26
-pydub
-numba<0.59
 speechbrain==0.5.12
 gradio==3.10.0
 torch==1.12.1
-librosa==0.9.2

 speechbrain==0.5.12
 gradio==3.10.0
 torch==1.12.1
+torchaudio==0.12.1