Update app.py
Browse files
app.py
CHANGED
|
@@ -1,6 +1,7 @@
|
|
| 1 |
import os
|
| 2 |
import gradio as gr
|
| 3 |
import torch
|
|
|
|
| 4 |
|
| 5 |
# ✅ Forzar consentimiento de licencia
|
| 6 |
os.environ["COQUI_TOS_AGREED"] = "1"
|
|
@@ -19,11 +20,11 @@ from TTS.api import TTS
|
|
| 19 |
tts = TTS(model_name="tts_models/multilingual/multi-dataset/xtts_v2")
|
| 20 |
|
| 21 |
# 🎤 Función principal
|
| 22 |
-
def generate_audio(text, language, speaker_wav
|
| 23 |
if speaker_wav is not None:
|
| 24 |
-
|
| 25 |
-
|
| 26 |
-
|
| 27 |
|
| 28 |
# 🎛️ Interfaz
|
| 29 |
iface = gr.Interface(
|
|
@@ -31,7 +32,7 @@ iface = gr.Interface(
|
|
| 31 |
inputs=[
|
| 32 |
gr.Text(label="Texto"),
|
| 33 |
gr.Text(label="Idioma (ej: 'es', 'en')"),
|
| 34 |
-
gr.Audio(type="filepath", label="Audio de voz
|
| 35 |
],
|
| 36 |
outputs=gr.Audio(label="Audio generado")
|
| 37 |
)
|
|
|
|
| 1 |
import os
|
| 2 |
import gradio as gr
|
| 3 |
import torch
|
| 4 |
+
import numpy as np
|
| 5 |
|
| 6 |
# ✅ Forzar consentimiento de licencia
|
| 7 |
os.environ["COQUI_TOS_AGREED"] = "1"
|
|
|
|
| 20 |
tts = TTS(model_name="tts_models/multilingual/multi-dataset/xtts_v2")
|
| 21 |
|
| 22 |
# 🎤 Función principal
|
| 23 |
+
def generate_audio(text, language, speaker_wav):
    """Synthesize ``text`` with the module-level ``tts`` model using a reference voice.

    Args:
        text: Text to be spoken.
        language: Language code forwarded to the model (e.g. ``"es"``, ``"en"``).
        speaker_wav: Path to the reference voice recording, or ``None`` when
            no recording was supplied.

    Returns:
        A ``(sample_rate, samples)`` tuple, where ``samples`` is a float32
        NumPy array, or ``None`` when ``speaker_wav`` is ``None``.
    """
    if speaker_wav is None:
        # No reference voice to clone: produce no audio (unchanged behavior,
        # now explicit instead of falling off the end of the function).
        return None

    audio = tts.tts(text=text, speaker_wav=speaker_wav, language=language)

    # float16 keeps only ~11 significant bits and needlessly rounds the
    # waveform; float32 avoids that extra quantization step.
    audio_np = np.asarray(audio, dtype=np.float32)

    # Report the rate the loaded model actually renders at rather than a
    # hard-coded 22050 Hz; a mismatched rate plays back at the wrong speed and
    # pitch. NOTE(review): XTTS v2 is documented as producing 24 kHz output --
    # confirm `tts.synthesizer.output_sample_rate` on the installed TTS version.
    # The previous constant is kept as a fallback when the attribute is absent.
    synthesizer = getattr(tts, "synthesizer", None)
    sample_rate = getattr(synthesizer, "output_sample_rate", None) or 22050

    return (int(sample_rate), audio_np)
|
| 28 |
|
| 29 |
# 🎛️ Interfaz
|
| 30 |
iface = gr.Interface(
|
|
|
|
| 32 |
inputs=[
|
| 33 |
gr.Text(label="Texto"),
|
| 34 |
gr.Text(label="Idioma (ej: 'es', 'en')"),
|
| 35 |
+
gr.Audio(type="filepath", label="Audio de voz")
|
| 36 |
],
|
| 37 |
outputs=gr.Audio(label="Audio generado")
|
| 38 |
)
|