Spaces:

tarawele1
/

Mandeka-TTS

Sleeping

App Files Files Community

tarawele1 committed on Apr 24

Commit

e2dbfa0

verified ·

1 Parent(s): 8c52a5a

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -38

app.py CHANGED Viewed

@@ -1,49 +1,47 @@
 import gradio as gr
-from TTS.utils.synthesizer import Synthesizer
-import os
-# 1. Chargement de votre modèle Bambara
-# Assurez-vous que les noms correspondent bien aux fichiers que vous avez uploadés
-config_path = "config.json"
-model_path = "best_model.pth"
-print("Chargement du modèle TTS...")
-synth = Synthesizer(
-    tts_checkpoint=model_path,
-    tts_config_path=config_path
-)
-# 2. Fonction qui s'exécute quand l'utilisateur clique sur "Générer"
-def lire_bambara(texte):
-    # CORRECTION : On remplace les caractères spéciaux bambara par des caractères latins standard
-    # (le PDF original avait perdu ces caractères à l'affichage)
-    texte_nettoye = texte.replace('ɛ', 'e').replace('ɔ', 'o').replace('Ɛ', 'E').replace('Ɔ', 'O')
-    # Synthèse de la voix avec le texte nettoyé
-    wav = synth.tts(text=texte_nettoye)
-    # Sauvegarde temporaire du fichier audio
-    output_path = "output.wav"
-    synth.save_wav(wav, output_path)
-    return output_path
-# 3. Création de l'interface graphique avec Gradio
-interface = gr.Interface(
-    fn=lire_bambara,
-    inputs=gr.Textbox(
-        label="Texte en Bambara",
-        placeholder="Aw ni ce, ne be bamanankan fo..."
-    ),
     outputs=gr.Audio(label="Audio généré", type="filepath"),
     title="Synthèse Vocale en Bambara",
-    description="Entrez du texte en bambara, et le modèle générera la voix correspondante.",
     examples=[
-        ["Ikireni jamanakuntigi Volodymyr Zelenskyy."],
-        ["Siyasa koo be ka wuli."]
-    ]
 )
-# 4. Lancement de l'application
-interface.launch()

 import gradio as gr
+from transformers import VitsModel, AutoTokenizer
+import torch
+import scipy.io.wavfile
+import tempfile
+# 1. Load Meta's Bambara MMS text-to-speech model and its tokenizer.
+#    This runs at module level, i.e. once when the module is first executed,
+#    so text_to_speech() reuses the same objects on every call.
+model_name = "facebook/mms-tts-bam"
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = VitsModel.from_pretrained(model_name)
+def text_to_speech(texte):
+    """Synthesize speech for ``texte`` and return the path of a WAV file.
+
+    Args:
+        texte: Text to speak. ``None``, empty, or whitespace-only input
+            produces no audio.
+
+    Returns:
+        Path of a newly created temporary ``.wav`` file, or ``None`` when
+        there is nothing to synthesize. The file is created with
+        ``delete=False``, so it is not removed automatically.
+    """
+    # Guard against None as well as blank text: calling .strip() on None
+    # would raise AttributeError.
+    if not texte or not texte.strip():
+        return None
+    # 2. Tokenize the text into PyTorch tensors for the model.
+    inputs = tokenizer(texte, return_tensors="pt")
+    # 3. Generate the audio; inference only, so gradient tracking is disabled.
+    with torch.no_grad():
+        output = model(**inputs).waveform
+    # 4. Write the audio to a temporary WAV file at the model's sampling rate.
+    frequence = model.config.sampling_rate
+    # First entry of the returned waveform batch (a single text was passed in).
+    donnees_audio = output[0].numpy()
+    # Reserve a unique file name, then close the handle BEFORE writing: an
+    # open NamedTemporaryFile cannot be reopened by name on Windows, and
+    # closing first avoids holding two handles on the same file.
+    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as temp_audio:
+        chemin_audio = temp_audio.name
+    scipy.io.wavfile.write(chemin_audio, rate=frequence, data=donnees_audio)
+    return chemin_audio
+# 5. Build the Gradio user interface: one text box in, one audio player out.
+demo = gr.Interface(
+    fn=text_to_speech,
+    inputs=gr.Textbox(label="Texte en Bambara", placeholder="Tapez votre texte ici...", lines=3),
+    # type="filepath" matches text_to_speech(), which returns a path to a WAV file.
     outputs=gr.Audio(label="Audio généré", type="filepath"),
     title="Synthèse Vocale en Bambara",
+    description="Entrez du texte en bambara. Cette application utilise le modèle officiel d'intelligence artificielle MMS de Meta pour générer la voix correspondante.",
+    # Sample sentences offered as examples; they use the Bambara letters ɛ and ɔ.
     examples=[
+        ["Ikirɛni jamanakuntigi Volodymyr Zelenskyy."],
+        ["Siyasa koo bɛ ka wuli."],
+        ["Aw ni cɛ, ne bɛ bamanankan fɔ."]
+    ],
+    theme=gr.themes.Soft()
 )
+# Start the web server only when this file is run as a script, not on import.
+if __name__ == "__main__":
+    demo.launch()