Spaces:
Running
Running
Ronaldo committed on
Commit ·
b2105a3
1
Parent(s): 3b67889
first commit
Browse files- README.md +2 -1
- app.py +15 -10
- requirements.txt +3 -3
README.md
CHANGED
|
@@ -4,7 +4,7 @@ emoji: ποΈ
|
|
| 4 |
colorFrom: blue
|
| 5 |
colorTo: green
|
| 6 |
sdk: gradio
|
| 7 |
-
sdk_version: "4.
|
| 8 |
python_version: "3.10"
|
| 9 |
app_file: app.py
|
| 10 |
pinned: false
|
|
@@ -92,6 +92,7 @@ L'interface Gradio s'ouvrira automatiquement sur `http://localhost:7860`
|
|
| 92 |
- 🇧🇯 Mina (gej)
|
| 93 |
- 🇧🇯 Ditammari (tbz)
|
| 94 |
- 🇳🇬 Yoruba (yor)
|
|
|
|
| 95 |
- 🇬🇧 English (eng)
|
| 96 |
|
| 97 |
### Onglet 3: ℹ️ À propos
|
|
|
|
| 4 |
colorFrom: blue
|
| 5 |
colorTo: green
|
| 6 |
sdk: gradio
|
| 7 |
+
sdk_version: "4.44.1"
|
| 8 |
python_version: "3.10"
|
| 9 |
app_file: app.py
|
| 10 |
pinned: false
|
|
|
|
| 92 |
- 🇧🇯 Mina (gej)
|
| 93 |
- 🇧🇯 Ditammari (tbz)
|
| 94 |
- 🇳🇬 Yoruba (yor)
|
| 95 |
+
- 🇧🇯 Fon (fon)
|
| 96 |
- 🇬🇧 English (eng)
|
| 97 |
|
| 98 |
### Onglet 3: ℹ️ À propos
|
app.py
CHANGED
|
@@ -23,6 +23,7 @@ LANGUAGE_MAPPING = {
|
|
| 23 |
"Mina (gej)": "facebook/mms-tts-gej",
|
| 24 |
"Ditammari (tbz)": "facebook/mms-tts-tbz",
|
| 25 |
"Yoruba (yor)": "facebook/mms-tts-yor",
|
|
|
|
| 26 |
"English (eng)": "facebook/mms-tts-eng",
|
| 27 |
}
|
| 28 |
|
|
@@ -96,12 +97,15 @@ def process_audio(audio_data):
|
|
| 96 |
logger.error(f"Erreur traitement audio: {e}")
|
| 97 |
raise
|
| 98 |
|
| 99 |
-
def transcribe_audio(audio,
|
| 100 |
"""Transcrit l'audio en texte (ASR)"""
|
| 101 |
if audio is None:
|
| 102 |
return "β Veuillez enregistrer ou uploader un fichier audio"
|
| 103 |
|
| 104 |
try:
|
|
|
|
|
|
|
|
|
|
| 105 |
audio_processed = process_audio(audio)
|
| 106 |
model, processor = load_asr_model()
|
| 107 |
processor.current_lang = language
|
|
@@ -170,15 +174,15 @@ with gr.Blocks(title="ποΈ MMS ASR/TTS - Speech AI", theme=gr.themes.Soft())
|
|
| 170 |
)
|
| 171 |
language_asr = gr.Dropdown(
|
| 172 |
choices=[
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 173 |
"English (eng)",
|
| 174 |
-
"French (fra)",
|
| 175 |
-
"Spanish (spa)",
|
| 176 |
-
"German (deu)",
|
| 177 |
-
"Portuguese (por)",
|
| 178 |
-
"Arabic (ara)",
|
| 179 |
-
"Hindi (hin)",
|
| 180 |
-
"Chinese (zho)",
|
| 181 |
-
"Japanese (jpn)",
|
| 182 |
],
|
| 183 |
value="English (eng)",
|
| 184 |
label="π Langue"
|
|
@@ -279,6 +283,7 @@ with gr.Blocks(title="ποΈ MMS ASR/TTS - Speech AI", theme=gr.themes.Soft())
|
|
| 279 |
<li>🇧🇯 Mina (gej)</li>
|
| 280 |
<li>🇧🇯 Ditammari (tbz)</li>
|
| 281 |
<li>🇳🇬 Yoruba (yor)</li>
|
|
|
|
| 282 |
<li>🇬🇧 English (eng)</li>
|
| 283 |
</ul>
|
| 284 |
|
|
@@ -312,4 +317,4 @@ with gr.Blocks(title="ποΈ MMS ASR/TTS - Speech AI", theme=gr.themes.Soft())
|
|
| 312 |
if __name__ == "__main__":
|
| 313 |
logger.info(f"π DΓ©marrage de l'interface Gradio")
|
| 314 |
logger.info(f"π Device: {get_device()}")
|
| 315 |
-
demo.launch(share=
|
|
|
|
| 23 |
"Mina (gej)": "facebook/mms-tts-gej",
|
| 24 |
"Ditammari (tbz)": "facebook/mms-tts-tbz",
|
| 25 |
"Yoruba (yor)": "facebook/mms-tts-yor",
|
| 26 |
+
"Fon (fon)": "facebook/mms-tts-fon",
|
| 27 |
"English (eng)": "facebook/mms-tts-eng",
|
| 28 |
}
|
| 29 |
|
|
|
|
| 97 |
logger.error(f"Erreur traitement audio: {e}")
|
| 98 |
raise
|
| 99 |
|
| 100 |
+
def transcribe_audio(audio, language_label):
|
| 101 |
"""Transcrit l'audio en texte (ASR)"""
|
| 102 |
if audio is None:
|
| 103 |
return "β Veuillez enregistrer ou uploader un fichier audio"
|
| 104 |
|
| 105 |
try:
|
| 106 |
+
# Extrait le code de langue du format "Langue (code)"
|
| 107 |
+
language = language_label.split("(")[-1].rstrip(")")
|
| 108 |
+
|
| 109 |
audio_processed = process_audio(audio)
|
| 110 |
model, processor = load_asr_model()
|
| 111 |
processor.current_lang = language
|
|
|
|
| 174 |
)
|
| 175 |
language_asr = gr.Dropdown(
|
| 176 |
choices=[
|
| 177 |
+
"Biali (beh)",
|
| 178 |
+
"Baatombu (bba)",
|
| 179 |
+
"Dendi (ddn)",
|
| 180 |
+
"Éwé (ewe)",
|
| 181 |
+
"Mina (gej)",
|
| 182 |
+
"Ditammari (tbz)",
|
| 183 |
+
"Yoruba (yor)",
|
| 184 |
+
"Fon (fon)",
|
| 185 |
"English (eng)",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 186 |
],
|
| 187 |
value="English (eng)",
|
| 188 |
label="π Langue"
|
|
|
|
| 283 |
<li>🇧🇯 Mina (gej)</li>
|
| 284 |
<li>🇧🇯 Ditammari (tbz)</li>
|
| 285 |
<li>🇳🇬 Yoruba (yor)</li>
|
| 286 |
+
<li>🇧🇯 Fon (fon)</li>
|
| 287 |
<li>🇬🇧 English (eng)</li>
|
| 288 |
</ul>
|
| 289 |
|
|
|
|
| 317 |
if __name__ == "__main__":
|
| 318 |
logger.info(f"π DΓ©marrage de l'interface Gradio")
|
| 319 |
logger.info(f"π Device: {get_device()}")
|
| 320 |
+
demo.launch(share=False, debug=False)
|
requirements.txt
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
-
gradio==4.
|
| 2 |
-
transformers==4.
|
| 3 |
torch==2.1.1
|
| 4 |
torchaudio==2.1.1
|
| 5 |
-
librosa==0.10.
|
| 6 |
soundfile==0.12.1
|
| 7 |
numpy==1.24.3
|
|
|
|
| 1 |
+
gradio==4.44.1
|
| 2 |
+
transformers==4.40.0
|
| 3 |
torch==2.1.1
|
| 4 |
torchaudio==2.1.1
|
| 5 |
+
librosa==0.10.1
|
| 6 |
soundfile==0.12.1
|
| 7 |
numpy==1.24.3
|