Ronaldo committed on
Commit
b2105a3
·
1 Parent(s): 3b67889

first commit

Browse files
Files changed (3) hide show
  1. README.md +2 -1
  2. app.py +15 -10
  3. requirements.txt +3 -3
README.md CHANGED
@@ -4,7 +4,7 @@ emoji: 🎙️
4
  colorFrom: blue
5
  colorTo: green
6
  sdk: gradio
7
- sdk_version: "4.26.0"
8
  python_version: "3.10"
9
  app_file: app.py
10
  pinned: false
@@ -92,6 +92,7 @@ L'interface Gradio s'ouvrira automatiquement sur `http://localhost:7860`
92
  - 🇧🇯 Mina (gej)
93
  - 🇧🇯 Ditammari (tbz)
94
  - 🇳🇬 Yoruba (yor)
 
95
  - 🇬🇧 English (eng)
96
 
97
  ### Onglet 3: ℹ️ À propos
 
4
  colorFrom: blue
5
  colorTo: green
6
  sdk: gradio
7
+ sdk_version: "4.44.1"
8
  python_version: "3.10"
9
  app_file: app.py
10
  pinned: false
 
92
  - 🇧🇯 Mina (gej)
93
  - 🇧🇯 Ditammari (tbz)
94
  - 🇳🇬 Yoruba (yor)
95
+ - 🇧🇯 Fon (fon)
96
  - 🇬🇧 English (eng)
97
 
98
  ### Onglet 3: ℹ️ À propos
app.py CHANGED
@@ -23,6 +23,7 @@ LANGUAGE_MAPPING = {
23
  "Mina (gej)": "facebook/mms-tts-gej",
24
  "Ditammari (tbz)": "facebook/mms-tts-tbz",
25
  "Yoruba (yor)": "facebook/mms-tts-yor",
 
26
  "English (eng)": "facebook/mms-tts-eng",
27
  }
28
 
@@ -96,12 +97,15 @@ def process_audio(audio_data):
96
  logger.error(f"Erreur traitement audio: {e}")
97
  raise
98
 
99
- def transcribe_audio(audio, language):
100
  """Transcrit l'audio en texte (ASR)"""
101
  if audio is None:
102
  return "❌ Veuillez enregistrer ou uploader un fichier audio"
103
 
104
  try:
 
 
 
105
  audio_processed = process_audio(audio)
106
  model, processor = load_asr_model()
107
  processor.current_lang = language
@@ -170,15 +174,15 @@ with gr.Blocks(title="🎙️ MMS ASR/TTS - Speech AI", theme=gr.themes.Soft())
170
  )
171
  language_asr = gr.Dropdown(
172
  choices=[
 
 
 
 
 
 
 
 
173
  "English (eng)",
174
- "French (fra)",
175
- "Spanish (spa)",
176
- "German (deu)",
177
- "Portuguese (por)",
178
- "Arabic (ara)",
179
- "Hindi (hin)",
180
- "Chinese (zho)",
181
- "Japanese (jpn)",
182
  ],
183
  value="English (eng)",
184
  label="🌐 Langue"
@@ -279,6 +283,7 @@ with gr.Blocks(title="🎙️ MMS ASR/TTS - Speech AI", theme=gr.themes.Soft())
279
  <li>🇧🇯 Mina (gej)</li>
280
  <li>🇧🇯 Ditammari (tbz)</li>
281
  <li>🇳🇬 Yoruba (yor)</li>
 
282
  <li>🇬🇧 English (eng)</li>
283
  </ul>
284
 
@@ -312,4 +317,4 @@ with gr.Blocks(title="🎙️ MMS ASR/TTS - Speech AI", theme=gr.themes.Soft())
312
  if __name__ == "__main__":
313
  logger.info(f"🚀 Démarrage de l'interface Gradio")
314
  logger.info(f"📊 Device: {get_device()}")
315
- demo.launch(share=True, debug=False)
 
23
  "Mina (gej)": "facebook/mms-tts-gej",
24
  "Ditammari (tbz)": "facebook/mms-tts-tbz",
25
  "Yoruba (yor)": "facebook/mms-tts-yor",
26
+ "Fon (fon)": "facebook/mms-tts-fon",
27
  "English (eng)": "facebook/mms-tts-eng",
28
  }
29
 
 
97
  logger.error(f"Erreur traitement audio: {e}")
98
  raise
99
 
100
+ def transcribe_audio(audio, language_label):
101
  """Transcrit l'audio en texte (ASR)"""
102
  if audio is None:
103
  return "❌ Veuillez enregistrer ou uploader un fichier audio"
104
 
105
  try:
106
+ # Extrait le code de langue du format "Langue (code)"
107
+ language = language_label.split("(")[-1].rstrip(")")
108
+
109
  audio_processed = process_audio(audio)
110
  model, processor = load_asr_model()
111
  processor.current_lang = language
 
174
  )
175
  language_asr = gr.Dropdown(
176
  choices=[
177
+ "Biali (beh)",
178
+ "Baatombu (bba)",
179
+ "Dendi (ddn)",
180
+ "Éwé (ewe)",
181
+ "Mina (gej)",
182
+ "Ditammari (tbz)",
183
+ "Yoruba (yor)",
184
+ "Fon (fon)",
185
  "English (eng)",
 
 
 
 
 
 
 
 
186
  ],
187
  value="English (eng)",
188
  label="🌐 Langue"
 
283
  <li>🇧🇯 Mina (gej)</li>
284
  <li>🇧🇯 Ditammari (tbz)</li>
285
  <li>🇳🇬 Yoruba (yor)</li>
286
+ <li>🇧🇯 Fon (fon)</li>
287
  <li>🇬🇧 English (eng)</li>
288
  </ul>
289
 
 
317
  if __name__ == "__main__":
318
  logger.info(f"🚀 Démarrage de l'interface Gradio")
319
  logger.info(f"📊 Device: {get_device()}")
320
+ demo.launch(share=False, debug=False)
requirements.txt CHANGED
@@ -1,7 +1,7 @@
1
- gradio==4.26.0
2
- transformers==4.36.2
3
  torch==2.1.1
4
  torchaudio==2.1.1
5
- librosa==0.10.0
6
  soundfile==0.12.1
7
  numpy==1.24.3
 
1
+ gradio==4.44.1
2
+ transformers==4.40.0
3
  torch==2.1.1
4
  torchaudio==2.1.1
5
+ librosa==0.10.1
6
  soundfile==0.12.1
7
  numpy==1.24.3