Spaces:

Oluko
/

yoruba-practice

Sleeping

App Files Files Community

Olaolu Olugbenle committed on Dec 15, 2025

Commit

909d8d8

1 Parent(s): 6640d8a

removed tts elems in gradio

Browse files

Files changed (1) hide show

app.py +52 -52

app.py CHANGED Viewed

@@ -193,7 +193,7 @@ def transcribe_and_translate(file_path, mode: str):
 #     sr = audio.frame_rate
 #     samples = np.array(audio.get_array_of_samples())
-#     #TODO: WHAT DOES THIS DO AND WHY?
 #     if audio.channels > 1:
 #         samples = samples.reshape((-1, audio.channels))
 #     # normalize integer samples -> float32 in [-1, 1]
@@ -310,62 +310,59 @@ with gr.Blocks(title="Olùkọ́ | Learn Yoruba") as app:
     gr.Markdown("# 🇳🇬 Olùkọ́")
     gr.Markdown("Comprehensive Yoruba learning tool!")
-    with gr.Row():
-        # direction selector
-        mode = gr.Radio(
-            choices=["Yoruba → English", "English → Yoruba"],
-            value="Yoruba → English",
-            label="Direction"
-        )
-    # single editable textbox + microphone next to it
-    with gr.Row():
-        #User input textbox
-        output_transcription = gr.Textbox(
-            label="✍️ Speak/Type...",
-            interactive=True,
-            placeholder="Type here or press the mic to speak..."
-        )
-        # User input microphone
-        mic_recorder = gr.Audio(
-            sources="microphone",
-            type="filepath",
-            label="🎙️",
-            show_label=True
-        )
     #Store translation textbox + TTS model in same row
     with gr.Row():
         #Translation textbox
         output_translation = gr.Textbox(label="💬 Translation")
-        #Button for TTS
-        tts_button = gr.Button("Play TTS")
-        #Audio for TTS playback
-        tts_audio = gr.Audio(label="TTS Playback", type="numpy", interactive=False)
-    def _on_tts_click(text, direction):
-        """Generate TTS from the translation textbox (no disk write)
-        and return (sr, samples)."""
-        if not text:
-            return None
-        # select language/voice mapping as needed
-        if direction == "English → Yoruba":
-            lang = "yo"
-            voice = "Femi"
-        else:
-            lang = "en"
-            voice = "Mary"
-        try:
-            result = synthesize_tts_to_array(text, language=lang, voice=voice)
-            return result  # (sr, numpy_array) or None
-        except Exception as e:
-            print("TTS generation failed:", e)
-            return None
     # when the mic finishes: transcribe + translate and populate both boxes
     mic_recorder.change(
@@ -381,13 +378,13 @@ with gr.Blocks(title="Olùkọ́ | Learn Yoruba") as app:
         outputs=output_translation,
     )
-    #If the TTS_Button is pushed, call the _on_tts_click function
     #Send the output audio (sr, numpy_array) to the tts_audio block
-    tts_button.click(
-        _on_tts_click,
-        inputs=[output_translation, mode],
-        outputs=tts_audio
-    )
 # ===========================
 #  APP LAUNCH
@@ -396,3 +393,6 @@ with gr.Blocks(title="Olùkọ́ | Learn Yoruba") as app:
 if __name__ == "__main__":
     app.launch() #server_name="0.0.0.0", server_port=7860)

 #     sr = audio.frame_rate
 #     samples = np.array(audio.get_array_of_samples())
+#     #TODO
 #     if audio.channels > 1:
 #         samples = samples.reshape((-1, audio.channels))
 #     # normalize integer samples -> float32 in [-1, 1]
     gr.Markdown("# 🇳🇬 Olùkọ́")
     gr.Markdown("Comprehensive Yoruba learning tool!")
+    # direction selector
+    mode = gr.Radio(
+        choices=["Yoruba → English", "English → Yoruba"],
+        value="Yoruba → English",
+        label="Direction"
+    )
+    # User input microphone
+    mic_recorder = gr.Audio(
+        type="filepath",
+        label="🎙️",
+        show_label=True
+    )
+    # single editable textbox + microphone next to it
+    #User input textbox
+    output_transcription = gr.Textbox(
+        label="✍️ Speak/Type...",
+        interactive=True
+    )
     #Store translation textbox + TTS model in same row
     with gr.Row():
         #Translation textbox
         output_translation = gr.Textbox(label="💬 Translation")
+        #Button for TTS. TODO
+        # tts_button = gr.Button("Play TTS")
+        #Audio for TTS playback. TODO
+        # tts_audio = gr.Audio(label="TTS Playback", type="numpy", interactive=False)
+    #TODO
+    # def _on_tts_click(text, direction):
+    #     """Generate TTS from the translation textbox (no disk write)
+    #     and return (sr, samples)."""
+    #     if not text:
+    #         return None
+    #     # select language/voice mapping as needed
+    #     if direction == "English → Yoruba":
+    #         lang = "yo"
+    #         voice = "Femi"
+    #     else:
+    #         lang = "en"
+    #         voice = "Mary"
+    #     try:
+    #         result = synthesize_tts_to_array(text, language=lang, voice=voice)
+    #         return result  # (sr, numpy_array) or None
+    #     except Exception as e:
+    #         print("TTS generation failed:", e)
+    #         return None
     # when the mic finishes: transcribe + translate and populate both boxes
     mic_recorder.change(
         outputs=output_translation,
     )
+    #TODO If the TTS_Button is pushed, call the _on_tts_click function
     #Send the output audio (sr, numpy_array) to the tts_audio block
+    # tts_button.click(
+    #     _on_tts_click,
+    #     inputs=[output_translation, mode],
+    #     outputs=tts_audio
+    # )
 # ===========================
 #  APP LAUNCH
 if __name__ == "__main__":
     app.launch() #server_name="0.0.0.0", server_port=7860)