Spaces:

Umar4321
/

Pashto-Translator

Sleeping

App Files Files Community

Umar4321 committed on Aug 25, 2025

Commit

02cc100

verified ·

1 Parent(s): 80283da

Update app.py

Browse files

Files changed (1) hide show

app.py +66 -32

app.py CHANGED Viewed

@@ -4,13 +4,27 @@ from transformers import pipeline
 from gtts import gTTS
 import tempfile
 import os
 # ------------------------------
-# Setup models
 # ------------------------------
-stt_model = pipeline("automatic-speech-recognition", model="openai/whisper-small")  # Pashto supported
-translator_en = pipeline("translation", model="Helsinki-NLP/opus-mt-ps-en")  # Pashto → English
-translator_ur = pipeline("translation", model="Helsinki-NLP/opus-mt-ps-ur")  # Pashto → Urdu
 # ------------------------------
 # Streamlit UI
@@ -29,33 +43,53 @@ wav_audio_data = st_audiorec()
 if wav_audio_data is not None:
     st.audio(wav_audio_data, format="audio/wav")
-    # ------------------------------
-    # Step 1: Speech to Text (Pashto)
-    # ------------------------------
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_wav:
         temp_wav.write(wav_audio_data)
-        temp_wav.flush()
-        pashto_text = stt_model(temp_wav.name)["text"]
-    st.subheader("Pashto transcription:")
-    st.info(pashto_text)
-    # ------------------------------
-    # Step 2: Translation
-    # ------------------------------
-    if target_lang == "English":
-        translated = translator_en(pashto_text)[0]["translation_text"]
-    else:
-        translated = translator_ur(pashto_text)[0]["translation_text"]
-    st.subheader(f"Translated ({target_lang}):")
-    st.success(translated)
-    # ------------------------------
-    # Step 3: Text-to-Speech
-    # ------------------------------
-    tts = gTTS(text=translated, lang="en" if target_lang == "English" else "ur")
-    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as temp_mp3:
-        tts.save(temp_mp3.name)
-        st.audio(temp_mp3.name, format="audio/mp3")

 from gtts import gTTS
 import tempfile
 import os
+import time
 # ------------------------------
+# Setup models with progress indicators
 # ------------------------------
+@st.cache_resource
+def load_models():
+    with st.spinner("Loading speech-to-text model..."):
+        stt_model = pipeline("automatic-speech-recognition", model="openai/whisper-small")
+    with st.spinner("Loading translation models..."):
+        translator_en = pipeline("translation", model="Helsinki-NLP/opus-mt-ps-en")
+        translator_ur = pipeline("translation", model="Helsinki-NLP/opus-mt-ps-ur")
+    return stt_model, translator_en, translator_ur
+try:
+    stt_model, translator_en, translator_ur = load_models()
+except Exception as e:
+    st.error(f"Error loading models: {str(e)}")
+    st.stop()
 # ------------------------------
 # Streamlit UI
 if wav_audio_data is not None:
     st.audio(wav_audio_data, format="audio/wav")
+    # Save audio to a temporary file with proper handling
     with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_wav:
         temp_wav.write(wav_audio_data)
+        temp_filename = temp_wav.name
+    try:
+        # ------------------------------
+        # Step 1: Speech to Text (Pashto)
+        # ------------------------------
+        with st.spinner("Transcribing speech..."):
+            pashto_text = stt_model(temp_filename)["text"]
+        # Clean up temporary file
+        os.unlink(temp_filename)
+        st.subheader("Pashto transcription:")
+        st.info(pashto_text)
+        # ------------------------------
+        # Step 2: Translation
+        # ------------------------------
+        with st.spinner("Translating..."):
+            if target_lang == "English":
+                translated = translator_en(pashto_text)[0]["translation_text"]
+            else:
+                translated = translator_ur(pashto_text)[0]["translation_text"]
+        st.subheader(f"Translated ({target_lang}):")
+        st.success(translated)
+        # ------------------------------
+        # Step 3: Text-to-Speech
+        # ------------------------------
+        with st.spinner("Generating audio..."):
+            tts = gTTS(text=translated, lang="en" if target_lang == "English" else "ur")
+            # Use BytesIO to avoid file handling issues
+            from io import BytesIO
+            audio_bytes = BytesIO()
+            tts.write_to_fp(audio_bytes)
+            audio_bytes.seek(0)
+            st.audio(audio_bytes, format="audio/mp3")
+    except Exception as e:
+        st.error(f"An error occurred: {str(e)}")
+        # Ensure temporary file is cleaned up even if error occurs
+        if os.path.exists(temp_filename):
+            os.unlink(temp_filename)