Spaces:

tbaig1605
/

language_converter

Sleeping

tbaig1605 committed on May 8, 2025

Commit

e936b80

verified ·

1 Parent(s): 3ddc6a4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,29 +1,37 @@
 import streamlit as st
 from transformers import pipeline
-# Load Whisper model (you can choose base, large, etc.)
-whisper = pipeline("automatic-speech-recognition", model="openai/whisper-base")
-# Streamlit app layout
-st.title("Audio Transcription with Whisper")
-st.write("Upload an audio file and let the model transcribe it into text.")
-# Upload audio file
-audio_file = st.file_uploader("Upload an audio file", type=["mp3", "wav", "flac", "opus", "m4a"])
-if audio_file is not None:
-    # Save the uploaded audio file
-    with open("uploaded_audio.wav", "wb") as f:
-        f.write(audio_file.getbuffer())
-    # Display the audio file name
-    st.audio(audio_file, format="audio/wav")
-    # Run transcription
     st.write("Transcribing...")
-    result = whisper("uploaded_audio.wav")["text"]
-    # Show the transcription result
-    st.subheader("Transcription:")
-    st.write(result)

 import streamlit as st
 from transformers import pipeline
+import torchaudio
+import os
+import ffmpeg
+# Step 1: Upload and convert audio to WAV format
+st.title("Audio Transcription with Whisper (Small Model)")
+uploaded_file = st.file_uploader("Upload an audio file", type=["mp3", "wav", "ogg", "opus"])
+if uploaded_file is not None:
+    # Save the uploaded file
+    audio_path = os.path.join("uploads", uploaded_file.name)
+    with open(audio_path, "wb") as f:
+        f.write(uploaded_file.getbuffer())
+    st.audio(audio_path, format="audio/ogg")
+    # Convert to WAV format using ffmpeg if it's not WAV already
+    wav_path = audio_path.replace(os.path.splitext(audio_path)[-1], ".wav")
+    if not audio_path.endswith(".wav"):
+        ffmpeg.input(audio_path).output(wav_path).run()
+    st.success("Audio converted to WAV format")
+    # Step 2: Load Whisper small model for transcription
+    whisper = pipeline("automatic-speech-recognition", model="openai/whisper-small")
+    # Step 3: Transcribe the audio
     st.write("Transcribing...")
+    transcription = whisper(wav_path)
+    st.write("Transcription result: ", transcription['text'])
+else:
+    st.info("Please upload an audio file to transcribe.")