Spaces:

prasanacodes
/

Indic-Translation-Toolkit

Running

prasanacodes committed on Aug 18, 2025

Commit

afada3a

verified ·

1 Parent(s): 15be79b

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -19,14 +19,6 @@ torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
 print(f"Using device: {device}")
-# Initialize the ASR pipeline from Hugging Face Transformers
-transcriber = pipeline(
-    "automatic-speech-recognition",
-    model="openai/whisper-large-v3-turbo",
-    torch_dtype=torch_dtype,
-    device=device,
-)
 # --- Transcription Function ---
 def extract_audio_from_video(video_path, output_audio_path="temp_extracted_audio.wav"):
     """
@@ -60,6 +52,16 @@ def transcribe_audio(audio_path):
     This function takes an audio file path, transcribes it using the Whisper model,
     and returns the transcribed text.
     """
     if audio_path is None:
         return "No audio file provided. Please upload or record an audio file."

 print(f"Using device: {device}")
 # --- Transcription Function ---
 def extract_audio_from_video(video_path, output_audio_path="temp_extracted_audio.wav"):
     """
     This function takes an audio file path, transcribes it using the Whisper model,
     and returns the transcribed text.
     """
+    # Initialize the ASR pipeline from Hugging Face Transformers
+    transcriber = pipeline(
+        "automatic-speech-recognition",
+        model="openai/whisper-large-v3-turbo",
+        torch_dtype=torch_dtype,
+        device=device,
+        language='en',
+    )
     if audio_path is None:
         return "No audio file provided. Please upload or record an audio file."