Spaces:
Sleeping
Sleeping
Bouaziz-bad committed on
Commit ·
f46eab4
1
Parent(s): 8a6c8ee
Introduce modular transcription app: frontend + backend
Browse files- README.md +2 -1
- app.py +19 -29
- backend.py +31 -0
- requirements.txt +3 -0
README.md
CHANGED
|
@@ -11,7 +11,8 @@ tags:
|
|
| 11 |
- audio
|
| 12 |
- speech-to-text
|
| 13 |
- whisper
|
| 14 |
-
- transcription
|
| 15 |
models:
|
| 16 |
- openai/whisper-small
|
|
|
|
|
|
|
| 17 |
---
|
|
|
|
| 11 |
- audio
|
| 12 |
- speech-to-text
|
| 13 |
- whisper
|
|
|
|
| 14 |
models:
|
| 15 |
- openai/whisper-small
|
| 16 |
+
preload_from_hub:
|
| 17 |
+
- openai/whisper-small
|
| 18 |
---
|
app.py
CHANGED
|
@@ -1,43 +1,33 @@
|
|
|
|
|
| 1 |
import gradio as gr
|
| 2 |
-
import torch
|
| 3 |
-
from transformers import pipeline
|
| 4 |
|
| 5 |
-
#
|
| 6 |
-
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
chunk_length_s=30,
|
| 11 |
-
device=device
|
| 12 |
-
)
|
| 13 |
|
| 14 |
def transcribe_audio(audio_file):
|
| 15 |
-
|
| 16 |
-
Transcribe uploaded audio file.
|
| 17 |
-
Args:
|
| 18 |
-
audio_file (str): Path to the audio file
|
| 19 |
-
Returns:
|
| 20 |
-
str: Transcribed text
|
| 21 |
-
"""
|
| 22 |
-
if audio_file is None:
|
| 23 |
-
return "Please upload an audio file."
|
| 24 |
-
|
| 25 |
-
# Run transcription
|
| 26 |
-
result = transcriber(audio_file)
|
| 27 |
-
return result["text"]
|
| 28 |
|
| 29 |
-
# Define
|
| 30 |
demo = gr.Interface(
|
| 31 |
fn=transcribe_audio,
|
| 32 |
-
inputs=gr.Audio(
|
| 33 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 34 |
title="🎙️ Audio Transcription with Whisper",
|
| 35 |
-
description="Upload an audio file or record
|
| 36 |
examples=[
|
| 37 |
-
["example.wav"] # Optional:
|
| 38 |
],
|
|
|
|
| 39 |
allow_flagging="never"
|
| 40 |
)
|
| 41 |
|
| 42 |
# Launch the app
|
| 43 |
-
|
|
|
|
|
|
| 1 |
+
# app.py
|
| 2 |
import gradio as gr
|
|
|
|
|
|
|
| 3 |
|
| 4 |
+
# Import backend
|
| 5 |
+
from backend import AudioTranscriber
|
| 6 |
+
|
| 7 |
+
# Initialize the backend transcriber
|
| 8 |
+
transcriber = AudioTranscriber()
|
|
|
|
|
|
|
|
|
|
| 9 |
|
| 10 |
def transcribe_audio(audio_file):
|
| 11 |
+
return transcriber.transcribe(audio_file)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12 |
|
| 13 |
+
# Define Gradio Interface
|
| 14 |
demo = gr.Interface(
|
| 15 |
fn=transcribe_audio,
|
| 16 |
+
inputs=gr.Audio(
|
| 17 |
+
label="Upload or Record Audio",
|
| 18 |
+
sources=["upload", "microphone"],
|
| 19 |
+
type="filepath"
|
| 20 |
+
),
|
| 21 |
+
outputs=gr.Textbox(label="Transcription", lines=6, placeholder="Transcription will appear here..."),
|
| 22 |
title="🎙️ Audio Transcription with Whisper",
|
| 23 |
+
description="Upload an audio file or record your voice. The backend will transcribe it using Whisper.",
|
| 24 |
examples=[
|
| 25 |
+
["example.wav"] # Optional: include a sample file
|
| 26 |
],
|
| 27 |
+
cache_examples=False,
|
| 28 |
allow_flagging="never"
|
| 29 |
)
|
| 30 |
|
| 31 |
# Launch the app
|
| 32 |
+
if __name__ == "__main__":
|
| 33 |
+
demo.launch()
|
backend.py
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# backend.py
|
| 2 |
+
from transformers import pipeline
|
| 3 |
+
import torch
|
| 4 |
+
|
| 5 |
+
class AudioTranscriber:
|
| 6 |
+
def __init__(self, model_name="openai/whisper-small"):
|
| 7 |
+
self.device = 0 if torch.cuda.is_available() else -1
|
| 8 |
+
print(f"Loading model '{model_name}' on device: {'GPU' if self.device == 0 else 'CPU'}")
|
| 9 |
+
self.pipe = pipeline(
|
| 10 |
+
"automatic-speech-recognition",
|
| 11 |
+
model=model_name,
|
| 12 |
+
chunk_length_s=30,
|
| 13 |
+
device=self.device
|
| 14 |
+
)
|
| 15 |
+
|
| 16 |
+
def transcribe(self, audio_path):
|
| 17 |
+
"""
|
| 18 |
+
Transcribe an audio file.
|
| 19 |
+
Args:
|
| 20 |
+
audio_path (str): Path to the audio file
|
| 21 |
+
Returns:
|
| 22 |
+
str: Transcribed text
|
| 23 |
+
"""
|
| 24 |
+
if audio_path is None:
|
| 25 |
+
return "No audio file provided."
|
| 26 |
+
|
| 27 |
+
try:
|
| 28 |
+
result = self.pipe(audio_path)
|
| 29 |
+
return result.get("text", "").strip()
|
| 30 |
+
except Exception as e:
|
| 31 |
+
return f"Transcription error: {str(e)}"
|
requirements.txt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
torch==2.3.1
transformers==4.41.2
gradio==4.25.0