Sulav committed on
Commit
befe725
·
1 Parent(s): 68c142d

replacing transformers pipeline with whisper python library

Browse files
Files changed (1) hide show
  1. app.py +29 -7
app.py CHANGED
@@ -1,14 +1,36 @@
 
1
  import gradio as gr
2
- from transformers import pipeline
3
 
4
- p = pipeline("automatic-speech-recognition", model='openai/whisper-small')
5
 
6
  def transcribe(audio):
7
- text = p(audio)["text"]
8
- return text
 
 
 
9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  gr.Interface(
 
11
  fn=transcribe,
12
- inputs=gr.Audio(source="microphone", type="filepath"),
13
- outputs="text").launch()
14
-
 
 
 
 
 
1
+ import whisper
2
  import gradio as gr
 
3
 
4
+ model = whisper.load_model("small")
5
 
6
def transcribe(audio):
    """Transcribe a recorded audio clip to text with the module-level Whisper model.

    Args:
        audio: filesystem path to the audio file (the Gradio microphone
            component is configured with type="filepath", so it passes a path).

    Returns:
        The decoded transcript as a string.
    """
    # load audio and pad/trim it to fit Whisper's 30-second context window
    waveform = whisper.load_audio(audio)
    waveform = whisper.pad_or_trim(waveform)

    # make log-Mel spectrogram and move to the same device as the model
    mel = whisper.log_mel_spectrogram(waveform).to(model.device)

    # detect the spoken language; probs maps language code -> probability
    _, probs = model.detect_language(mel)
    print(f"Detected language: {max(probs, key=probs.get)}")

    # decode the audio; fp16=False keeps decoding in fp32 (safe on CPU-only hosts)
    options = whisper.DecodingOptions(fp16=False)
    result = whisper.decode(model, mel, options)
    return result.text
24
+
25
+
26
+
27
# Build and launch the web UI. live=True re-runs transcription as audio is
# captured; the microphone input hands transcribe() a temporary filepath.
# NOTE: gr.Audio (not the deprecated gr.inputs.Audio namespace, removed in
# gradio 3.x) — matches the component class this file's previous revision used.
gr.Interface(
    title='OpenAI Whisper ASR Gradio Web UI',
    fn=transcribe,
    inputs=[
        gr.Audio(source="microphone", type="filepath"),
    ],
    outputs=[
        "textbox",
    ],
    live=True,
).launch()