Spaces:

Teapack1
/

Assistant-Audio-Intent-Classification

Sleeping

Teapack1 committed on Nov 23, 2023

Commit

7662dae

1 Parent(s): c0fb8f9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,18 +4,23 @@ import numpy as np
 transcriber = pipeline("automatic-speech-recognition", model="openai/whisper-base.en")
-def transcribe(audio):
-    sr, y = audio
     y = y.astype(np.float32)
     y /= np.max(np.abs(y))
-    return transcriber({"sampling_rate": sr, "raw": y})["text"]
 demo = gr.Interface(
     transcribe,
-    gr.Audio(sources=["microphone"]),
-    "text",
 )
-demo.launch()

 transcriber = pipeline("automatic-speech-recognition", model="openai/whisper-base.en")
def transcribe(stream, new_chunk):
    """Append a microphone chunk to the running stream and transcribe it all.

    Args:
        stream: Audio accumulated by earlier calls as a 1-D float32 array,
            or ``None`` on the first call of a session.
        new_chunk: ``(sampling_rate, samples)`` pair for the newest chunk.

    Returns:
        ``(stream, text)``: the updated accumulated audio (fed back in as
        ``stream`` on the next call) and the transcription of that audio.
    """
    sr, y = new_chunk

    # Multi-channel input arrives as (samples, channels); the recogniser is
    # fed a single 1-D waveform, so average the channels down to mono.
    if y.ndim > 1:
        y = y.mean(axis=1)
    y = y.astype(np.float32)

    # Peak-normalise the chunk. An empty chunk has no maximum and a silent
    # one has a peak of 0; dividing in either case would raise or write NaNs
    # into the persistent stream, corrupting every later transcription.
    peak = np.max(np.abs(y)) if y.size else 0.0
    if peak > 0:
        y /= peak

    if stream is not None:
        stream = np.concatenate([stream, y])
    else:
        stream = y

    # The whole accumulated stream is re-transcribed on every call, so the
    # returned text always covers everything heard so far.
    return stream, transcriber({"sampling_rate": sr, "raw": stream})["text"]
 demo = gr.Interface(
     transcribe,
+    ["state", gr.Audio(sources=["microphone"], streaming=True)],
+    ["state", "text"],
+    live=True,
 )
+demo.launch()