Spaces:

Anushkabhat9
/

DeepLearning

Sleeping

Anushkabhat9 committed on Sep 26, 2024

Commit

6892880

verified ·

1 Parent(s): 1082bf2

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,23 +1,34 @@
 import torch
 from transformers import pipeline
 from datasets import load_dataset
-device = "cuda:0" if torch.cuda.is_available() else "cpu"
-pipe = pipeline(
   "automatic-speech-recognition",
   model="openai/whisper-small",
   chunk_length_s=30,
-  device=device,
-)
-ds = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation")
-sample = ds[0]["audio"]
-prediction = pipe(sample.copy(), batch_size=8)["text"]
-# we can also return timestamps for the predictions
-prediction = pipe(sample.copy(), batch_size=8, return_timestamps=True)["chunks"]
-print(prediction[0]['text'])

+import gradio as gr
 import torch
 from transformers import pipeline
 from datasets import load_dataset
+# device = "cuda:0" if torch.cuda.is_available() else "cpu"
+# ds = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation")
+# sample = ds[0]["audio"]
+def transcribe_audio(sample):
+ """Transcribe an audio input with Whisper Small and return timestamped chunks.
+
+ Args:
+  sample: Audio input forwarded to the ASR pipeline, e.g. a file path
+   string (what ``gr.Audio(type="filepath")`` supplies) or a
+   dataset-style audio dict.
+
+ Returns:
+  The ``"chunks"`` entry of the pipeline result.
+ """
+ # NOTE(review): the pipeline is rebuilt on every call; consider building it
+ # once at module level if per-request latency matters.
+ pipe = pipeline(
   "automatic-speech-recognition",
   model="openai/whisper-small",
   chunk_length_s=30,
+ )
+ # A file path is a ``str`` and has no ``.copy()``; copy only inputs that
+ # support it so a caller-owned dict/array is not handed over directly.
+ audio = sample.copy() if hasattr(sample, "copy") else sample
+ # Index the result with ["text"] (and drop return_timestamps) for the plain
+ # transcription without timestamps.
+ prediction = pipe(audio, batch_size=8, return_timestamps=True)["chunks"]
+ return prediction
+# we can also return timestamps for the predictions
+# Build the web UI: one audio input wired to transcribe_audio, one text output.
+interface = gr.Interface(
+    fn=transcribe_audio,  # The function to be applied to the audio input
+    inputs=gr.Audio(type="filepath"),  # Audio component configured with type="filepath"
+    # NOTE(review): transcribe_audio returns the "chunks" value, not a plain
+    # string -- confirm it renders as intended in a text output.
+    outputs="text",  # The output is shown as text
+    title="Whisper Small ASR",  # Title of your app
+    description="Transcription using Whisper Small."  # Description of your app
+)
+# Start the Gradio app; this runs at module level whenever the file is executed.
+interface.launch()