Spaces:

dmcartor
/

ASR_Starter_Project

Sleeping

dmcartor committed on Jul 26, 2024

Commit

7dfdabd

verified ·

1 Parent(s): 72f0206

App.py update to add recording ability

Added the option to record audio as well as upload an audio file, and made some interface changes for improved interaction.

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,6 +9,11 @@ def transcribe(file):
     result = pipe(file)["text"]
     return result
 # Retain the ChatInterface setup from the existing app.py
 from huggingface_hub import InferenceClient
@@ -46,9 +51,19 @@ def respond(
         response += token
         yield response
-# Create two separate Gradio interfaces
-asr_interface = gr.Interface(fn=transcribe, inputs="file", outputs="text", title="ASR Transcription", description="Upload an audio file and get the transcription.")
 chat_interface = gr.ChatInterface(
     respond,
     additional_inputs=[
@@ -67,10 +82,12 @@ chat_interface = gr.ChatInterface(
 # Combine the two interfaces into a single Gradio Blocks application
 with gr.Blocks() as demo:
     gr.Markdown("# ASR and Chatbot Application")
     asr_interface.render()
     gr.Markdown("----")
     chat_interface.render()
 if __name__ == "__main__":
-    demo.launch()

     result = pipe(file)["text"]
     return result
+# Function to handle direct audio recording
+def record_and_transcribe(audio):
+    """Run the module-level `pipe` on `audio` and return the "text" field of its result.
+
+    NOTE(review): the interface wiring visible in this diff uses `fn=transcribe`,
+    so this function does not appear to be referenced — confirm against the full file.
+    """
+    result = pipe(audio)["text"]
+    return result
 # Retain the ChatInterface setup from the existing app.py
 from huggingface_hub import InferenceClient
         response += token
         yield response
+# Create the ASR interface with a label and functionality for both file upload and direct recording.
+# Gradio calls `fn` with one positional argument per input component, so the callback
+# must accept two values here; `transcribe` takes a single argument, so a small adapter
+# chooses which value to forward.
+# NOTE(review): `source="microphone"` is the Gradio 3.x spelling; Gradio 4+ expects
+# `sources=["microphone"]` — confirm against the installed Gradio version.
+asr_interface = gr.Interface(
+    # Prefer the microphone recording when one was made, otherwise use the uploaded file.
+    fn=lambda file, audio: transcribe(audio if audio is not None else file),
+    inputs=[
+        gr.File(label="Upload an audio file"),
+        gr.Audio(source="microphone", type="filepath", label="Record audio directly"),
+    ],
+    outputs="text",
+    title="ASR Transcription",
+    description="Upload an audio file or record audio directly and get the transcription.",
+)
+# Retain the ChatInterface setup from the existing app.py
 chat_interface = gr.ChatInterface(
     respond,
     additional_inputs=[
 # Combine the two interfaces into a single Gradio Blocks application
 with gr.Blocks() as demo:
+    gr.Markdown(" ")  # Spacer above the application heading
     gr.Markdown("# ASR and Chatbot Application")
+    gr.Markdown(" ")  # Spacer between the heading and the ASR interface
     asr_interface.render()
     gr.Markdown("----")  # Markdown horizontal rule between the ASR and chat sections
     chat_interface.render()
 if __name__ == "__main__":  # launch only when run as a script
+    demo.launch()