Spaces:

dschandra
/

AIVoice

Sleeping

dschandra committed on Dec 28, 2024

Commit

497eb2a

verified ·

1 Parent(s): 83a6bbe

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,7 +15,7 @@ conversational_pipeline = pipeline("text-generation", model="microsoft/DialoGPT-
 def speech_to_text(audio_file):
     """Convert speech in audio file to text using Wav2Vec2"""
-    audio_input, _ = librosa.load(audio_file, sr=16000)
     input_values = processor(audio_input, return_tensors="pt").input_values
     # Perform speech-to-text
@@ -53,12 +53,12 @@ def process_audio(audio_file):
 # Create Gradio interface for audio input/output
 iface = gr.Interface(
     fn=process_audio,
-    inputs=gr.Audio(type="filepath"),  # Updated for Gradio v3.x (type="filepath" for audio input)
-    outputs=[gr.Textbox(), gr.Audio(type="filepath")],  # Updated for Gradio v3.x (type="filepath" for audio output)
     live=True,
     title="Voice Bot with Wav2Vec2.0",
-    description="Speak to the bot and get a response!"
 )
 # Launch the interface
-iface.launch()

 def speech_to_text(audio_file):
     """Convert speech in audio file to text using Wav2Vec2"""
+    audio_input, _ = librosa.load(audio_file, sr=16000)  # Load the audio
     input_values = processor(audio_input, return_tensors="pt").input_values
     # Perform speech-to-text
 # Create Gradio interface for audio input/output
 iface = gr.Interface(
     fn=process_audio,
+    inputs=gr.Audio(source="microphone", type="filepath"),  # Corrected for real-time audio input
+    outputs=[gr.Textbox(), gr.Audio(type="filepath")],  # Corrected for real-time audio output
     live=True,
     title="Voice Bot with Wav2Vec2.0",
+    description="Speak to the bot and get a response instantly! This bot listens and responds like Google Assistant/Siri."
 )
 # Launch the interface
+iface.launch(share=True)