Spaces:

Subbu1304
/

voice_recognize

Runtime error

App Files Files Community

Subbu1304 committed on Feb 4, 2025

Commit

e5790ba

verified ·

1 Parent(s): 59b3579

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -33

app.py CHANGED Viewed

@@ -1,9 +1,6 @@
 import gradio as gr
 import speech_recognition as sr
 import pyttsx3
-import sounddevice as sd
-import numpy as np
-import io
 # Initialize the speech engine
 engine = pyttsx3.init()
@@ -13,38 +10,24 @@ def speak(text):
     engine.say(text)
     engine.runAndWait()
-# Function to listen to user voice input using sounddevice
 def listen():
     recognizer = sr.Recognizer()
-    # Set up sounddevice recording parameters
-    fs = 16000  # Sampling frequency
-    duration = 5  # seconds to record
-    speak("Listening for your input...")
-    # Record audio
-    recording = sd.rec(int(duration * fs), samplerate=fs, channels=1, dtype='int16')
-    sd.wait()
-    # Convert the recording to audio data for recognition
-    audio_data = np.array(recording, dtype=np.float32)
-    audio_data = io.BytesIO(audio_data)
-    # Use SpeechRecognition to process the audio
-    with sr.AudioData(audio_data, fs, 2) as source:
-        audio = recognizer.record(source)
-    print("Recognizing...")
-    try:
-        text = recognizer.recognize_google(audio)
-        print(f"Recognized text: {text}")
-        return text
-    except sr.UnknownValueError:
-        print("Sorry, I could not understand the audio.")
-        return None
-    except sr.RequestError:
-        print("Sorry, the speech recognition service is down.")
-        return None
 # Define the function for Gradio interface
 def voice_login():
@@ -69,3 +52,4 @@ iface = gr.Interface(fn=voice_login, inputs=[], outputs="text", live=True)
 # Launch the interface
 iface.launch()

 import gradio as gr
 import speech_recognition as sr
 import pyttsx3
 # Initialize the speech engine
 engine = pyttsx3.init()
     engine.say(text)
     engine.runAndWait()
+# Function to listen to user voice input using SpeechRecognition
 def listen():
     recognizer = sr.Recognizer()
+    with sr.Microphone() as source:
+        print("Listening for your input...")
+        recognizer.adjust_for_ambient_noise(source)
+        audio = recognizer.listen(source)
+        print("Recognizing...")
+        try:
+            text = recognizer.recognize_google(audio)
+            print(f"Recognized text: {text}")
+            return text
+        except sr.UnknownValueError:
+            print("Sorry, I could not understand the audio.")
+            return None
+        except sr.RequestError:
+            print("Sorry, the speech recognition service is down.")
+            return None
 # Define the function for Gradio interface
 def voice_login():
 # Launch the interface
 iface.launch()