Spaces:

Subbu1304
/

voice_recognize

Runtime error

Subbu1304 committed on Feb 4, 2025

Commit

59b3579

verified ·

1 Parent(s): 8be53af

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,6 +1,9 @@
 import gradio as gr
 import speech_recognition as sr
 import pyttsx3
 # Initialize the speech engine
 engine = pyttsx3.init()
@@ -10,26 +13,38 @@ def speak(text):
     engine.say(text)
     engine.runAndWait()
-# Function to listen to user voice input
 def listen():
     recognizer = sr.Recognizer()
-    microphone = sr.Microphone()
-    with microphone as source:
-        print("Listening for your input...")
-        recognizer.adjust_for_ambient_noise(source)
-        audio = recognizer.listen(source)
-        print("Recognizing...")
-        try:
-            text = recognizer.recognize_google(audio)
-            print(f"Recognized text: {text}")
-            return text
-        except sr.UnknownValueError:
-            print("Sorry, I could not understand the audio.")
-            return None
-        except sr.RequestError:
-            print("Sorry, the speech recognition service is down.")
-            return None
 # Define the function for Gradio interface
 def voice_login():

 import gradio as gr
 import speech_recognition as sr
 import pyttsx3
+import sounddevice as sd
+import numpy as np
+import io
 # Initialize the speech engine
 engine = pyttsx3.init()
     engine.say(text)
     engine.runAndWait()
+# Function to listen to user voice input using sounddevice
 def listen():
     recognizer = sr.Recognizer()
+    # Set up sounddevice recording parameters
+    fs = 16000  # Sampling frequency
+    duration = 5  # seconds to record
+    speak("Listening for your input...")
+    # Record audio
+    recording = sd.rec(int(duration * fs), samplerate=fs, channels=1, dtype='int16')
+    sd.wait()
+    # Convert the recording to audio data for recognition
+    audio_data = np.array(recording, dtype=np.float32)
+    audio_data = io.BytesIO(audio_data)
+    # Use SpeechRecognition to process the audio
+    with sr.AudioData(audio_data, fs, 2) as source:
+        audio = recognizer.record(source)
+    print("Recognizing...")
+    try:
+        text = recognizer.recognize_google(audio)
+        print(f"Recognized text: {text}")
+        return text
+    except sr.UnknownValueError:
+        print("Sorry, I could not understand the audio.")
+        return None
+    except sr.RequestError:
+        print("Sorry, the speech recognition service is down.")
+        return None
 # Define the function for Gradio interface
 def voice_login():