Spaces:

SujanMidatani
/

speechToText

Sleeping

App Files Files Community

SujanMidatani commited on Jun 13, 2023

Commit

f808091

1 Parent(s): 9024b3e

update app.py

Browse files

Files changed (1) hide show

app.py +25 -63

app.py CHANGED Viewed

@@ -1,64 +1,26 @@
-import requests
-import time
-import json
-import gradio as gr
-secret_key = "6d74a4fac397423a8bd3011180b9b979"
-# retrieve transcription results for the task
-def get_results(config):
-  # endpoint to check status of the transcription task
-  endpoint = "https://api.speechtext.ai/results?"
-  # use a loop to check if the task is finished
-  while True:
-    results = requests.get(endpoint, params=config).json()
-    if "status" not in results:
-      break
-    # print("Task status: {}".format(results["status"]))
-    if results["status"] == 'failed':
-      print("The task is failed: {}".format(results))
-      break
-    if results["status"] == 'finished':
-      break
-    # sleep for 15 seconds if the task has the status - 'processing'
-    time.sleep(15)
-  return results
-# loads the audio into memory
-def  spt(audio_file):
-  with open(audio_file, mode="rb") as file:
-    post_body = file.read()
-  # endpoint to start a transcription task
-  endpoint = "https://api.speechtext.ai/recognize?"
-  header = {'Content-Type': "application/octet-stream"}
-  # transcription task options
-  config = {
-    "key" : secret_key,
-    "language" : "en-US",
-    "punctuation" : True,
-    "format" : "m4a"
-  }
-  # send an audio transcription request
-  r = requests.post(endpoint, headers = header, params = config, data = post_body).json()
-  # get the id of the speech recognition task
-  task = r["id"]
-  # print("Task ID: {}".format(task))
-  # get transcription results, summary, and highlights
-  config = {
-    "key" : secret_key,
-    "task" : task,
-    "summary" : True,
-    "summary_size" : 15,
-    "highlights" : True,
-    "max_keywords" : 10
-  }
-  transcription = get_results(config)
-  p=transcription['results']['transcript'].replace('<kw>','').replace('</kw>','')
-  return p
-k=gr.Interface(fn=spt, inputs=gr.Audio(source="microphone", type="filepath"), outputs="text")
 k.launch()

+import sounddevice as sd
+import speech_recognition as sr
+def takeCommand(audio):
+    r = sr.Recognizer()
+    with sr.AudioFile(
+        audio
+    ) as source:  # Replace "audio.wav" with the path to your .wav file
+        # print("Listening...")
+        audio_data = r.record(source)
+    try:
+        # print("Recognizing...")
+        query = r.recognize_google(audio_data, language="en-in")
+        print(f"User said: {query}")
+        return query
+    except sr.UnknownValueError:
+        print("Unable to recognize speech")
+    except sr.RequestError as e:
+        print(f"Error occurred: {e}")
+    return "Some error occurred. Sorry from Jarvis"
+k=gr.Interface(fn=takeCommand, inputs=gr.Audio(source="microphone", type="filepath"), outputs="text")
 k.launch()