Spaces:

SujanMidatani
/

speechToText

Running

App Files Files Community

SujanMidatani commited on Jun 13, 2023

Commit

8c8ff11

1 Parent(s): a5acade

update app.py

Browse files

Files changed (1) hide show

app.py +64 -0

app.py CHANGED Viewed

	@@ -0,0 +1,64 @@

+import requests
+import time
+import json
+import gradio as gr
+secret_key = "6d74a4fac397423a8bd3011180b9b979"
+# retrieve transcription results for the task
+def get_results(config):
+  # endpoint to check status of the transcription task
+  endpoint = "https://api.speechtext.ai/results?"
+  # use a loop to check if the task is finished
+  while True:
+    results = requests.get(endpoint, params=config).json()
+    if "status" not in results:
+      break
+    # print("Task status: {}".format(results["status"]))
+    if results["status"] == 'failed':
+      print("The task is failed: {}".format(results))
+      break
+    if results["status"] == 'finished':
+      break
+    # sleep for 15 seconds if the task has the status - 'processing'
+    time.sleep(15)
+  return results
+# loads the audio into memory
+def  spt(audio_file):
+  with open(audio_file, mode="rb") as file:
+    post_body = file.read()
+  # endpoint to start a transcription task
+  endpoint = "https://api.speechtext.ai/recognize?"
+  header = {'Content-Type': "application/octet-stream"}
+  # transcription task options
+  config = {
+    "key" : secret_key,
+    "language" : "en-US",
+    "punctuation" : True,
+    "format" : "m4a"
+  }
+  # send an audio transcription request
+  r = requests.post(endpoint, headers = header, params = config, data = post_body).json()
+  # get the id of the speech recognition task
+  task = r["id"]
+  # print("Task ID: {}".format(task))
+  # get transcription results, summary, and highlights
+  config = {
+    "key" : secret_key,
+    "task" : task,
+    "summary" : True,
+    "summary_size" : 15,
+    "highlights" : True,
+    "max_keywords" : 10
+  }
+  transcription = get_results(config)
+  p=transcription['results']['transcript'].replace('<kw>','').replace('</kw>','')
+  return p
+k=gr.Interface(fn=spt, inputs=gr.Audio(source="microphone", type="filepath"), outputs="text")
+k.launch()