Spaces:

Udyan
/

Voice-Assistant

Sleeping

Udyan committed on Mar 13

Commit

f2fca2e

verified ·

1 Parent(s): 7e4b494

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,21 +1,19 @@
 import gradio as gr
 from transformers import pipeline
-import soundfile as sf
-import numpy as np
-# Speech-to-text model
 stt = pipeline(
     "automatic-speech-recognition",
     model="openai/whisper-base"
 )
-# Language model
 llm = pipeline(
-    "text2text-generation",
-    model="google/flan-t5-base"
 )
-# Text-to-speech model
 tts = pipeline(
     "text-to-speech",
     model="facebook/fastspeech2-en-ljspeech"
@@ -24,16 +22,16 @@ tts = pipeline(
 def voice_assistant(audio):
-    # Convert speech → text
     speech_text = stt(audio)["text"]
-    # Generate AI response
     response = llm(
         speech_text,
         max_new_tokens=80
     )[0]["generated_text"]
-    # Convert text → speech
     speech_output = tts(response)
     audio_array = speech_output["audio"]

 import gradio as gr
 from transformers import pipeline
+# Speech → Text
 stt = pipeline(
     "automatic-speech-recognition",
     model="openai/whisper-base"
 )
+# LLM
 llm = pipeline(
+    "text-generation",
+    model="distilgpt2"
 )
+# Text → Speech
 tts = pipeline(
     "text-to-speech",
     model="facebook/fastspeech2-en-ljspeech"
 def voice_assistant(audio):
+    # speech to text
     speech_text = stt(audio)["text"]
+    # AI response
     response = llm(
         speech_text,
         max_new_tokens=80
     )[0]["generated_text"]
+    # text to speech
     speech_output = tts(response)
     audio_array = speech_output["audio"]