Spaces:

agnixcode
/

voice_chatbot

Sleeping

Dua Rajper committed on Mar 3, 2025

Commit

5cce8b9

verified ·

1 Parent(s): ae8b1c6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -82,7 +82,7 @@ if webrtc_ctx.audio_processor:
             speech, _ = sf.read("recorded_audio.wav")
             output = stt_pipe(speech)  # Transcribe with timestamps
-            # Display the full transcribed text
             st.write("Transcribed Text:", output['text'])
             # Display the text with timestamps (optional)
@@ -93,17 +93,30 @@ if webrtc_ctx.audio_processor:
             # Generate response using Groq API
             try:
                 chat_completion = groq_client.chat.completions.create(
                     messages=[{"role": "user", "content": output['text']}],
                     model="mixtral-8x7b-32768",
                     temperature=0.5,
                     max_tokens=1024
                 )
                 response = chat_completion.choices[0].message.content
                 st.write("Generated Response:", response)
                 # Convert response to speech
                 speech, *_ = tts_model(response, spembs=tts_model.spembs[0])  # Use the first speaker embedding
                 sf.write("response.wav", speech, 22050)
                 st.audio("response.wav")
             except Exception as e:

             speech, _ = sf.read("recorded_audio.wav")
             output = stt_pipe(speech)  # Transcribe with timestamps
+            # Debug: Print the transcribed text
             st.write("Transcribed Text:", output['text'])
             # Display the text with timestamps (optional)
             # Generate response using Groq API
             try:
+                # Debug: Print the input text
+                st.write("Input Text:", output['text'])
                 chat_completion = groq_client.chat.completions.create(
                     messages=[{"role": "user", "content": output['text']}],
                     model="mixtral-8x7b-32768",
                     temperature=0.5,
                     max_tokens=1024
                 )
+                # Debug: Print the API response
+                st.write("API Response:", chat_completion)
+                # Extract the generated response
                 response = chat_completion.choices[0].message.content
                 st.write("Generated Response:", response)
                 # Convert response to speech
                 speech, *_ = tts_model(response, spembs=tts_model.spembs[0])  # Use the first speaker embedding
+                # Debug: Print the TTS output
+                st.write("TTS Output:", speech)
+                # Save and play the speech
                 sf.write("response.wav", speech, 22050)
                 st.audio("response.wav")
             except Exception as e: