geethareddy committed on
Commit
575b90c
·
verified ·
1 Parent(s): 974001b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +67 -35
app.py CHANGED
@@ -1,40 +1,72 @@
1
- from flask import Flask, request, jsonify
2
- from transformers import pipeline
 
3
  import os
4
 
5
- app = Flask(__name__)
 
6
 
7
- # Load ASR model
8
- asr_pipeline = pipeline("automatic-speech-recognition", model="openai/whisper-small")
9
-
10
- # Store user details
11
  user_data = {"name": "", "email": ""}
12
 
13
- @app.route("/voice_input", methods=["POST"])
14
- def voice_input():
15
- if "audio" not in request.files:
16
- return jsonify({"error": "No audio file received"}), 400
17
-
18
- file = request.files["audio"]
19
- file_path = "temp.wav"
20
- file.save(file_path)
21
-
22
- try:
23
- # Convert Speech to Text
24
- text = asr_pipeline(file_path)["text"]
25
-
26
- # Store name or email based on input
27
- if user_data["name"] == "":
28
- user_data["name"] = text
29
- return jsonify({"message": f"Name recorded: {text}"})
30
- elif user_data["email"] == "":
31
- user_data["email"] = text
32
- return jsonify({"message": f"Email recorded: {text}"})
33
-
34
- return jsonify({"message": "All details recorded", "data": user_data})
35
-
36
- except Exception as e:
37
- return jsonify({"error": str(e)}), 500
38
-
39
- if __name__ == "__main__":
40
- app.run(debug=True, host="0.0.0.0", port=5000)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import whisper
3
+ import time
4
  import os
5
 
6
+ # Load Whisper ASR Model
7
+ model = whisper.load_model("base")
8
 
9
+ # Store User Data
 
 
 
10
  user_data = {"name": "", "email": ""}
11
 
12
+ # Function to Play Welcome Message
13
+ def welcome_message():
14
+ return "Welcome to Biryani Hub. Tell me your name."
15
+
16
+ # Function to Capture Name
17
+ def capture_name(audio):
18
+ global user_data
19
+ if audio is None:
20
+ return "No audio detected. Please try again."
21
+
22
+ # Save the audio
23
+ audio_path = "name.wav"
24
+ audio.export(audio_path, format="wav")
25
+
26
+ # Convert Speech to Text
27
+ result = model.transcribe(audio_path)
28
+ user_data["name"] = result["text"]
29
+
30
+ return f"Hello, {user_data['name']}! Please provide your email address."
31
+
32
+ # Function to Capture Email
33
+ def capture_email(audio):
34
+ global user_data
35
+ if audio is None:
36
+ return "No audio detected. Please try again."
37
+
38
+ # Save the audio
39
+ audio_path = "email.wav"
40
+ audio.export(audio_path, format="wav")
41
+
42
+ # Convert Speech to Text
43
+ result = model.transcribe(audio_path)
44
+ user_data["email"] = result["text"]
45
+
46
+ return f"Thank you, {user_data['name']}! We have saved your email: {user_data['email']}."
47
+
48
+ # Create Gradio UI
49
+ with gr.Blocks() as demo:
50
+ gr.Markdown("# 🎙️ Voice-Enabled Restaurant Menu - Biryani Hub")
51
+
52
+ # Welcome Message
53
+ welcome = gr.Textbox(value=welcome_message(), interactive=False)
54
+
55
+ # Step 1: Capture Name
56
+ gr.Markdown("### 🗣️ Step 1: Say Your Name")
57
+ name_input = gr.Audio(source="microphone", type="file")
58
+ name_output = gr.Textbox()
59
+ name_button = gr.Button("Submit Name")
60
+
61
+ # Step 2: Capture Email
62
+ gr.Markdown("### 📧 Step 2: Say Your Email")
63
+ email_input = gr.Audio(source="microphone", type="file")
64
+ email_output = gr.Textbox()
65
+ email_button = gr.Button("Submit Email")
66
+
67
+ # Capture Name and Email
68
+ name_button.click(capture_name, inputs=name_input, outputs=name_output)
69
+ email_button.click(capture_email, inputs=email_input, outputs=email_output)
70
+
71
+ # Launch the App
72
+ demo.launch()