Spaces:

geethareddy
/

voice1

Sleeping

App Files Files Community

geethareddy committed on Jan 16, 2025

Commit

c44e6ef

verified ·

1 Parent(s): 1812cce

Update app.py

Browse files

Files changed (1) hide show

app.py +188 -264

app.py CHANGED Viewed

@@ -1,200 +1,31 @@
-import os
-import speech_recognition as sr
-import logging
 from flask import Flask, render_template_string, request, jsonify
 from tempfile import NamedTemporaryFile
 import ffmpeg
-from fuzzywuzzy import process, fuzz
-# Initialize Flask app
 app = Flask(__name__)
 logging.basicConfig(level=logging.INFO)
 # Global variables
-cart = []  # Stores items as [item_name, price, quantity] in the cart
-menu_preferences = None  # Tracks the current menu preference
-section_preferences = None  # Tracks the current section preference
-default_sections = {
-    "biryanis": ["veg biryani", "paneer biryani", "chicken biryani", "mutton biryani"],
-    "starters": ["samosa", "onion pakoda", "chilli gobi", "chicken manchurian", "veg manchurian"],
-    "curries": ["paneer butter", "chicken curry", "fish curry", "chilli chicken"],
-    "desserts": ["gulab jamun", "ice cream"],
-    "soft drinks": ["cola", "lemon soda"]
 }
-prices = {
-    "samosa": 9,
-    "onion pakoda": 10,
-    "chilli gobi": 12,
-    "chicken biryani": 14,
-    "mutton biryani": 16,
-    "veg biryani": 12,
-    "paneer butter": 10,
-    "fish curry": 12,
-    "chicken manchurian": 14,
-    "veg manchurian": 12,
-    "chilli chicken": 14,
-    "paneer biryani": 13,
-    "chicken curry": 14,
-    "gulab jamun": 8,
-    "ice cream": 6,
-    "cola": 5,
-    "lemon soda": 6
-}
-@app.route("/")
-def index():
-    return render_template_string(html_code)
-@app.route("/reset-cart", methods=["GET"])
-def reset_cart():
-    global cart, menu_preferences, section_preferences
-    cart = []
-    menu_preferences = None
-    section_preferences = None
-    return "Cart reset successfully."
-@app.route("/process-audio", methods=["POST"])
-def process_audio():
-    try:
-        # Handle audio input
-        audio_file = request.files.get("audio")
-        if not audio_file:
-            return jsonify({"response": "Oops! I didn't catch any audio. Please try again."}), 400
-        # Save and convert audio to WAV format
-        temp_file = NamedTemporaryFile(delete=False, suffix=".webm")
-        audio_file.save(temp_file.name)
-        converted_file = NamedTemporaryFile(delete=False, suffix=".wav")
-        ffmpeg.input(temp_file.name).output(
-            converted_file.name, acodec="pcm_s16le", ac=1, ar="16000"
-        ).run(overwrite_output=True)
-        # Recognize speech
-        recognizer = sr.Recognizer()
-        recognizer.dynamic_energy_threshold = True
-        recognizer.energy_threshold = 4000  # Increased sensitivity
-        with sr.AudioFile(converted_file.name) as source:
-            recognizer.adjust_for_ambient_noise(source, duration=1)
-            audio_data = recognizer.record(source)
-        # Try using the Google API for speech recognition
-        try:
-            raw_command = recognizer.recognize_google(audio_data).lower()
-        except sr.UnknownValueError:
-            raw_command = "Sorry, I couldn't understand that."
-        except sr.RequestError as e:
-            raw_command = f"Request error from the service: {e}"
-        logging.info(f"User said: {raw_command}")  # Print user speech in the console
-        # Display the transcribed text and AI voice response
-        response = process_command(raw_command)
-    except Exception as e:
-        response = f"An error occurred: {str(e)}"
-    finally:
-        os.unlink(temp_file.name)
-        os.unlink(converted_file.name)
-    return jsonify({"response": response})
-def preprocess_command(command):
-    """
-    Normalize the user command to improve matching.
-    """
-    command = command.strip().lower()
-    return command
-def process_command(command):
-    global cart, menu_preferences, section_preferences
-    # Finalize order
-    if "final order" in command or "complete order" in command:
-        if not cart:
-            return "Your cart is empty. Please add items before finalizing the order."
-        order_summary = "\n".join([f"{item[2]} x {item[0]} for {item[1] * item[2]} INR" for item in cart])
-        total_price = sum(item[1] * item[2] for item in cart)
-        cart.clear()  # Clear the cart after finalizing
-        menu_preferences = None
-        section_preferences = None
-        return f"Your order has been placed successfully:\n{order_summary}\nTotal: {total_price} INR.\nThank you for ordering!"
-    # Greet the user and ask for preferences when first started
-    if menu_preferences is None:
-        if "hello" in command or "hi" in command:
-            return "Hello, welcome to Biryani Hub! We have the following categories: Biryanis, Starters, Curries, Desserts, Soft Drinks. Please choose a category."
-        preferences = ["non-vegetarian", "vegetarian", "all"]
-        if command in preferences:
-            menu_preferences = command
-            return f"You've selected the {command} menu! Which section would you like to browse next? (e.g., biryanis, starters, curries, desserts, soft drinks)"
-        # Use fuzzy matching to help recognize similar inputs
-        closest_match = process.extractOne(command, preferences, scorer=fuzz.partial_ratio)
-        if closest_match and closest_match[1] > 75:
-            menu_preferences = closest_match[0]
-            return f"Great choice! You've chosen the {menu_preferences} menu. Which section would you like to browse next?"
-        return "I couldn't recognize your choice. Please say either 'Non-Vegetarian', 'Vegetarian', or 'All'."
-    # Handle section preferences and list items
-    if section_preferences is None:
-        sections = list(default_sections.keys())
-        for section in sections:
-            if section in command:
-                section_preferences = section
-                items_text = ', '.join(default_sections[section_preferences])
-                response_text = f"Here are the items in the {section_preferences} section: {items_text}. Please choose an item."
-                # Speak the response
-                return response_text
-        closest_match = process.extractOne(command, sections, scorer=fuzz.partial_ratio)
-        if closest_match and closest_match[1] > 75:
-            section_preferences = closest_match[0]
-            items_text = ', '.join(default_sections[section_preferences])
-            return f"Here are the items in the {section_preferences} section: {items_text}. What would you like to add?"
-        return "I didn't catch that. Please say a section like 'biryanis', 'starters', 'curries', 'desserts', or 'soft drinks'."
-    # Filter items based on the menu preference (vegetarian/non-vegetarian)
-    available_items = []
-    if menu_preferences == "vegetarian":
-        available_items = [item for item in default_sections[section_preferences] if item in menus["vegetarian"]]
-    elif menu_preferences == "non-vegetarian":
-        available_items = [item for item in default_sections[section_preferences] if item in menus["non-vegetarian"]]
-    elif menu_preferences == "all":
-        available_items = [item for item in default_sections[section_preferences]]
-    for item in available_items:
-        if item in command:
-            quantity = extract_quantity(command)
-            if quantity:
-                cart.append([item, prices[item], quantity])
-                return f"Added {quantity} x {item} to your cart. Your current cart: {', '.join([f'{i[0]} x{i[2]}' for i in cart])}. Would you like to add more items?"
-    return "I didn't recognize the item you mentioned. Please say the item name clearly, or choose from the available items."
-def extract_quantity(command):
-    """
-    Extract quantity from the command (e.g., 'two', '3', '5').
-    """
-    number_words = {
-        "one": 1, "two": 2, "three": 3, "four": 4, "five": 5,
-        "six": 6, "seven": 7, "eight": 8, "nine": 9, "ten": 10,
-        "1": 1, "2": 2, "3": 3, "4": 4, "5": 5, "6": 6, "7": 7, "8": 8, "9": 9, "10": 10
-    }
-    command_words = command.split()
-    for word in command_words:
-        if word in number_words:
-            return number_words[word]
-    return None
 html_code = """
 <!DOCTYPE html>
 <html lang="en">
@@ -204,43 +35,25 @@ html_code = """
     <title>AI Dining Assistant</title>
     <style>
         body {
-            display: flex;
-            flex-direction: column;
-            align-items: center;
-            justify-content: center;
-            min-height: 100vh;
-            margin: 0;
             font-family: Arial, sans-serif;
             background-color: #f4f4f9;
         }
         h1 {
             color: #333;
         }
         .mic-button {
-            font-size: 2rem;
-            padding: 1rem 2rem;
-            color: white;
             background-color: #007bff;
             border: none;
-            border-radius: 50px;
             cursor: pointer;
-            transition: background-color 0.3s;
-        }
-        .mic-button:hover {
-            background-color: #0056b3;
         }
         .status, .response {
-            margin-top: 1rem;
-            text-align: center;
-            color: #555;
-            font-size: 1.2rem;
-        }
-        .response {
-            background-color: #e8e8ff;
-            padding: 1rem;
-            border-radius: 10px;
-            box-shadow: 0 4px 8px rgba(0, 0, 0, 0.2);
-            display: block;
         }
     </style>
 </head>
@@ -248,75 +61,186 @@ html_code = """
     <h1>AI Dining Assistant</h1>
     <button class="mic-button" id="mic-button">🎤</button>
     <div class="status" id="status">Press the mic button to start...</div>
-    <div class="response" id="response">Response will appear here...</div>
     <script>
         const micButton = document.getElementById('mic-button');
         const status = document.getElementById('status');
         const response = document.getElementById('response');
-        let mediaRecorder;
-        let audioChunks = [];
-        let isConversationActive = false;
         micButton.addEventListener('click', () => {
-            if (!isConversationActive) {
-                isConversationActive = true;
-                startConversation();
             }
         });
-        function startConversation() {
-            const utterance = new SpeechSynthesisUtterance('Hello, welcome to Biryani Hub! We have the following categories: Biryanis, Starters, Curries, Desserts, Soft Drinks. Please choose a category.');
             speechSynthesis.speak(utterance);
             utterance.onend = () => {
-                status.textContent = 'Listening...';
                 startListening();
             };
         }
-        function startListening() {
-            navigator.mediaDevices.getUserMedia({ audio: true }).then(stream => {
-                mediaRecorder = new MediaRecorder(stream, { mimeType: 'audio/webm;codecs=opus' });
-                mediaRecorder.start();
-                audioChunks = [];
-                mediaRecorder.ondataavailable = event => audioChunks.push(event.data);
-                mediaRecorder.onstop = async () => {
-                    const audioBlob = new Blob(audioChunks, { type: 'audio/webm' });
-                    const formData = new FormData();
-                    formData.append('audio', audioBlob);
-                    status.textContent = 'Processing...';
-                    try {
-                        const result = await fetch('/process-audio', { method: 'POST', body: formData });
-                        const data = await result.json();
-                        response.textContent = 'You said: ' + data.response; // Display user text
-                        response.style.display = 'block';
-                        const utterance = new SpeechSynthesisUtterance(data.response);
-                        speechSynthesis.speak(utterance);
-                        utterance.onend = () => {
-                            console.log("Speech synthesis completed.");
-                            status.textContent = 'Listening...';
-                            setTimeout(() => {
-                                startListening();
-                            }, 100);
-                        };
-                        utterance.onerror = (e) => {
-                            console.error("Speech synthesis error:", e.error);
-                            status.textContent = 'Error with speech output.';
-                            isConversationActive = false;
-                        };
-                    } catch (error) {
-                        response.textContent = 'Sorry, I could not understand. Please try again.';
-                        response.style.display = 'block';
-                        status.textContent = 'Press the mic button to restart the conversation.';
-                        isConversationActive = false;
-                    }
-                };
-                setTimeout(() => mediaRecorder.stop(), 5000);
-            }).catch(() => {
-                status.textContent = 'Microphone access denied.';
-                isConversationActive = false;
-            });
         }
     </script>
 </body>
 </html>
 """
 if __name__ == "__main__":
     app.run(host="0.0.0.0", port=7860)

+# Voice assistant
 from flask import Flask, render_template_string, request, jsonify
+import speech_recognition as sr
 from tempfile import NamedTemporaryFile
+import os
 import ffmpeg
+import logging
+from werkzeug.exceptions import BadRequest
 app = Flask(__name__)
 logging.basicConfig(level=logging.INFO)
 # Global variables
+# Shopping cart shared by the whole process: process_command appends
+# (item name, unit price, quantity) tuples and clears it on the final order.
+cart = []  # To store items, quantities, and prices
+# Menu catalogue: category name -> {item name -> price}. Prices are shown
+# to the user with the rupee sign (₹) in the spoken/text responses.
+MENU = {
+    "Biryani": {"Chicken Biryani": 250, "Veg Biryani": 200, "Mutton Biryani": 300},
+    "Starters": {"Chicken Wings": 220, "Paneer Tikka": 180, "Fish Fingers": 250, "Spring Rolls": 160},
+    "Breads": {"Butter Naan": 50, "Garlic Naan": 60, "Roti": 40, "Lachha Paratha": 70},
+    "Curries": {"Butter Chicken": 300, "Paneer Butter Masala": 250, "Dal Tadka": 200, "Chicken Tikka Masala": 320},
+    "Drinks": {"Coke": 60, "Sprite": 60, "Mango Lassi": 80, "Masala Soda": 70},
+    "Desserts": {"Gulab Jamun": 100, "Rasgulla": 90, "Ice Cream": 120, "Brownie with Ice Cream": 180},
 }
+# Conversation state kept between requests and updated by process_command.
+current_category = None  # MENU key of the category the user last selected
+current_item = None  # Item chosen but not yet added because its quantity is unknown
+awaiting_quantity = False  # True while the assistant is waiting to hear a quantity
+# HTML Template for Frontend
 html_code = """
 <!DOCTYPE html>
 <html lang="en">
     <title>AI Dining Assistant</title>
     <style>
         body {
             font-family: Arial, sans-serif;
+            text-align: center;
             background-color: #f4f4f9;
         }
         h1 {
             color: #333;
         }
         .mic-button {
+            width: 80px;
+            height: 80px;
+            border-radius: 50%;
             background-color: #007bff;
+            color: white;
+            font-size: 24px;
             border: none;
             cursor: pointer;
         }
         .status, .response {
+            margin-top: 20px;
         }
     </style>
 </head>
     <h1>AI Dining Assistant</h1>
     <button class="mic-button" id="mic-button">🎤</button>
     <div class="status" id="status">Press the mic button to start...</div>
+    <div class="response" id="response" style="display: none;">Response will appear here...</div>
     <script>
         const micButton = document.getElementById('mic-button');
         const status = document.getElementById('status');
         const response = document.getElementById('response');
+        let isListening = false;
         micButton.addEventListener('click', () => {
+            if (!isListening) {
+                isListening = true;
+                greetUser();
             }
         });
+        function greetUser() {
+            const utterance = new SpeechSynthesisUtterance("Hi. Welcome to Biryani Hub. Can I show you the menu?");
             speechSynthesis.speak(utterance);
             utterance.onend = () => {
+                status.textContent = "Listening...";
                 startListening();
             };
         }
+        // Record five seconds of microphone audio, post it to /process-audio,
+        // show and speak the reply, then listen again until the reply ends
+        // the conversation.
+        async function startListening() {
+            let stream;
+            try {
+                stream = await navigator.mediaDevices.getUserMedia({ audio: true });
+            } catch (error) {
+                // A denied or missing microphone rejects the promise; without
+                // this handler the page stays stuck with isListening === true.
+                status.textContent = "Microphone access denied.";
+                isListening = false;
+                return;
+            }
+            const mediaRecorder = new MediaRecorder(stream, { mimeType: "audio/webm;codecs=opus" });
+            const audioChunks = [];
+            mediaRecorder.ondataavailable = (event) => audioChunks.push(event.data);
+            mediaRecorder.onstop = async () => {
+                // Every turn opens a fresh stream, so release this one's tracks
+                // instead of leaving the microphone captured.
+                stream.getTracks().forEach((track) => track.stop());
+                const audioBlob = new Blob(audioChunks, { type: "audio/webm" });
+                const formData = new FormData();
+                formData.append("audio", audioBlob);
+                status.textContent = "Processing...";
+                try {
+                    const result = await fetch("/process-audio", { method: "POST", body: formData });
+                    const data = await result.json();
+                    response.textContent = data.response;
+                    response.style.display = "block";
+                    const utterance = new SpeechSynthesisUtterance(data.response);
+                    // Handlers are attached before speak() so no event is missed.
+                    utterance.onend = () => {
+                        if (!data.response.includes("Goodbye") && !data.response.includes("final order")) {
+                            status.textContent = "Listening...";
+                            startListening(); // Continue listening
+                        } else {
+                            status.textContent = "Conversation ended.";
+                            isListening = false;
+                        }
+                    };
+                    utterance.onerror = () => {
+                        status.textContent = "Error with speech output. Press the mic button to restart.";
+                        isListening = false;
+                    };
+                    speechSynthesis.speak(utterance);
+                } catch (error) {
+                    response.textContent = "Error processing your request. Please try again.";
+                    // The response box starts hidden; reveal it so the error is visible.
+                    response.style.display = "block";
+                    status.textContent = "Press the mic button to restart.";
+                    isListening = false;
+                }
+            };
+            mediaRecorder.start();
+            setTimeout(() => mediaRecorder.stop(), 5000); // Stop recording after 5 seconds
         }
     </script>
 </body>
 </html>
 """
+@app.route("/")
+def index():
+    """Serve the voice assistant page rendered from the ``html_code`` template."""
+    return render_template_string(html_code)
+@app.route("/process-audio", methods=["POST"])
+def process_audio():
+    """Transcribe an uploaded audio clip and reply with the assistant's answer.
+
+    The clip is read from the ``audio`` form field, converted with ffmpeg to
+    16 kHz mono PCM WAV, transcribed with ``recognize_google`` and the text is
+    handed to ``process_command``.
+
+    Returns:
+        A JSON body ``{"response": <text>}``. The status is 400 when the
+        upload is missing or empty and 500 for any other failure.
+    """
+    # Each temporary path is recorded as soon as the file exists, so the
+    # cleanup below never refers to a file that an early error prevented from
+    # being created. Previously that raised inside ``finally`` and replaced
+    # the intended 400 response with a server error.
+    temp_paths = []
+    try:
+        audio_file = request.files.get("audio")
+        if not audio_file:
+            raise BadRequest("No audio file provided.")
+        # Only the file names are needed; closing the handles immediately
+        # avoids leaking descriptors while other code writes to the paths.
+        with NamedTemporaryFile(delete=False, suffix=".webm") as temp_file:
+            temp_paths.append(temp_file.name)
+        audio_file.save(temp_file.name)
+        if os.path.getsize(temp_file.name) == 0:
+            raise BadRequest("Uploaded audio file is empty.")
+        with NamedTemporaryFile(delete=False, suffix=".wav") as converted_file:
+            temp_paths.append(converted_file.name)
+        ffmpeg.input(temp_file.name).output(
+            converted_file.name, acodec="pcm_s16le", ac=1, ar="16000"
+        ).run(overwrite_output=True)
+        recognizer = sr.Recognizer()
+        with sr.AudioFile(converted_file.name) as source:
+            audio_data = recognizer.record(source)
+        try:
+            command = recognizer.recognize_google(audio_data)
+            logging.info("Recognized command: %s", command)
+            response = process_command(command)
+        except sr.UnknownValueError:
+            response = "Sorry, I couldn't understand your command. Could you please repeat?"
+        except sr.RequestError as e:
+            response = f"Error with the speech recognition service: {e}"
+        return jsonify({"response": response})
+    except BadRequest as br:
+        # ``description`` is the bare message; ``str(br)`` would repeat the
+        # "400 Bad Request:" prefix inside the spoken reply.
+        return jsonify({"response": f"Bad Request: {br.description}"}), 400
+    except Exception as e:
+        logging.exception("Failed to process the uploaded audio")
+        return jsonify({"response": f"An error occurred: {str(e)}"}), 500
+    finally:
+        for path in temp_paths:
+            try:
+                os.unlink(path)
+            except OSError:
+                # Cleanup is best effort and must not replace the response.
+                logging.warning("Could not remove temporary file %s", path)
+# Spoken quantities the recognizer may return as words instead of digits.
+_NUMBER_WORDS = {
+    "one": 1, "two": 2, "three": 3, "four": 4, "five": 5,
+    "six": 6, "seven": 7, "eight": 8, "nine": 9, "ten": 10,
+}
+def _parse_quantity(command):
+    """Return the first quantity mentioned in *command*, or None if there is none."""
+    for word in command.split():
+        token = word.strip(".,!?")
+        if token.isdecimal():
+            return int(token)
+        if token in _NUMBER_WORDS:
+            return _NUMBER_WORDS[token]
+    return None
+def _cart_summary(separator=", "):
+    """Return the cart rendered as text joined by *separator*, and its total price."""
+    lines = [f"{name} x{qty} (₹{price * qty})" for name, price, qty in cart]
+    total = sum(price * qty for _, price, qty in cart)
+    return separator.join(lines), total
+def process_command(command):
+    """Interpret one transcribed utterance and return the assistant's reply.
+
+    Intents are tried in this order: pending quantity, item removal, an item
+    of the current category named in full, category selection, a partial item
+    name, final order, cart details, menu request, and finally a fallback.
+
+    Args:
+        command: Text recognized from the user's speech.
+
+    Returns:
+        The sentence to show and speak back to the user.
+    """
+    global current_category, current_item, awaiting_quantity
+    command = command.lower().strip()
+    if not command:
+        # An empty string is a substring of every item name and would
+        # otherwise select the first item of the current category.
+        return "Sorry, I didn't understand that. Please try again."
+    # Handle quantity input: digits or number words anywhere in the utterance
+    # ("two", "2 plates"), not only an utterance made of digits alone.
+    if awaiting_quantity and current_item is not None:
+        quantity = _parse_quantity(command)
+        if quantity is not None:
+            if quantity < 1:
+                return "Quantity must be at least 1. How many would you like to order?"
+            cart.append((current_item, MENU[current_category][current_item], quantity))
+            awaiting_quantity = False
+            item = current_item
+            current_item = None
+            cart_summary, total = _cart_summary()
+            return f"Added {quantity} of {item} to your cart. Cart: {cart_summary}. Total: ₹{total}. Would you like to see the menu again?"
+    # Handle item removal before category matching: names such as
+    # "Chicken Biryani" contain a category name and used to be swallowed by
+    # the category branch, which made them impossible to remove.
+    if "remove" in command:
+        for entry in cart:
+            if entry[0].lower() in command:
+                cart.remove(entry)
+                cart_summary, total = _cart_summary()
+                return f"Removed {entry[0]} from your cart. Updated cart: {cart_summary}. Total: ₹{total}."
+        return "The item you are trying to remove is not in your cart."
+    # An item of the current category spoken in full ("I want chicken
+    # biryani") wins over the category name it contains. The longest match is
+    # taken so "brownie with ice cream" is not mistaken for "ice cream".
+    if current_category:
+        spoken = [name for name in MENU[current_category] if name.lower() in command]
+        if spoken:
+            current_item = max(spoken, key=len)
+            awaiting_quantity = True
+            return f"How many quantities of {current_item} would you like?"
+    # Handle category selection
+    for category, items in MENU.items():
+        if category.lower() in command:
+            current_category = category
+            # Drop any pending item: it belongs to the previous category and
+            # its price could no longer be looked up under the new one.
+            current_item = None
+            awaiting_quantity = False
+            item_list = ", ".join([f"{item} (₹{price})" for item, price in items.items()])
+            return f"{category} menu: {item_list}. What would you like to order?"
+    # Handle item selection from a partial name ("chicken", "naan")
+    if current_category:
+        for item in MENU[current_category]:
+            if command in item.lower():
+                current_item = item
+                awaiting_quantity = True
+                return f"How many quantities of {current_item} would you like?"
+    # Handle final order
+    if "final order" in command or "submit" in command:
+        if cart:
+            order_details, total = _cart_summary()
+            cart.clear()
+            return f"Your final order is: {order_details}. Total price: ₹{total}. Thank you for visiting Biryani Hub!"
+        else:
+            return "Your cart is empty. Please add items before placing the final order."
+    # Handle cart details
+    if "cart details" in command:
+        if cart:
+            cart_summary, total = _cart_summary("\n")
+            return f"Your cart contains:\n{cart_summary}\nTotal: ₹{total}."
+        else:
+            return "Your cart is empty."
+    # Generic response for menu request. "yes" answers the assistant's own
+    # prompts ("Can I show you the menu?", "...see the menu again?").
+    if "menu" in command or "yes" in command.split():
+        categories = ", ".join(MENU.keys())
+        return f"We have the following categories: {categories}. Please select a category to proceed."
+    # Default response
+    return "Sorry, I didn't understand that. Please try again."
+# Start Flask's built-in server only when the file is run as a script.
 if __name__ == "__main__":
+    # 0.0.0.0 accepts connections on every network interface; port 7860.
     app.run(host="0.0.0.0", port=7860)