Spaces:
Sleeping
Sleeping
| import os | |
| import speech_recognition as sr | |
| import logging | |
| from flask import Flask, render_template_string, request, jsonify | |
| from tempfile import NamedTemporaryFile | |
| import ffmpeg | |
| from fuzzywuzzy import process, fuzz | |
# Route INFO-and-above log records through the root logger.
logging.basicConfig(level=logging.INFO)

# The Flask application object for this module.
app = Flask(__name__)
# --- Module-level conversation state ---------------------------------------

# Cart entries; each entry is a list of [item_name, price, quantity].
cart = []

# Currently selected menu and menu section; both are None until chosen.
menu_preferences = section_preferences = None

# Menu name kept as the default for resetting menu preferences.
default_menu_preferences = "all"
# Menu sections mapped to the item names they contain.
default_sections = {
    "biryanis": [
        "veg biryani",
        "paneer biryani",
        "chicken biryani",
        "mutton biryani",
    ],
    "starters": [
        "samosa",
        "onion pakoda",
        "chilli gobi",
        "chicken manchurian",
        "veg manchurian",
    ],
    "curries": [
        "paneer butter",
        "chicken curry",
        "fish curry",
        "chilli chicken",
    ],
    "desserts": [
        "gulab jamun",
        "ice cream",
    ],
    "soft drinks": [
        "cola",
        "lemon soda",
    ],
}
# Unit price of every orderable item, keyed by item name.
# Key order is kept as-is because the "all" menu is built from these keys.
prices = {
    "samosa":             9,
    "onion pakoda":       10,
    "chilli gobi":        12,
    "chicken biryani":    14,
    "mutton biryani":     16,
    "veg biryani":        12,
    "paneer butter":      10,
    "fish curry":         12,
    "chicken manchurian": 14,
    "veg manchurian":     12,
    "chilli chicken":     14,
    "paneer biryani":     13,
    "chicken curry":      14,
    "gulab jamun":        8,
    "ice cream":          6,
    "cola":               5,
    "lemon soda":         6,
}
# Item names available under each menu preference.
menus = {
    # Every priced item, in the order the price table lists them.
    "all": list(prices),
    "vegetarian": [
        "samosa",
        "onion pakoda",
        "chilli gobi",
        "veg biryani",
        "paneer butter",
        "veg manchurian",
        "paneer biryani",
        "gulab jamun",
        "ice cream",
        "cola",
        "lemon soda",
    ],
    "non-vegetarian": [
        "chicken biryani",
        "mutton biryani",
        "fish curry",
        "chicken manchurian",
        "chilli chicken",
        "chicken curry",
        "gulab jamun",
        "ice cream",
        "cola",
        "lemon soda",
    ],
}
@app.route("/")
def index():
    """Serve the single-page voice assistant UI.

    The view is registered at the site root; without a route registration
    Flask never calls it and the page cannot be loaded.

    Returns:
        The rendered ``html_code`` template string.
    """
    return render_template_string(html_code)
def reset_cart():
    """Empty the cart and forget the chosen menu and section.

    Rebinds the module-level ``cart`` to a new empty list and sets both
    preference globals back to ``None``.

    Returns:
        A fixed confirmation message.
    """
    # NOTE(review): no route registration for this view is visible here --
    # confirm how it is exposed.
    global cart, menu_preferences, section_preferences
    cart, menu_preferences, section_preferences = [], None, None
    return "Cart reset successfully."
def _discard_file(path):
    """Delete the temporary file at *path*; skip ``None`` and log failures."""
    if path is None:
        return
    try:
        os.unlink(path)
    except OSError:
        logging.warning("Could not remove temporary file %s", path)


@app.route("/process-audio", methods=["POST"])
def process_audio():
    """Transcribe an uploaded voice clip and answer it.

    Expects a multipart upload with the recording in the ``audio`` field.
    The clip is converted to 16 kHz mono PCM WAV with ffmpeg, transcribed
    with Google speech recognition, and the transcript is passed to
    ``process_command``.

    Returns:
        A JSON body ``{"response": <text>}``. A missing upload yields HTTP
        400; every other outcome (including recognition or processing
        errors, reported in the text) yields HTTP 200.
    """
    audio_file = request.files.get("audio")
    if not audio_file:
        # Answer before any temporary file exists, so there is nothing to
        # clean up on this path.
        return jsonify({"response": "Oops! I didn't catch any audio. Please try again."}), 400

    upload_path = None
    wav_path = None
    try:
        # Only the file names are needed; close the handles right away so
        # no descriptors leak and other writers can reopen the paths.
        with NamedTemporaryFile(delete=False, suffix=".webm") as upload:
            upload_path = upload.name
        audio_file.save(upload_path)

        with NamedTemporaryFile(delete=False, suffix=".wav") as converted:
            wav_path = converted.name
        ffmpeg.input(upload_path).output(
            wav_path, acodec="pcm_s16le", ac=1, ar="16000"
        ).run(overwrite_output=True)

        recognizer = sr.Recognizer()
        with sr.AudioFile(wav_path) as source:
            # No ambient-noise calibration: on a file source it would read
            # (and so drop) the first second of the user's speech, and the
            # energy threshold is not used when recording a whole file.
            audio_data = recognizer.record(source)

        try:
            raw_command = recognizer.recognize_google(audio_data).lower()
        except sr.UnknownValueError:
            # Report the failure directly instead of interpreting the
            # error text as if the user had spoken it.
            logging.info("Speech could not be understood")
            response = "Sorry, I couldn't understand that."
        except sr.RequestError as e:
            logging.warning("Speech recognition request failed: %s", e)
            response = f"Request error from the service: {e}"
        else:
            logging.info(f"User said: {raw_command}")
            response = process_command(preprocess_command(raw_command))
    except Exception as e:
        # Request boundary: log the traceback and still answer with JSON.
        logging.exception("Audio processing failed")
        response = f"An error occurred: {str(e)}"
    finally:
        _discard_file(upload_path)
        _discard_file(wav_path)
    return jsonify({"response": response})
def preprocess_command(command):
    """Return *command* without surrounding whitespace and in lower case."""
    return command.strip().lower()
def _menu_items(section):
    """Return the items of *section* allowed by the current menu preference."""
    allowed = menus.get(menu_preferences, [])
    return [item for item in default_sections[section] if item in allowed]


def _detect_menu_preference(command):
    """Return the menu name mentioned in *command*, or ``None``.

    Keyword checks run before fuzzy matching because "vegetarian" is a
    substring of "non vegetarian": a partial-ratio match alone would map a
    spoken "non vegetarian" (no hyphen) to the vegetarian menu.
    """
    spaced = command.replace("-", " ")
    if "non veg" in spaced or "nonveg" in spaced:
        return "non-vegetarian"
    if "veg" in spaced:
        return "vegetarian"
    if "all" in [word.strip(".,!?") for word in spaced.split()]:
        return "all"
    closest_match = process.extractOne(
        command, ["non-vegetarian", "vegetarian", "all"], scorer=fuzz.partial_ratio
    )
    if closest_match and closest_match[1] > 75:
        return closest_match[0]
    return None


def process_command(command):
    """Advance the ordering conversation by one spoken command.

    The conversation moves through three stages tracked in module globals:
    choosing a menu (``menu_preferences``), choosing a section
    (``section_preferences``), then adding items to ``cart``. Saying
    "final order" or "complete order" at any stage places the order and
    resets all three.

    Args:
        command: The transcribed user utterance.

    Returns:
        The assistant's reply text.
    """
    global cart, menu_preferences, section_preferences

    command = command.strip().lower()
    words = [word.strip(".,!?") for word in command.split()]

    # Finalize order
    if "final order" in command or "complete order" in command:
        if not cart:
            return "Your cart is empty. Please add items before finalizing the order."
        order_summary = "\n".join(
            f"{item[2]} x {item[0]} for {item[1] * item[2]} INR" for item in cart
        )
        total_price = sum(item[1] * item[2] for item in cart)
        cart.clear()  # Clear the cart after finalizing
        menu_preferences = None
        section_preferences = None
        return f"Your order has been placed successfully:\n{order_summary}\nTotal: {total_price} INR.\nThank you for ordering!"

    # Stage 1: greet the user and ask for a menu preference.
    if menu_preferences is None:
        # "hi" must be a whole word; as a substring it also occurs inside
        # ordinary words such as "this" or "chicken".
        if "hello" in command or "hi" in words:
            return "Hello, welcome to Biryani Hub! Please choose your preference: All, Vegetarian, or Non-Vegetarian."
        if command in ("non-vegetarian", "vegetarian", "all"):
            menu_preferences = command
            return f"You've selected the {command} menu! Which section would you like to browse next? (e.g., biryanis, starters, curries, desserts, soft drinks)"
        detected = _detect_menu_preference(command)
        if detected:
            menu_preferences = detected
            return f"Great choice! You've chosen the {menu_preferences} menu. Which section would you like to browse next?"
        return "I couldn't recognize your choice. Please say either 'Non-Vegetarian', 'Vegetarian', or 'All'."

    # Stage 2: pick a section. Listings show only items the chosen menu
    # allows, so the user is never offered something that cannot be added.
    if section_preferences is None:
        sections = list(default_sections)
        for section in sections:
            if section in command:
                section_preferences = section
                return f"Here are the items in the {section_preferences} section: {', '.join(_menu_items(section_preferences))}. Please choose an item."
        closest_match = process.extractOne(command, sections, scorer=fuzz.partial_ratio)
        if closest_match and closest_match[1] > 75:
            section_preferences = closest_match[0]
            return f"Here are the items in the {section_preferences} section: {', '.join(_menu_items(section_preferences))}. What would you like to add?"
        return "I didn't catch that. Please say a section like 'biryanis', 'starters', 'curries', 'desserts', or 'soft drinks'."

    # Stage 3: add an item from the current section to the cart.
    for item in _menu_items(section_preferences):
        if item in command:
            # A recognized item with no spoken quantity means one portion.
            quantity = extract_quantity(command) or 1
            cart.append([item, prices[item], quantity])
            cart_summary = ", ".join(f"{entry[0]} x{entry[2]}" for entry in cart)
            return f"Added {quantity} x {item} to your cart. Your current cart: {cart_summary}. Would you like to add more items?"

    # No item matched: allow moving to another section instead of staying
    # locked into the first one chosen.
    for section in default_sections:
        if section in command:
            section_preferences = section
            return f"Here are the items in the {section_preferences} section: {', '.join(_menu_items(section_preferences))}. Please choose an item."

    return "I didn't recognize the item you mentioned. Please say the item name clearly, or choose from the available items."
# Spoken number words understood as quantities.
_NUMBER_WORDS = {
    "one": 1, "two": 2, "three": 3, "four": 4, "five": 5,
    "six": 6, "seven": 7, "eight": 8, "nine": 9, "ten": 10,
}


def extract_quantity(command):
    """Return the first quantity mentioned in *command*, or ``None``.

    A quantity is either a number word from "one" to "ten" or any positive
    whole number written in digits (e.g. "3", "12"). Words are compared
    case-insensitively and with surrounding ``. , ! ?`` removed, so
    "two," still counts.

    Args:
        command: The user's utterance.

    Returns:
        The quantity as a positive ``int``, or ``None`` when no quantity
        is present.
    """
    for raw_word in command.split():
        word = raw_word.strip(".,!?").lower()
        if word in _NUMBER_WORDS:
            return _NUMBER_WORDS[word]
        if word.isdecimal():
            value = int(word)
            # Zero is not an orderable quantity; keep scanning.
            if value > 0:
                return value
    return None
# Single-page UI served at the site root. The page speaks a greeting, records
# five-second microphone clips, posts each clip to /process-audio, then shows
# and speaks the JSON "response" text and listens again until an order is
# placed.
html_code = """
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>AI Dining Assistant</title>
    <style>
        body {
            display: flex;
            flex-direction: column;
            align-items: center;
            justify-content: center;
            min-height: 100vh;
            margin: 0;
            font-family: Arial, sans-serif;
            background-color: #f4f4f9;
        }
        h1 {
            color: #333;
        }
        .mic-button {
            font-size: 2rem;
            padding: 1rem 2rem;
            color: white;
            background-color: #007bff;
            border: none;
            border-radius: 50px;
            cursor: pointer;
            transition: background-color 0.3s;
        }
        .mic-button:hover {
            background-color: #0056b3;
        }
        .status, .response {
            margin-top: 1rem;
            text-align: center;
            color: #555;
            font-size: 1.2rem;
        }
        .response {
            background-color: #e8e8ff;
            padding: 1rem;
            border-radius: 10px;
            box-shadow: 0 4px 8px rgba(0, 0, 0, 0.2);
            display: none;
        }
    </style>
</head>
<body>
    <h1>AI Dining Assistant</h1>
    <button class="mic-button" id="mic-button">🎤</button>
    <div class="status" id="status">Press the mic button to start...</div>
    <div class="response" id="response">Response will appear here...</div>
    <script>
        const micButton = document.getElementById('mic-button');
        const status = document.getElementById('status');
        const response = document.getElementById('response');
        let mediaRecorder;
        let audioChunks = [];
        let isConversationActive = false;

        micButton.addEventListener('click', () => {
            if (!isConversationActive) {
                isConversationActive = true;
                startConversation();
            }
        });

        function startConversation() {
            const utterance = new SpeechSynthesisUtterance('Hello, welcome to Biryani Hub! Please choose your preference: All, Vegetarian, or Non-Vegetarian.');
            utterance.onend = () => {
                status.textContent = 'Listening...';
                startListening();
            };
            speechSynthesis.speak(utterance);
        }

        function startListening() {
            navigator.mediaDevices.getUserMedia({ audio: true }).then(stream => {
                mediaRecorder = new MediaRecorder(stream, { mimeType: 'audio/webm;codecs=opus' });
                mediaRecorder.start();
                audioChunks = [];
                mediaRecorder.ondataavailable = event => audioChunks.push(event.data);
                mediaRecorder.onstop = async () => {
                    // Release the microphone; a new stream is requested for every turn.
                    stream.getTracks().forEach(track => track.stop());
                    const audioBlob = new Blob(audioChunks, { type: 'audio/webm' });
                    const formData = new FormData();
                    formData.append('audio', audioBlob);
                    status.textContent = 'Processing...';
                    try {
                        const result = await fetch('/process-audio', { method: 'POST', body: formData });
                        const data = await result.json();
                        response.textContent = data.response; // Display the assistant's reply
                        response.style.display = 'block';
                        const utterance = new SpeechSynthesisUtterance(data.response);
                        utterance.onend = () => {
                            console.log("Speech synthesis completed.");
                            if (data.response.includes("final order") || data.response.includes("Thank you for ordering")) {
                                status.textContent = 'Order completed. Press the mic button to start again.';
                                isConversationActive = false;
                            } else {
                                status.textContent = 'Listening...';
                                setTimeout(() => {
                                    startListening();
                                }, 100);
                            }
                        };
                        utterance.onerror = (e) => {
                            console.error("Speech synthesis error:", e.error);
                            status.textContent = 'Error with speech output.';
                            isConversationActive = false;
                        };
                        speechSynthesis.speak(utterance);
                    } catch (error) {
                        response.textContent = 'Sorry, I could not understand. Please try again.';
                        response.style.display = 'block';
                        status.textContent = 'Press the mic button to restart the conversation.';
                        isConversationActive = false;
                    }
                };
                setTimeout(() => mediaRecorder.stop(), 5000);
            }).catch(() => {
                status.textContent = 'Microphone access denied.';
                isConversationActive = false;
            });
        }
    </script>
</body>
</html>
"""
if __name__ == "__main__":
    # Run the built-in server on every interface, port 7860, when this
    # file is executed directly.
    app.run(port=7860, host="0.0.0.0")