Voice_Menu_Ordering5

Sleeping

App Files Files Community

Voice_Menu_Ordering5 / app.py

nagasurendra

Update app.py

ac47bc5 verified about 1 year ago

raw

history blame contribute delete

4.51 kB

	import gradio as gr
	from gtts import gTTS
	import os
	import tempfile
	import json
	import speech_recognition as sr

	# In-memory cart: a module-level list of the item names ordered so far.
	cart = []

	# Menu catalogue: item name -> unit price in dollars.
	menu_items = {
	    "Pizza": 10.99,
	    "Burger": 8.49,
	    "Pasta": 12.99,
	    "Salad": 7.99,
	    "Soda": 2.49,
	}

	def generate_voice_response(text):
	    """Synthesize ``text`` to speech and return the path of the MP3 file.

	    Args:
	        text: The sentence(s) to speak.

	    Returns:
	        Path of a newly created temporary ``.mp3`` file, or ``None`` when
	        ``text`` is empty or whitespace-only (there is nothing to speak).

	    Raises:
	        Whatever ``gTTS.save`` raises when synthesis fails; the temporary
	        file is removed before the exception propagates.
	    """
	    # gTTS refuses empty input, so skip synthesis instead of crashing.
	    if not text or not text.strip():
	        return None

	    tts = gTTS(text)
	    # Only the unique file name is needed; the handle is closed right away
	    # so the synthesizer can reopen the path itself. delete=False keeps the
	    # file on disk after the handle is closed.
	    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as temp_file:
	        mp3_path = temp_file.name
	    try:
	        tts.save(mp3_path)
	    except Exception:
	        # Do not leave an empty/partial temp file behind on failure.
	        os.remove(mp3_path)
	        raise
	    return mp3_path

	def calculate_total(cart):
	    """Return the number of items in ``cart``.

	    Despite the name, prices are deliberately not summed: the "total" is
	    the item count only.

	    Args:
	        cart: A sized collection of ordered items.

	    Returns:
	        ``len(cart)``.
	    """
	    return len(cart)

	def _menu_lines():
	    """Return the menu as one item name per line, each newline-terminated."""
	    return "".join(f"{name}\n" for name in menu_items)


	def _bulleted(items):
	    """Return ``items`` as newline-terminated ``- item`` bullet lines."""
	    return "".join(f"- {entry}\n" for entry in items)


	def restaurant_voice_assistant(audio, state_json):
	    """Handle one voice turn of the ordering dialogue.

	    The first call of a conversation always presents the menu. Later calls
	    transcribe ``audio`` and answer price questions, add an item to the
	    cart, repeat the menu, or finalize the order.

	    Args:
	        audio: Path of the recorded audio file, or a falsy value when there
	            is no recording.
	        state_json: JSON-encoded conversation state (``menu_shown``,
	            ``current_items``); a falsy value means a fresh conversation.

	    Returns:
	        A ``(response_text, voice_path, state_json)`` tuple. When there is
	        no recognizable input after the menu was shown, the tuple is
	        ``("", None, state_json)`` and no speech is generated.

	    Note:
	        Orders are stored in the module-level ``cart`` list, so every
	        caller in the same process shares one cart.
	    """
	    state = json.loads(state_json) if state_json else {}

	    # Convert audio input to text.
	    input_text = ""
	    recognition_failed = False
	    if audio:
	        recognizer = sr.Recognizer()
	        with sr.AudioFile(audio) as source:
	            recording = recognizer.record(source)
	        try:
	            input_text = recognizer.recognize_google(recording).lower()
	        except sr.UnknownValueError:
	            # Unintelligible speech is treated as "nothing was said".
	            input_text = ""
	        except sr.RequestError:
	            # The recognition service could not be reached or rejected the
	            # request; tell the user instead of crashing the handler.
	            recognition_failed = True

	    # Menu items whose (lower-cased) name occurs in the transcript.
	    mentioned = [item for item in menu_items if item.lower() in input_text]

	    if not state.get("menu_shown", False):
	        # Show menu dynamically on the first turn.
	        response = (
	            "Welcome to our restaurant! Here is our menu:\n"
	            + _menu_lines()
	            + "\nPlease tell me the item you would like to add to your cart or ask for the price of an item."
	        )
	        state["menu_shown"] = True
	    elif recognition_failed:
	        response = "Sorry, I couldn't reach the speech recognition service. Please try again."
	    elif not input_text.strip():
	        # Wait for valid input without responding if no input is provided.
	        return "", None, json.dumps(state)
	    elif "price of" in input_text:
	        # Handle price queries.
	        if len(mentioned) == 1:
	            item = mentioned[0]
	            response = f"The price of {item} is ${menu_items[item]:.2f}."
	        elif len(mentioned) > 1:
	            response = f"I detected multiple items in your input: {', '.join(mentioned)}. Please ask for the price of one item at a time."
	        else:
	            response = "I couldn't find that item on the menu. Please ask for an item available in the menu."
	    elif mentioned:
	        # Items already added in the current ordering cycle are not re-added.
	        already_added = state.get("current_items", [])
	        new_items = [item for item in mentioned if item not in already_added]
	        if len(new_items) == 1:
	            item = new_items[0]
	            cart.append(item)
	            state.setdefault("current_items", []).append(item)
	            response = (
	                f"{item} has been added to your cart. Your current cart includes:\n"
	                + _bulleted(cart)
	                + "\nWould you like to add anything else?"
	            )
	        elif len(new_items) > 1:
	            response = f"I detected multiple items in your input: {', '.join(new_items)}. Please mention one item at a time."
	        else:
	            # Every mentioned item was already added. Without this branch the
	            # response stayed empty and speech synthesis failed on it.
	            response = f"Already in your cart: {', '.join(mentioned)}. Would you like to add anything else?"
	    elif "menu" in input_text:
	        response = (
	            "Here is our menu again:\n"
	            + _menu_lines()
	            + "\nWhat would you like to add to your cart or ask about?"
	        )
	    elif "final order" in input_text or "submit order" in input_text:
	        if cart:
	            response = (
	                "Your final order includes:\n"
	                + _bulleted(cart)
	                + "\nThank you for ordering!"
	            )
	            # Empty the shared list in place after finalizing the order.
	            cart.clear()
	            state["current_items"] = []  # Clear current cycle tracking
	        else:
	            response = "Your cart is empty. Would you like to order something?"
	    else:
	        response = "I didn’t quite catch that. Please tell me what you’d like to order or ask about."

	    voice_path = generate_voice_response(response)
	    return response, voice_path, json.dumps(state)

	# Build the UI: one audio input, a text box and an audio player for the
	# assistant's reply, plus a hidden per-session state value.
	with gr.Blocks() as demo:
	    # Conversation state travels as a JSON string; it starts as an empty object.
	    state = gr.State(value=json.dumps({}))

	    with gr.Row():
	        # type="filepath" makes the handler receive a path to the recording.
	        user_audio = gr.Audio(type="filepath", label="Your Voice Input")
	        output_text = gr.Textbox(label="Response Text")

	    with gr.Row():
	        voice_output = gr.Audio(label="Response Audio", autoplay=True)

	    # Run the assistant whenever the audio input value changes. The listener
	    # is registered inside the Blocks context so it is attached to this app.
	    user_audio.change(
	        restaurant_voice_assistant,
	        inputs=[user_audio, state],
	        outputs=[output_text, voice_output, state],
	    )

	demo.launch()