First_agent_uasername

Build error

App Files Files Community

First_agent_uasername / app.py

uasername

Update app.py

8b67e5c verified 11 months ago

raw

history blame contribute delete

5.81 kB

	import os
	import requests
	import random
	import yaml
	import datetime
	import pytz
	import gradio as gr
	from gtts import gTTS # Use Google TTS instead of pyttsx3
	from smolagents import CodeAgent, DuckDuckGoSearchTool, HfApiModel, load_tool, tool
	from tools.final_answer import FinalAnswerTool
	from Gradio_UI import GradioUI
	from tools.web_search import DuckDuckGoSearchTool
	from tools.visit_webpage import VisitWebpageTool

	from Code_Functions import speak_text


	from smolagents.agent_types import AgentText
	from smolagents.agent_types import AgentAudio

	import soundfile
	import io
	import librosa
	import numpy as np

	@tool
	def lookup_definition(query: str) -> AgentText:
	    """Fetches the definition of a word from the Dictionary API and returns it as AgentText.

	    The reply lists the word, its origin (or a placeholder when the API gives
	    none) and every definition prefixed with its part of speech. Lookup
	    failures are reported in the returned text instead of being raised.

	    Args:
	        query: The word to look up.

	    Returns:
	        A text response.
	    """
	    # Imported locally so this block needs no new file-level import.
	    from urllib.parse import quote

	    # Percent-encode the word so spaces, '/' or '?' cannot change the URL path.
	    encoded_word = quote(query.strip(), safe="")
	    url = f"https://api.dictionaryapi.dev/api/v2/entries/en/{encoded_word}"
	    try:
	        # The timeout keeps a stalled API from blocking the agent step forever.
	        response = requests.get(url, timeout=10)
	        if response.status_code == 404:
	            # The API answers 404 for words it does not know; that is a
	            # normal "not found" outcome rather than a transport error.
	            return AgentText("No definition found.")
	        response.raise_for_status()
	        data = response.json()
	    except (requests.RequestException, ValueError) as e:
	        # ValueError covers a non-JSON body on requests versions whose JSON
	        # decoding error is not a RequestException subclass.
	        return AgentText(f"Error fetching definition: {str(e)}")

	    # Only a non-empty list of entries can be formatted below.
	    if not data or not isinstance(data, list):
	        return AgentText("No definition found.")

	    entry = data[0]
	    word = entry.get("word", "Unknown word")
	    origin = entry.get("origin", "Origin not available")
	    definitions = [
	        f"({meaning.get('partOfSpeech', 'Unknown')}) {definition['definition']}"
	        for meaning in entry.get("meanings", [])
	        for definition in meaning.get("definitions", [])
	        if definition.get("definition")  # skip entries without definition text
	    ]

	    if not definitions:
	        response_text = f"Word: {word}\nOrigin: {origin}\nNo definitions found."
	    else:
	        response_text = f"Word: {word}\nOrigin: {origin}\nDefinitions:\n- " + "\n- ".join(definitions)

	    return AgentText(response_text)







	@tool
	def text_to_speech(text: str) -> AgentAudio:
	    """
	    Converts input text to speech and returns an AgentAudio instance with the audio file path.

	    Args:
	        text: The text string with word definition that will be converted into speech.

	    Returns:
	        AgentAudio: An AgentAudio instance containing the file path to the generated audio.
	    """
	    from gtts import gTTS

	    # Fixed location: every call overwrites the previously generated MP3.
	    output_path = "/tmp/response.mp3"
	    gTTS(text=text, lang='en').save(output_path)
	    return AgentAudio(output_path)


	# Path of the MP3 file that speak_text writes; it is overwritten on every call.
	AUDIO_OUTPUT_PATH = "/tmp/response.mp3"


	# NOTE: this definition rebinds the name speak_text that the file also
	# imports from Code_Functions near the top.
	def speak_text(text):
	    """Synthesize *text* as English speech with gTTS and store it as an MP3.

	    Args:
	        text: The text to be spoken.

	    Returns:
	        AUDIO_OUTPUT_PATH, the path of the saved MP3 (suitable for a Gradio
	        Audio component configured with type="filepath").
	    """
	    gTTS(text=text, lang='en').save(AUDIO_OUTPUT_PATH)
	    return AUDIO_OUTPUT_PATH



	@tool
	def search_dad_jokes(term: str) -> str:
	    """A tool that searches for dad jokes containing a specific term.

	    Args:
	        term: The keyword to search for in dad jokes.

	    Returns:
	        The result text together with the path of the MP3 file in which that text is spoken.
	    """
	    headers = {
	        "Accept": "application/json",
	        "User-Agent": "YourAppName (https://yourappurl.com)"
	    }
	    try:
	        response = requests.get(
	            "https://icanhazdadjoke.com/search",
	            # Passing the term via params lets requests URL-encode it, so
	            # spaces, '&' or '#' in the term cannot corrupt the query string.
	            params={"term": term},
	            headers=headers,
	            # Without a timeout a stalled server would block the caller forever.
	            timeout=10,
	        )
	        # Surface HTTP errors directly instead of failing later on the payload.
	        response.raise_for_status()
	        data = response.json()
	        # Tolerate a payload without (or with an empty) 'results' entry.
	        jokes = [joke['joke'] for joke in (data.get('results') or [])]
	        if jokes:
	            response_text = f"Found {len(jokes)} jokes:\n" + "\n\n".join(jokes)
	        else:
	            response_text = f"No jokes found for the term '{term}'."
	    except Exception as e:
	        # Deliberate best-effort boundary: any failure becomes the text
	        # that is shown (and spoken) to the user.
	        response_text = f"Error searching for jokes: {str(e)}"

	    # Generate audio using gTTS
	    audio_file = speak_text(response_text)

	    # NOTE(review): the signature is annotated `-> str`, but a
	    # (text, audio_path) pair is returned and gradio_search_jokes unpacks
	    # both values. The shape is kept as-is; the annotation should be
	    # aligned once its effect on the tool's declared output type is checked.
	    return response_text, audio_file


	# Aliases under which the three @tool-decorated functions defined in this
	# file are passed to the agent's tool list.
	lookup_definition_tool = lookup_definition
	text_to_speech_tool = text_to_speech
	dad_jokes_tool = search_dad_jokes

	# Tool instances built from the imported tool classes.
	# DuckDuckGoSearchTool is imported twice at the top of the file (from
	# smolagents and from tools.web_search); the later import, from
	# tools.web_search, is the one bound to the name used here.
	final_answer = FinalAnswerTool()
	web_search_tool = DuckDuckGoSearchTool()
	visit_webpage_tool = VisitWebpageTool()



	# If the agent stops answering, the model below is probably overloaded.
	# Switch to another model, or to the following Hugging Face endpoint, which
	# also serves Qwen2.5 Coder:
	# model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'
	model = HfApiModel(
	    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',  # this model may be overloaded at times
	    temperature=0.5,
	    max_tokens=2096,
	    custom_role_conversions=None,
	)


	# Import tool from Hub.
	# NOTE: trust_remote_code=True is an explicit opt-in to code that comes from
	# the Hub repository; keep it only for repositories you trust.
	image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)

	# Load the agent's prompt templates. The encoding is given explicitly so the
	# file is read the same way regardless of the platform's default encoding.
	with open("prompts.yaml", 'r', encoding="utf-8") as stream:
	    prompt_templates = yaml.safe_load(stream)

	# Agent wired with the model, the prompt templates loaded from prompts.yaml
	# and every tool defined or loaded above.
	agent = CodeAgent(
	    model=model,
	    prompt_templates=prompt_templates,
	    # Add your tools here (don't remove final_answer).
	    tools=[
	        visit_webpage_tool,
	        web_search_tool,
	        final_answer,
	        image_generation_tool,
	        lookup_definition_tool,
	        text_to_speech_tool,
	        dad_jokes_tool,
	    ],
	    max_steps=6,
	    verbosity_level=1,
	    planning_interval=None,
	    grammar=None,
	    name=None,
	    description=None,
	)

	# Gradio callback producing both the text and the audio output
	def gradio_search_jokes(word):
	    """Run search_dad_jokes for *word* and hand its two results to Gradio.

	    Args:
	        word: The search term typed into the UI.

	    Returns:
	        A (text, audio file path) tuple, in the order of the UI's outputs.
	    """
	    # search_dad_jokes must yield exactly two values: the text and the file path.
	    jokes_text, audio_path = search_dad_jokes(word)
	    return jokes_text, audio_path



	# Define the Gradio UI
	# NOTE(review): the nesting below is reconstructed from the blank-line
	# grouping of the statements (three components in the row, button beneath
	# it) -- confirm against the intended layout.
	with gr.Blocks() as demo:
	    gr.Markdown("### Dad Jokes Finder with AI & Text-to-Speech 🎙️")

	    # Input word, joke text and spoken audio side by side.
	    with gr.Row():
	        input_box = gr.Textbox(label="Enter a word")
	        output_text = gr.Textbox(label="Jokes Found")
	        output_audio = gr.Audio(label="Audio Pronunciation", type="filepath")

	    # Clicking the button sends the word to gradio_search_jokes and routes
	    # its two return values to the text box and the audio player.
	    btn = gr.Button("Get Jokes")
	    btn.click(
	        fn=gradio_search_jokes,
	        inputs=input_box,
	        outputs=[output_text, output_audio],
	    )

	# Start the web app as soon as the script runs.
	demo.launch()


	# GradioUI(agent).launch()