Spaces:
Build error
Build error
| import os | |
| import requests | |
| import random | |
| import yaml | |
| import datetime | |
| import pytz | |
| import gradio as gr | |
| from gtts import gTTS # Use Google TTS instead of pyttsx3 | |
| from smolagents import CodeAgent, DuckDuckGoSearchTool, HfApiModel, load_tool, tool | |
| from tools.final_answer import FinalAnswerTool | |
| from Gradio_UI import GradioUI | |
| from tools.web_search import DuckDuckGoSearchTool | |
| from tools.visit_webpage import VisitWebpageTool | |
| from Code_Functions import speak_text | |
| from smolagents.agent_types import AgentText | |
| from smolagents.agent_types import AgentAudio | |
| import soundfile | |
| import io | |
| import librosa | |
| import numpy as np | |
def lookup_definition(query: str) -> AgentText:
    """Fetches the definition of a word from the Dictionary API and returns it as AgentText.

    Args:
        query: The word to look up.

    Returns:
        A text response listing the word, its origin and its definitions, or a
        short message when nothing was found or the request failed.
    """
    from urllib.parse import quote

    term = query.strip()
    if not term:
        # Nothing to look up; avoid calling the bare ".../en/" endpoint.
        return AgentText("No definition found.")

    # Percent-encode the word so spaces, "/" or "?" cannot alter the URL path.
    url = f"https://api.dictionaryapi.dev/api/v2/entries/en/{quote(term, safe='')}"
    try:
        # A timeout keeps an unresponsive server from blocking the caller forever.
        response = requests.get(url, timeout=10)
        if response.status_code == 404:
            # NOTE(review): the API appears to report unknown words with
            # HTTP 404 rather than an empty list -- confirm against its docs.
            return AgentText("No definition found.")
        response.raise_for_status()
        data = response.json()
    except (requests.RequestException, ValueError) as e:
        # ValueError covers a non-JSON body on requests versions whose JSON
        # error is not a RequestException subclass.
        return AgentText(f"Error fetching definition: {str(e)}")

    # Only a non-empty list of entry dicts is usable below.
    if not data or not isinstance(data, list) or not isinstance(data[0], dict):
        return AgentText("No definition found.")

    entry = data[0]
    word = entry.get("word", "Unknown word")
    origin = entry.get("origin", "Origin not available")
    definitions = [
        f"({meaning.get('partOfSpeech', 'Unknown')}) {definition['definition']}"
        for meaning in entry.get("meanings", [])
        for definition in meaning.get("definitions", [])
        if definition.get("definition")  # skip entries without definition text
    ]

    header = f"Word: {word}\nOrigin: {origin}\n"
    if not definitions:
        return AgentText(header + "No definitions found.")
    return AgentText(header + "Definitions:\n- " + "\n- ".join(definitions))
def text_to_speech(text: str) -> AgentAudio:
    """Synthesize English speech for a text and wrap the saved file as AgentAudio.

    Args:
        text: The text string (e.g. a word definition) that will be converted into speech.

    Returns:
        AgentAudio: An AgentAudio instance built from the path of the generated MP3 file.
    """
    from gtts import gTTS

    # Every call writes to the same fixed location.
    mp3_path = "/tmp/response.mp3"
    gTTS(text=text, lang='en').save(mp3_path)
    return AgentAudio(mp3_path)
# Location of the MP3 file written by speak_text
AUDIO_OUTPUT_PATH = "/tmp/response.mp3"


# NOTE(review): this definition replaces the speak_text imported from
# Code_Functions at the top of the file.
def speak_text(text):
    """Render text as English speech with gTTS and store it at AUDIO_OUTPUT_PATH.

    Returns the path of the saved MP3 so it can feed a Gradio Audio component.
    """
    gTTS(text=text, lang='en').save(AUDIO_OUTPUT_PATH)
    # Hand back the file path, not the audio data itself.
    return AUDIO_OUTPUT_PATH
def search_dad_jokes(term: str) -> tuple[str, str]:
    """A tool that searches for dad jokes containing a specific term.

    Args:
        term: The keyword to search for in dad jokes.

    Returns:
        A ``(text, audio_path)`` pair: the joke listing (or a "no jokes found" /
        error message) and the path of the audio file that speak_text produced
        for that text.
    """
    headers = {
        "Accept": "application/json",
        "User-Agent": "YourAppName (https://yourappurl.com)"
    }
    try:
        # Passing the term through `params` lets requests URL-encode it, so
        # spaces or "&" in the keyword cannot corrupt the query string.
        response = requests.get(
            "https://icanhazdadjoke.com/search",
            params={"term": term},
            headers=headers,
            timeout=10,  # do not hang the UI on an unresponsive server
        )
        response.raise_for_status()
        data = response.json()
        jokes = [joke['joke'] for joke in data['results']]
        if jokes:
            response_text = f"Found {len(jokes)} jokes:\n" + "\n\n".join(jokes)
        else:
            response_text = f"No jokes found for the term '{term}'."
    except (requests.RequestException, ValueError, KeyError, TypeError) as e:
        # Network/HTTP failures, a non-JSON body, or an unexpected payload
        # shape are all reported as text instead of crashing the caller.
        response_text = f"Error searching for jokes: {str(e)}"

    # Generate audio using gTTS
    audio_file = speak_text(response_text)
    return response_text, audio_file  # Return text and audio file path
# The agent's tool list is expected to hold smolagents Tool objects, so the
# plain functions are wrapped with the `tool` helper imported from smolagents.
# The original function names are left untouched and remain directly callable.
lookup_definition_tool = tool(lookup_definition)
text_to_speech_tool = tool(text_to_speech)
dad_jokes_tool = tool(search_dad_jokes)

# Ready-made tool instances
final_answer = FinalAnswerTool()
web_search_tool = DuckDuckGoSearchTool()
visit_webpage_tool = VisitWebpageTool()
# If the agent does not answer, the model is probably overloaded; switch to another model
# or to the following Hugging Face endpoint, which also serves Qwen2.5 Coder:
# model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'
model = HfApiModel(
    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',  # this model may be overloaded at times
    max_tokens=2096,
    temperature=0.5,
    custom_role_conversions=None,
)
# Import tool from Hub
# NOTE(review): trust_remote_code=True is passed to load_tool for a Hub
# repository -- confirm that the repository is trusted.
image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)

# Load the agent's prompt templates; the explicit encoding keeps the result
# independent of the platform's default locale.
with open("prompts.yaml", 'r', encoding="utf-8") as stream:
    prompt_templates = yaml.safe_load(stream)
agent = CodeAgent(
    model=model,
    # Add your tools here (don't remove final_answer).
    tools=[
        visit_webpage_tool,
        web_search_tool,
        final_answer,
        image_generation_tool,
        lookup_definition_tool,
        text_to_speech_tool,
        dad_jokes_tool,
    ],
    max_steps=6,
    verbosity_level=1,
    grammar=None,
    planning_interval=None,
    name=None,
    description=None,
    prompt_templates=prompt_templates,
)
# Gradio callback producing both text and audio output
def gradio_search_jokes(word):
    """Gradio wrapper: run search_dad_jokes for `word` and pass on its text and audio path."""
    # search_dad_jokes must return a (text, file path) pair for this unpacking to work.
    jokes_text, audio_path = search_dad_jokes(word)
    return jokes_text, audio_path
# Define the Gradio UI
# NOTE(review): the original indentation was lost; the nesting below (three
# components inside the row, button underneath it) is assumed -- confirm.
with gr.Blocks() as demo:
    gr.Markdown("### Dad Jokes Finder with AI & Text-to-Speech 🎙️")

    with gr.Row():
        input_box = gr.Textbox(label="Enter a word")
        output_text = gr.Textbox(label="Jokes Found")
        output_audio = gr.Audio(label="Audio Pronunciation", type="filepath")

    btn = gr.Button("Get Jokes")
    # A click sends the textbox value to gradio_search_jokes and fills both outputs.
    btn.click(gradio_search_jokes, inputs=input_box, outputs=[output_text, output_audio])

demo.launch()
# Disabled alternative entry point:
# GradioUI(agent).launch()