Spaces:
Sleeping
Sleeping
File size: 4,065 Bytes
c8e2203 9b5b26a c19d193 e6f3222 6aae614 8fe992b 9b5b26a 5df72d6 9b5b26a 011563f e6f3222 9b5b26a e6f3222 011563f e6f3222 9b5b26a e6f3222 011563f 2a0b989 e6f3222 2a0b989 e6f3222 9b5b26a 8c01ffb df1e246 6aae614 ae7a494 e121372 bf6d34c 29ec968 fe328e0 13d500a 8c01ffb 9b5b26a 8c01ffb 861422e 9b5b26a 8c01ffb 8fe992b db0edd6 8c01ffb 861422e 8fe992b 9b5b26a 8c01ffb | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 | from smolagents import CodeAgent, DuckDuckGoSearchTool, HfApiModel, load_tool, tool
import datetime
import requests
import pytz
import yaml
import json
from bs4 import BeautifulSoup
from tools.final_answer import FinalAnswerTool
from Gradio_UI import GradioUI
# Custom tools made available to the agent.
@tool
def inspect_web_page(url: str, max_length: int = 5000) -> str:
    """
    Visits a web page, extracts the main text content, and returns it
    in a clean, readable format for the AI.

    Args:
        url (str): The valid URL of the website to visit (e.g., "https://example.com").
        max_length (int): The maximum number of characters to return. Defaults to 5000. Capped at 20000; negative values are treated as 0.

    Returns:
        str: A JSON formatted string containing the page title and clean body text,
        or an error message if the extraction failed.
    """
    # NOTE(review): the @tool decorator presumably parses this docstring to build
    # the tool description, so keep the Args section in sync with the signature.
    headers = {"User-Agent": "AI-Agent-Explorer/1.0"}
    HARD_LIMIT = 20000

    try:
        # Validate and clamp the budget before any network traffic: a negative
        # value would otherwise make the slice below count from the end of the
        # text, and a non-numeric value is reported without fetching the page.
        max_chars = max(0, min(HARD_LIMIT, int(max_length)))

        # 1. Fetch the page
        response = requests.get(url, headers=headers, timeout=10)
        response.raise_for_status()

        # 2. Parse HTML
        soup = BeautifulSoup(response.text, "html.parser")

        # 3. Remove scripts, styles, and page chrome to reduce noise
        for tag in soup(["script", "style", "nav", "footer", "header"]):
            tag.decompose()

        # 4. Extract the title. `.string` is None when <title> is empty or has
        #    nested markup, so use get_text() and fall back explicitly.
        page_title = soup.title.get_text(strip=True) if soup.title else ""
        if not page_title:
            page_title = "No Title"

        # 5. Collapse runs of whitespace inside each line and drop blank lines,
        #    keeping one output line per source line (not one per word).
        normalized_lines = (
            " ".join(line.split()) for line in soup.get_text().splitlines()
        )
        clean_text = "\n".join(line for line in normalized_lines if line)

        # 6. Limit text length to fit context windows
        if len(clean_text) > max_chars:
            clean_text = clean_text[:max_chars] + "... [Content Truncated]"

        # 7. Return structured result. ensure_ascii=False keeps non-ASCII text
        #    readable instead of expanding every character into a \uXXXX escape.
        return json.dumps(
            {
                "status": "success",
                "title": page_title,
                "content": clean_text,
            },
            indent=2,
            ensure_ascii=False,
        )
    except Exception as e:
        # Deliberately broad: a tool must hand the agent an error description
        # rather than raise, whatever went wrong (network, HTTP status, parsing).
        return json.dumps(
            {
                "status": "error",
                "message": str(e),
            },
            ensure_ascii=False,
        )
@tool
def get_current_time_in_timezone(timezone: str) -> str:
    """A tool that fetches the current local time in a specified timezone.
    Args:
        timezone: A string representing a valid timezone (e.g., 'America/New_York').
    """
    # NOTE(review): the @tool decorator presumably builds the tool description
    # from the docstring above, so its wording is left untouched.
    timestamp_format = "%Y-%m-%d %H:%M:%S"
    try:
        # Resolve the zone name, then read the clock directly in that zone.
        zone = pytz.timezone(timezone)
        now_in_zone = datetime.datetime.now(zone)
        local_time = now_in_zone.strftime(timestamp_format)
        return f"The current local time in {timezone} is: {local_time}"
    except Exception as err:
        # Any failure (e.g. an unknown zone name) is reported as text so the
        # agent receives a message instead of an exception.
        return f"Error fetching time for timezone '{timezone}': {str(err)}"
# Tools that are instantiated from classes rather than defined with @tool.
search_tool = DuckDuckGoSearchTool(max_results=10)
final_answer = FinalAnswerTool()

# If the agent does not answer, the model may be overloaded. Switch to another
# model, or to the following Hugging Face endpoint, which also serves Qwen2.5 Coder:
# model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'
model = HfApiModel(
    max_tokens=2096,
    temperature=0.5,
    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',  # this model may be overloaded at times
    custom_role_conversions=None,
)

# Import tool from Hub.
# NOTE(review): this tool is loaded but never added to the agent's `tools` list
# below; add it there or drop the load. `trust_remote_code=True` presumably
# allows code from the Hub repository to run locally -- confirm that is intended.
image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)

# Read the prompt templates with an explicit encoding so the result does not
# depend on the platform's default locale.
with open("prompts.yaml", "r", encoding="utf-8") as stream:
    prompt_templates = yaml.safe_load(stream)

agent = CodeAgent(
    model=model,
    tools=[search_tool, inspect_web_page, get_current_time_in_timezone, final_answer],  # add your tools here (don't remove final_answer)
    max_steps=6,
    verbosity_level=1,
    grammar=None,
    planning_interval=None,
    name=None,
    description=None,
    prompt_templates=prompt_templates,
)

# Start the web UI for the agent.
GradioUI(agent).launch()