MultiAgentExamples-AliA / image_agent.py
AliA1997
Completed some demos from huggingface tutorials.
8bed67e
import os
import PIL
import requests
from io import BytesIO
from PIL import Image
from smolagents import CodeAgent, OpenAIServerModel, InferenceClientModel
from huggingface_hub import login
# Source thumbnails; they are downloaded when this module is imported.
image_urls = [
    "https://encrypted-tbn0.gstatic.com/images?q=tbn:ANd9GcTcB9-ieIzm2uhtTkMkV5F50xbL4itvh3j8bg&s",  # Joker image
    "https://encrypted-tbn0.gstatic.com/images?q=tbn:ANd9GcR0SWQC74KuQWrJA33pJqUmOuDx62K7p1uEcQ&s",  # Joker image
]

# Browser-like User-Agent sent with every download. Built once, outside the
# loop, because it does not change between requests.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/114.0.0.0 Safari/537.36"
}

# Successfully decoded images (converted to RGB), in the order of image_urls.
# URLs that fail to download or decode are skipped, so this list may be
# shorter than image_urls.
stored_images = []
for url in image_urls:
    try:
        # `headers` must be passed by keyword: the second positional argument
        # of requests.get() is `params`, which would append the User-Agent to
        # the query string instead of sending it as an HTTP header.
        # The timeout keeps a stalled server from hanging the import forever.
        response = requests.get(url, headers=headers, timeout=30)
    except requests.RequestException as exc:
        print(f"⚠️ Could not download {url}: {exc}")
        continue

    try:
        image = Image.open(BytesIO(response.content)).convert("RGB")
    except PIL.UnidentifiedImageError:
        print("⚠️ The downloaded file is not a valid image.")
        # Keep the raw bytes for inspection; the file is overwritten on each
        # failure, so it only ever holds the most recent bad payload.
        with open("debug_image.bin", "wb") as f:
            f.write(response.content)
    else:
        stored_images.append(image)
def init_stored_image_agent() -> CodeAgent:
    """Create the agent used to classify the stored images.

    The agent is a tool-less ``CodeAgent`` backed by an ``OpenAIServerModel``
    configured with the ``gpt-4o`` model id. It is limited to 5 steps and
    runs with verbosity level 2.

    Per the original author's note, the agent is meant to be asked whether
    the images show Wonder Woman or the Joker; the images themselves are not
    attached here and are presumably supplied by the caller when the agent
    is run.

    Returns:
        A freshly constructed ``CodeAgent``.
    """
    return CodeAgent(
        tools=[],
        model=OpenAIServerModel(model_id="gpt-4o"),
        max_steps=5,
        verbosity_level=2,
    )