Spaces:

Boobs00
/

use

Configuration error

use / tests /test_vision.py

Upload folder using huggingface_hub

db4810d verified 10 months ago

1.45 kB

	"""
	Simple try of the agent.

	@dev You need to add OPENAI_API_KEY to your environment variables.
	"""

	import os
	import sys
	from pprint import pprint

	import pytest

	from browser_use.browser.browser import Browser, BrowserConfig

	sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))

	from langchain_openai import ChatOpenAI

	from browser_use import Agent, AgentHistoryList, Controller

	llm = ChatOpenAI(model='gpt-4o')
	controller = Controller()

	# use this test to ask the model questions about the page like
	# which color do you see for bbox labels, list all with their label
	# whats the smallest bboxes with labels and


	@controller.registry.action(description='explain what you see on the screen and ask user for input')
	async def explain_screen(text: str) -> str:
	pprint(text)
	answer = input('\nuser input next question: \n')
	return answer


	@controller.registry.action(description='done')
	async def done(text: str) -> str:
	# pprint(text)
	return 'call explain_screen'


	agent = Agent(
	task='call explain_screen all the time the user asks you questions e.g. about the page like bbox which you see are labels - your task is to expalin it and get the next question',
	llm=llm,
	controller=controller,
	browser=Browser(config=BrowserConfig(disable_security=True, headless=False)),
	)


	@pytest.mark.skip(reason='this is for local testing only')
	async def test_vision():
	history: AgentHistoryList = await agent.run(20)