| from dataclasses import dataclass, field
|
|
|
| from browsergym.utils.obs import flatten_axtree_to_str
|
|
|
| from openhands.core.schema import ActionType, ObservationType
|
| from openhands.events.observation.observation import Observation
|
|
|
|
|
| @dataclass
|
| class BrowserOutputObservation(Observation):
|
| """This data class represents the output of a browser."""
|
|
|
| url: str
|
| trigger_by_action: str
|
| screenshot: str = field(repr=False, default='')
|
| error: bool = False
|
| observation: str = ObservationType.BROWSE
|
|
|
| open_pages_urls: list = field(default_factory=list)
|
| active_page_index: int = -1
|
| dom_object: dict = field(default_factory=dict, repr=False)
|
| axtree_object: dict = field(default_factory=dict, repr=False)
|
| extra_element_properties: dict = field(
|
| default_factory=dict, repr=False
|
| )
|
| last_browser_action: str = ''
|
| last_browser_action_error: str = ''
|
| focused_element_bid: str = ''
|
|
|
| @property
|
| def message(self) -> str:
|
| return 'Visited ' + self.url
|
|
|
| def __str__(self) -> str:
|
| ret = (
|
| '**BrowserOutputObservation**\n'
|
| f'URL: {self.url}\n'
|
| f'Error: {self.error}\n'
|
| f'Open pages: {self.open_pages_urls}\n'
|
| f'Active page index: {self.active_page_index}\n'
|
| f'Last browser action: {self.last_browser_action}\n'
|
| f'Last browser action error: {self.last_browser_action_error}\n'
|
| f'Focused element bid: {self.focused_element_bid}\n'
|
| )
|
| ret += '--- Agent Observation ---\n'
|
| ret += self.get_agent_obs_text()
|
| return ret
|
|
|
| def get_agent_obs_text(self) -> str:
|
| """Get a concise text that will be shown to the agent."""
|
| if self.trigger_by_action == ActionType.BROWSE_INTERACTIVE:
|
| text = f'[Current URL: {self.url}]\n'
|
| text += f'[Focused element bid: {self.focused_element_bid}]\n\n'
|
| if self.error:
|
| text += (
|
| '================ BEGIN error message ===============\n'
|
| 'The following error occurred when executing the last action:\n'
|
| f'{self.last_browser_action_error}\n'
|
| '================ END error message ===============\n'
|
| )
|
| else:
|
| text += '[Action executed successfully.]\n'
|
| try:
|
|
|
|
|
|
|
| cur_axtree_txt = self.get_axtree_str(filter_visible_only=False)
|
| text += (
|
| f'============== BEGIN accessibility tree ==============\n'
|
| f'{cur_axtree_txt}\n'
|
| f'============== END accessibility tree ==============\n'
|
| )
|
| except Exception as e:
|
| text += (
|
| f'\n[Error encountered when processing the accessibility tree: {e}]'
|
| )
|
| return text
|
|
|
| elif self.trigger_by_action == ActionType.BROWSE:
|
| text = f'[Current URL: {self.url}]\n'
|
| if self.error:
|
| text += (
|
| '================ BEGIN error message ===============\n'
|
| 'The following error occurred when trying to visit the URL:\n'
|
| f'{self.last_browser_action_error}\n'
|
| '================ END error message ===============\n'
|
| )
|
| text += '============== BEGIN webpage content ==============\n'
|
| text += self.content
|
| text += '\n============== END webpage content ==============\n'
|
| return text
|
| else:
|
| raise ValueError(f'Invalid trigger_by_action: {self.trigger_by_action}')
|
|
|
| def get_axtree_str(self, filter_visible_only: bool = False) -> str:
|
| cur_axtree_txt = flatten_axtree_to_str(
|
| self.axtree_object,
|
| extra_properties=self.extra_element_properties,
|
| with_clickable=True,
|
| skip_generic=False,
|
| filter_visible_only=filter_visible_only,
|
| )
|
| return cur_axtree_txt
|
|
|