|
from dataclasses import dataclass, field
|
|
|
|
from browsergym.utils.obs import flatten_axtree_to_str
|
|
|
|
from openhands.core.schema import ActionType, ObservationType
|
|
from openhands.events.observation.observation import Observation
|
|
|
|
|
|
@dataclass
|
|
class BrowserOutputObservation(Observation):
|
|
"""This data class represents the output of a browser."""
|
|
|
|
url: str
|
|
trigger_by_action: str
|
|
screenshot: str = field(repr=False, default='')
|
|
error: bool = False
|
|
observation: str = ObservationType.BROWSE
|
|
|
|
open_pages_urls: list = field(default_factory=list)
|
|
active_page_index: int = -1
|
|
dom_object: dict = field(default_factory=dict, repr=False)
|
|
axtree_object: dict = field(default_factory=dict, repr=False)
|
|
extra_element_properties: dict = field(
|
|
default_factory=dict, repr=False
|
|
)
|
|
last_browser_action: str = ''
|
|
last_browser_action_error: str = ''
|
|
focused_element_bid: str = ''
|
|
|
|
@property
|
|
def message(self) -> str:
|
|
return 'Visited ' + self.url
|
|
|
|
def __str__(self) -> str:
|
|
ret = (
|
|
'**BrowserOutputObservation**\n'
|
|
f'URL: {self.url}\n'
|
|
f'Error: {self.error}\n'
|
|
f'Open pages: {self.open_pages_urls}\n'
|
|
f'Active page index: {self.active_page_index}\n'
|
|
f'Last browser action: {self.last_browser_action}\n'
|
|
f'Last browser action error: {self.last_browser_action_error}\n'
|
|
f'Focused element bid: {self.focused_element_bid}\n'
|
|
)
|
|
ret += '--- Agent Observation ---\n'
|
|
ret += self.get_agent_obs_text()
|
|
return ret
|
|
|
|
def get_agent_obs_text(self) -> str:
|
|
"""Get a concise text that will be shown to the agent."""
|
|
if self.trigger_by_action == ActionType.BROWSE_INTERACTIVE:
|
|
text = f'[Current URL: {self.url}]\n'
|
|
text += f'[Focused element bid: {self.focused_element_bid}]\n\n'
|
|
if self.error:
|
|
text += (
|
|
'================ BEGIN error message ===============\n'
|
|
'The following error occurred when executing the last action:\n'
|
|
f'{self.last_browser_action_error}\n'
|
|
'================ END error message ===============\n'
|
|
)
|
|
else:
|
|
text += '[Action executed successfully.]\n'
|
|
try:
|
|
|
|
|
|
|
|
cur_axtree_txt = self.get_axtree_str(filter_visible_only=False)
|
|
text += (
|
|
f'============== BEGIN accessibility tree ==============\n'
|
|
f'{cur_axtree_txt}\n'
|
|
f'============== END accessibility tree ==============\n'
|
|
)
|
|
except Exception as e:
|
|
text += (
|
|
f'\n[Error encountered when processing the accessibility tree: {e}]'
|
|
)
|
|
return text
|
|
|
|
elif self.trigger_by_action == ActionType.BROWSE:
|
|
text = f'[Current URL: {self.url}]\n'
|
|
if self.error:
|
|
text += (
|
|
'================ BEGIN error message ===============\n'
|
|
'The following error occurred when trying to visit the URL:\n'
|
|
f'{self.last_browser_action_error}\n'
|
|
'================ END error message ===============\n'
|
|
)
|
|
text += '============== BEGIN webpage content ==============\n'
|
|
text += self.content
|
|
text += '\n============== END webpage content ==============\n'
|
|
return text
|
|
else:
|
|
raise ValueError(f'Invalid trigger_by_action: {self.trigger_by_action}')
|
|
|
|
def get_axtree_str(self, filter_visible_only: bool = False) -> str:
|
|
cur_axtree_txt = flatten_axtree_to_str(
|
|
self.axtree_object,
|
|
extra_properties=self.extra_element_properties,
|
|
with_clickable=True,
|
|
skip_generic=False,
|
|
filter_visible_only=filter_visible_only,
|
|
)
|
|
return cur_axtree_txt
|
|
|