utils.py 2.6 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758
  1. import os
  2. from opendevin.core.exceptions import BrowserUnavailableException
  3. from opendevin.core.schema import ActionType
  4. from opendevin.events.action import BrowseInteractiveAction, BrowseURLAction
  5. from opendevin.events.observation import BrowserOutputObservation
  6. from opendevin.runtime.browser.browser_env import BrowserEnv
  7. async def browse(
  8. action: BrowseURLAction | BrowseInteractiveAction, browser: BrowserEnv | None
  9. ) -> BrowserOutputObservation:
  10. if browser is None:
  11. raise BrowserUnavailableException()
  12. if isinstance(action, BrowseURLAction):
  13. # legacy BrowseURLAction
  14. asked_url = action.url
  15. if not asked_url.startswith('http'):
  16. asked_url = os.path.abspath(os.curdir) + action.url
  17. action_str = f'goto("{asked_url}")'
  18. elif isinstance(action, BrowseInteractiveAction):
  19. # new BrowseInteractiveAction, supports full featured BrowserGym actions
  20. # action in BrowserGym: see https://github.com/ServiceNow/BrowserGym/blob/main/core/src/browsergym/core/action/functions.py
  21. action_str = action.browser_actions
  22. else:
  23. raise ValueError(f'Invalid action type: {action.action}')
  24. try:
  25. # obs provided by BrowserGym: see https://github.com/ServiceNow/BrowserGym/blob/main/core/src/browsergym/core/env.py#L396
  26. obs = browser.step(action_str)
  27. return BrowserOutputObservation(
  28. content=obs['text_content'], # text content of the page
  29. open_pages_urls=obs['open_pages_urls'], # list of open pages
  30. active_page_index=obs['active_page_index'], # index of the active page
  31. dom_object=obs['dom_object'], # DOM object
  32. axtree_object=obs['axtree_object'], # accessibility tree object
  33. extra_element_properties=obs[
  34. 'extra_element_properties'
  35. ], # extra element properties
  36. last_browser_action=obs['last_action'], # last browser env action performed
  37. focused_element_bid=obs['focused_element_bid'], # focused element bid
  38. screenshot=obs['screenshot'], # base64-encoded screenshot, png
  39. url=obs['url'], # URL of the page
  40. error=True if obs['last_action_error'] else False, # error flag
  41. last_browser_action_error=obs[
  42. 'last_action_error'
  43. ], # last browser env action error
  44. )
  45. except Exception as e:
  46. return BrowserOutputObservation(
  47. content=str(e),
  48. screenshot='',
  49. error=True,
  50. last_browser_action_error=str(e),
  51. url=asked_url if action.action == ActionType.BROWSE else '',
  52. )