├── .gitignore ├── CITATION.cff ├── LICENSE ├── README.md ├── agent ├── __init__.py ├── agent.py ├── prompts │ ├── __init__.py │ ├── jsons │ │ ├── p_cot_id_actree_2s.json │ │ ├── p_cot_id_actree_2s_no_na.json │ │ ├── p_cot_id_actree_3s.json │ │ ├── p_multimodal_cot_id_actree_3s.json │ │ └── p_som_cot_id_actree_3s.json │ ├── multimodal_examples │ │ ├── multimodal_example1.png │ │ ├── multimodal_example2.png │ │ └── multimodal_example3.png │ ├── prompt_constructor.py │ ├── raw │ │ ├── p_cot_id_actree_2s.py │ │ ├── p_cot_id_actree_2s_no_na.py │ │ ├── p_cot_id_actree_3s.py │ │ ├── p_multimodal_cot_id_actree_3s.py │ │ └── p_som_cot_id_actree_3s.py │ ├── som_examples │ │ ├── som_example1.png │ │ ├── som_example2.png │ │ └── som_example3.png │ └── to_json.py └── value_function.py ├── browser_env ├── __init__.py ├── actions.py ├── async_envs.py ├── auto_login.py ├── constants.py ├── env_config.py ├── envs.py ├── helper_functions.py ├── javascript │ ├── frame_mark_elements.js │ └── frame_unmark_elements.js ├── processors.py ├── py.typed ├── trajectory.py └── utils.py ├── coco_images ├── 000000000285.jpg ├── 000000022371.jpg ├── 000000023781.jpg ├── 000000024567.jpg ├── 000000029675.jpg ├── 000000029984.jpg ├── 000000039551.jpg ├── 000000048153.jpg ├── 000000048396.jpg ├── 000000048924.jpg ├── 000000050331.jpg ├── 000000058539.jpg ├── 000000058705.jpg ├── 000000060899.jpg ├── 000000064574.jpg ├── 000000064718.jpg ├── 000000066771.jpg ├── 000000084477.jpg ├── 000000097278.jpg ├── 000000102805.jpg ├── 000000136772.jpg ├── 000000161032.jpg ├── 000000162415.jpg ├── 000000163257.jpg ├── 000000163682.jpg ├── 000000166768.jpg ├── 000000167240.jpg ├── 000000167353.jpg ├── 000000172595.jpg ├── 000000173008.jpg ├── 000000175443.jpg ├── 000000176232.jpg ├── 000000286708.jpg ├── 000000324258.jpg ├── 000000324715.jpg ├── 000000327601.jpg ├── 000000329041.jpg ├── 000000348012.jpg ├── 000000399655.jpg ├── 000000415238.jpg ├── 000000433515.jpg ├── 000000440507.jpg ├── 000000444275.jpg ├── 000000513484.jpg └── 000000515982.jpg ├── config_files ├── vwa │ ├── test_classifieds.raw.json │ ├── test_reddit.raw.json │ └── test_shopping.raw.json └── wa │ └── test_webarena.raw.json ├── environment_docker ├── README.md └── webarena-homepage │ ├── app.py │ ├── static │ └── figures │ │ ├── calculator.png │ │ ├── classifieds.png │ │ ├── cms.png │ │ ├── gitlab.png │ │ ├── manual1.png │ │ ├── manual2.png │ │ ├── map.png │ │ ├── onestopshop.png │ │ ├── password.png │ │ ├── reddit.png │ │ ├── scratchpad.png │ │ └── wikipedia.png │ └── templates │ ├── calculator.html │ ├── index.html │ └── scratchpad.html ├── evaluation_harness ├── __init__.py ├── evaluators.py ├── helper_functions.py └── image_utils.py ├── llms ├── __init__.py ├── lm_config.py ├── providers │ ├── gemini_utils.py │ ├── hf_utils.py │ └── openai_utils.py ├── tokenizers.py └── utils.py ├── media ├── SourceCodePro-SemiBold.ttf ├── find_restaurant.gif ├── homepage_demo.png ├── overview.png ├── search_overview.gif └── som_figure.png ├── paper.pdf ├── prepare.sh ├── requirements.txt ├── run.py ├── run_demo.py ├── scripts ├── calc_breakdown_sr.py ├── check_error_runs.py ├── collect_obs.py ├── generate_test_data.py ├── reset_reddit.sh ├── reset_shopping.sh ├── run_llama_vwa_shopping_search.sh ├── run_shopping_som_search_batch.sh ├── run_vwa_classifieds_search.sh ├── run_vwa_reddit_search.sh ├── run_vwa_shopping_search.sh └── run_webarena_search.sh ├── setup.cfg ├── setup.py ├── tests ├── conftest.py ├── test_browser_env │ ├── sites │ │ └── new_tab.html │ ├── test_action_functionalities.py │ ├── test_actions.py │ ├── test_auth_cookie.py │ ├── test_playwright_actions.py │ └── test_script_browser_env.py └── test_evaluation_harness │ ├── configs │ ├── exact_image_failure.json │ ├── exact_image_resize_failure_1.json │ ├── exact_image_resize_failure_2.json │ ├── exact_image_resize_template.json │ ├── exact_image_success.json │ ├── func_eval_fail.json │ ├── func_eval_success.json │ ├── func_url_func_1.json │ ├── func_url_func_2.json │ ├── html_content_element_exact_match.json │ ├── html_content_exact_match.json │ ├── html_content_url_comb.json │ ├── html_required_values_failure_1.json │ ├── html_required_values_success_1.json │ ├── image_evaluator_yes.json │ ├── image_evaluator_yes_direct_img.json │ ├── image_evaluator_yes_no.json │ ├── string_match.json │ └── url_exact_match.json │ ├── test_exact_evaluators.py │ └── test_helper_functions.py └── wa_parallel_run.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/.gitignore -------------------------------------------------------------------------------- /CITATION.cff: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/CITATION.cff -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/README.md -------------------------------------------------------------------------------- /agent/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/__init__.py -------------------------------------------------------------------------------- /agent/agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/agent.py -------------------------------------------------------------------------------- /agent/prompts/__init__.py: -------------------------------------------------------------------------------- 1 | from .prompt_constructor import * 2 | -------------------------------------------------------------------------------- /agent/prompts/jsons/p_cot_id_actree_2s.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/jsons/p_cot_id_actree_2s.json -------------------------------------------------------------------------------- /agent/prompts/jsons/p_cot_id_actree_2s_no_na.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/jsons/p_cot_id_actree_2s_no_na.json -------------------------------------------------------------------------------- /agent/prompts/jsons/p_cot_id_actree_3s.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/jsons/p_cot_id_actree_3s.json -------------------------------------------------------------------------------- /agent/prompts/jsons/p_multimodal_cot_id_actree_3s.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/jsons/p_multimodal_cot_id_actree_3s.json -------------------------------------------------------------------------------- /agent/prompts/jsons/p_som_cot_id_actree_3s.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/jsons/p_som_cot_id_actree_3s.json -------------------------------------------------------------------------------- /agent/prompts/multimodal_examples/multimodal_example1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/multimodal_examples/multimodal_example1.png -------------------------------------------------------------------------------- /agent/prompts/multimodal_examples/multimodal_example2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/multimodal_examples/multimodal_example2.png -------------------------------------------------------------------------------- /agent/prompts/multimodal_examples/multimodal_example3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/multimodal_examples/multimodal_example3.png -------------------------------------------------------------------------------- /agent/prompts/prompt_constructor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/prompt_constructor.py -------------------------------------------------------------------------------- /agent/prompts/raw/p_cot_id_actree_2s.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/raw/p_cot_id_actree_2s.py -------------------------------------------------------------------------------- /agent/prompts/raw/p_cot_id_actree_2s_no_na.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/raw/p_cot_id_actree_2s_no_na.py -------------------------------------------------------------------------------- /agent/prompts/raw/p_cot_id_actree_3s.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/raw/p_cot_id_actree_3s.py -------------------------------------------------------------------------------- /agent/prompts/raw/p_multimodal_cot_id_actree_3s.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/raw/p_multimodal_cot_id_actree_3s.py -------------------------------------------------------------------------------- /agent/prompts/raw/p_som_cot_id_actree_3s.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/raw/p_som_cot_id_actree_3s.py -------------------------------------------------------------------------------- /agent/prompts/som_examples/som_example1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/som_examples/som_example1.png -------------------------------------------------------------------------------- /agent/prompts/som_examples/som_example2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/som_examples/som_example2.png -------------------------------------------------------------------------------- /agent/prompts/som_examples/som_example3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/som_examples/som_example3.png -------------------------------------------------------------------------------- /agent/prompts/to_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/prompts/to_json.py -------------------------------------------------------------------------------- /agent/value_function.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/agent/value_function.py -------------------------------------------------------------------------------- /browser_env/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/__init__.py -------------------------------------------------------------------------------- /browser_env/actions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/actions.py -------------------------------------------------------------------------------- /browser_env/async_envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/async_envs.py -------------------------------------------------------------------------------- /browser_env/auto_login.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/auto_login.py -------------------------------------------------------------------------------- /browser_env/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/constants.py -------------------------------------------------------------------------------- /browser_env/env_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/env_config.py -------------------------------------------------------------------------------- /browser_env/envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/envs.py -------------------------------------------------------------------------------- /browser_env/helper_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/helper_functions.py -------------------------------------------------------------------------------- /browser_env/javascript/frame_mark_elements.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/javascript/frame_mark_elements.js -------------------------------------------------------------------------------- /browser_env/javascript/frame_unmark_elements.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/javascript/frame_unmark_elements.js -------------------------------------------------------------------------------- /browser_env/processors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/processors.py -------------------------------------------------------------------------------- /browser_env/py.typed: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /browser_env/trajectory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/trajectory.py -------------------------------------------------------------------------------- /browser_env/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/browser_env/utils.py -------------------------------------------------------------------------------- /coco_images/000000000285.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000000285.jpg -------------------------------------------------------------------------------- /coco_images/000000022371.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000022371.jpg -------------------------------------------------------------------------------- /coco_images/000000023781.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000023781.jpg -------------------------------------------------------------------------------- /coco_images/000000024567.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000024567.jpg -------------------------------------------------------------------------------- /coco_images/000000029675.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000029675.jpg -------------------------------------------------------------------------------- /coco_images/000000029984.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000029984.jpg -------------------------------------------------------------------------------- /coco_images/000000039551.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000039551.jpg -------------------------------------------------------------------------------- /coco_images/000000048153.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000048153.jpg -------------------------------------------------------------------------------- /coco_images/000000048396.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000048396.jpg -------------------------------------------------------------------------------- /coco_images/000000048924.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000048924.jpg -------------------------------------------------------------------------------- /coco_images/000000050331.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000050331.jpg -------------------------------------------------------------------------------- /coco_images/000000058539.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000058539.jpg -------------------------------------------------------------------------------- /coco_images/000000058705.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000058705.jpg -------------------------------------------------------------------------------- /coco_images/000000060899.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000060899.jpg -------------------------------------------------------------------------------- /coco_images/000000064574.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000064574.jpg -------------------------------------------------------------------------------- /coco_images/000000064718.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000064718.jpg -------------------------------------------------------------------------------- /coco_images/000000066771.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000066771.jpg -------------------------------------------------------------------------------- /coco_images/000000084477.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000084477.jpg -------------------------------------------------------------------------------- /coco_images/000000097278.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000097278.jpg -------------------------------------------------------------------------------- /coco_images/000000102805.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000102805.jpg -------------------------------------------------------------------------------- /coco_images/000000136772.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000136772.jpg -------------------------------------------------------------------------------- /coco_images/000000161032.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000161032.jpg -------------------------------------------------------------------------------- /coco_images/000000162415.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000162415.jpg -------------------------------------------------------------------------------- /coco_images/000000163257.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000163257.jpg -------------------------------------------------------------------------------- /coco_images/000000163682.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000163682.jpg -------------------------------------------------------------------------------- /coco_images/000000166768.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000166768.jpg -------------------------------------------------------------------------------- /coco_images/000000167240.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000167240.jpg -------------------------------------------------------------------------------- /coco_images/000000167353.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000167353.jpg -------------------------------------------------------------------------------- /coco_images/000000172595.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000172595.jpg -------------------------------------------------------------------------------- /coco_images/000000173008.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000173008.jpg -------------------------------------------------------------------------------- /coco_images/000000175443.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000175443.jpg -------------------------------------------------------------------------------- /coco_images/000000176232.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000176232.jpg -------------------------------------------------------------------------------- /coco_images/000000286708.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000286708.jpg -------------------------------------------------------------------------------- /coco_images/000000324258.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000324258.jpg -------------------------------------------------------------------------------- /coco_images/000000324715.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000324715.jpg -------------------------------------------------------------------------------- /coco_images/000000327601.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000327601.jpg -------------------------------------------------------------------------------- /coco_images/000000329041.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000329041.jpg -------------------------------------------------------------------------------- /coco_images/000000348012.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000348012.jpg -------------------------------------------------------------------------------- /coco_images/000000399655.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000399655.jpg -------------------------------------------------------------------------------- /coco_images/000000415238.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000415238.jpg -------------------------------------------------------------------------------- /coco_images/000000433515.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000433515.jpg -------------------------------------------------------------------------------- /coco_images/000000440507.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000440507.jpg -------------------------------------------------------------------------------- /coco_images/000000444275.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000444275.jpg -------------------------------------------------------------------------------- /coco_images/000000513484.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000513484.jpg -------------------------------------------------------------------------------- /coco_images/000000515982.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/coco_images/000000515982.jpg -------------------------------------------------------------------------------- /config_files/vwa/test_classifieds.raw.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/config_files/vwa/test_classifieds.raw.json -------------------------------------------------------------------------------- /config_files/vwa/test_reddit.raw.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/config_files/vwa/test_reddit.raw.json -------------------------------------------------------------------------------- /config_files/vwa/test_shopping.raw.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/config_files/vwa/test_shopping.raw.json -------------------------------------------------------------------------------- /config_files/wa/test_webarena.raw.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/config_files/wa/test_webarena.raw.json -------------------------------------------------------------------------------- /environment_docker/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/README.md -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/app.py -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/calculator.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/calculator.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/classifieds.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/classifieds.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/cms.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/cms.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/gitlab.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/gitlab.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/manual1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/manual1.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/manual2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/manual2.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/map.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/map.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/onestopshop.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/onestopshop.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/password.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/password.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/reddit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/reddit.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/scratchpad.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/scratchpad.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/static/figures/wikipedia.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/static/figures/wikipedia.png -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/templates/calculator.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/templates/calculator.html -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/templates/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/templates/index.html -------------------------------------------------------------------------------- /environment_docker/webarena-homepage/templates/scratchpad.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/environment_docker/webarena-homepage/templates/scratchpad.html -------------------------------------------------------------------------------- /evaluation_harness/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/evaluation_harness/__init__.py -------------------------------------------------------------------------------- /evaluation_harness/evaluators.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/evaluation_harness/evaluators.py -------------------------------------------------------------------------------- /evaluation_harness/helper_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/evaluation_harness/helper_functions.py -------------------------------------------------------------------------------- /evaluation_harness/image_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/evaluation_harness/image_utils.py -------------------------------------------------------------------------------- /llms/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/llms/__init__.py -------------------------------------------------------------------------------- /llms/lm_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/llms/lm_config.py -------------------------------------------------------------------------------- /llms/providers/gemini_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/llms/providers/gemini_utils.py -------------------------------------------------------------------------------- /llms/providers/hf_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/llms/providers/hf_utils.py -------------------------------------------------------------------------------- /llms/providers/openai_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/llms/providers/openai_utils.py -------------------------------------------------------------------------------- /llms/tokenizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/llms/tokenizers.py -------------------------------------------------------------------------------- /llms/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/llms/utils.py -------------------------------------------------------------------------------- /media/SourceCodePro-SemiBold.ttf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/media/SourceCodePro-SemiBold.ttf -------------------------------------------------------------------------------- /media/find_restaurant.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/media/find_restaurant.gif -------------------------------------------------------------------------------- /media/homepage_demo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/media/homepage_demo.png -------------------------------------------------------------------------------- /media/overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/media/overview.png -------------------------------------------------------------------------------- /media/search_overview.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/media/search_overview.gif -------------------------------------------------------------------------------- /media/som_figure.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/media/som_figure.png -------------------------------------------------------------------------------- /paper.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/paper.pdf -------------------------------------------------------------------------------- /prepare.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/prepare.sh -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/requirements.txt -------------------------------------------------------------------------------- /run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/run.py -------------------------------------------------------------------------------- /run_demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/run_demo.py -------------------------------------------------------------------------------- /scripts/calc_breakdown_sr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/calc_breakdown_sr.py -------------------------------------------------------------------------------- /scripts/check_error_runs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/check_error_runs.py -------------------------------------------------------------------------------- /scripts/collect_obs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/collect_obs.py -------------------------------------------------------------------------------- /scripts/generate_test_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/generate_test_data.py -------------------------------------------------------------------------------- /scripts/reset_reddit.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/reset_reddit.sh -------------------------------------------------------------------------------- /scripts/reset_shopping.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/reset_shopping.sh -------------------------------------------------------------------------------- /scripts/run_llama_vwa_shopping_search.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/run_llama_vwa_shopping_search.sh -------------------------------------------------------------------------------- /scripts/run_shopping_som_search_batch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/run_shopping_som_search_batch.sh -------------------------------------------------------------------------------- /scripts/run_vwa_classifieds_search.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/run_vwa_classifieds_search.sh -------------------------------------------------------------------------------- /scripts/run_vwa_reddit_search.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/run_vwa_reddit_search.sh -------------------------------------------------------------------------------- /scripts/run_vwa_shopping_search.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/run_vwa_shopping_search.sh -------------------------------------------------------------------------------- /scripts/run_webarena_search.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/scripts/run_webarena_search.sh -------------------------------------------------------------------------------- /setup.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/setup.cfg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/setup.py -------------------------------------------------------------------------------- /tests/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/conftest.py -------------------------------------------------------------------------------- /tests/test_browser_env/sites/new_tab.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_browser_env/sites/new_tab.html -------------------------------------------------------------------------------- /tests/test_browser_env/test_action_functionalities.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_browser_env/test_action_functionalities.py -------------------------------------------------------------------------------- /tests/test_browser_env/test_actions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_browser_env/test_actions.py -------------------------------------------------------------------------------- /tests/test_browser_env/test_auth_cookie.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_browser_env/test_auth_cookie.py -------------------------------------------------------------------------------- /tests/test_browser_env/test_playwright_actions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_browser_env/test_playwright_actions.py -------------------------------------------------------------------------------- /tests/test_browser_env/test_script_browser_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_browser_env/test_script_browser_env.py -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/exact_image_failure.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/exact_image_failure.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/exact_image_resize_failure_1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/exact_image_resize_failure_1.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/exact_image_resize_failure_2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/exact_image_resize_failure_2.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/exact_image_resize_template.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/exact_image_resize_template.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/exact_image_success.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/exact_image_success.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/func_eval_fail.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/func_eval_fail.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/func_eval_success.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/func_eval_success.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/func_url_func_1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/func_url_func_1.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/func_url_func_2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/func_url_func_2.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/html_content_element_exact_match.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/html_content_element_exact_match.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/html_content_exact_match.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/html_content_exact_match.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/html_content_url_comb.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/html_content_url_comb.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/html_required_values_failure_1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/html_required_values_failure_1.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/html_required_values_success_1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/html_required_values_success_1.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/image_evaluator_yes.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/image_evaluator_yes.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/image_evaluator_yes_direct_img.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/image_evaluator_yes_direct_img.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/image_evaluator_yes_no.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/image_evaluator_yes_no.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/string_match.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/string_match.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/configs/url_exact_match.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/configs/url_exact_match.json -------------------------------------------------------------------------------- /tests/test_evaluation_harness/test_exact_evaluators.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/test_exact_evaluators.py -------------------------------------------------------------------------------- /tests/test_evaluation_harness/test_helper_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/tests/test_evaluation_harness/test_helper_functions.py -------------------------------------------------------------------------------- /wa_parallel_run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kohjingyu/search-agents/HEAD/wa_parallel_run.sh --------------------------------------------------------------------------------