├── .gitignore ├── LICENSE ├── README.md ├── README_ZH.md ├── assets ├── .DS_Store ├── ToolLLaMA-logo.png ├── ToolLLaMA.png ├── answer_anno.png ├── comparison.png ├── instructiongeneration.png ├── overview.png ├── paper.pdf ├── performance.png └── toolbench-demo.mp4 ├── data_example ├── answer │ ├── .DS_Store │ ├── G1_answer │ │ ├── 10_ChatGPT_DFS_woFilter_w2.json │ │ ├── 11_ChatGPT_DFS_woFilter_w2.json │ │ ├── 57_ChatGPT_DFS_woFilter_w2.json │ │ ├── 59_ChatGPT_DFS_woFilter_w2.json │ │ └── 69_ChatGPT_DFS_woFilter_w2.json │ ├── G2_answer │ │ ├── 102_ChatGPT_DFS_woFilter_w2.json │ │ ├── 10_ChatGPT_DFS_woFilter_w2.json │ │ ├── 119_ChatGPT_DFS_woFilter_w2.json │ │ ├── 127_ChatGPT_DFS_woFilter_w2.json │ │ └── 52_ChatGPT_DFS_woFilter_w2.json │ └── G3_answer │ │ ├── 13_ChatGPT_DFS_woFilter_w2.json │ │ ├── 15_ChatGPT_DFS_woFilter_w2.json │ │ ├── 21_ChatGPT_DFS_woFilter_w2.json │ │ ├── 3_ChatGPT_DFS_woFilter_w2.json │ │ └── 8_ChatGPT_DFS_woFilter_w2.json ├── instruction │ ├── G1_query.json │ ├── G2_query.json │ ├── G3_query.json │ ├── inference_query_demo.json │ └── inference_query_demo_open_domain.json └── toolenv │ ├── .DS_Store │ ├── response_examples │ ├── .DS_Store │ ├── Advertising │ │ ├── privatepublicapi.json │ │ ├── publicapitestinginbox.json │ │ └── putreq.json │ ├── Artificial_Intelligence_Machine_Learning │ │ ├── speech_recognition.json │ │ ├── stable_diffusion_v2.json │ │ └── starpredictai_ai_powered_text_review_star_predictor.json │ ├── Business │ │ ├── abuse_ip_check.json │ │ ├── acopaer.json │ │ └── acrosuite_oauther.json │ ├── Commerce │ │ ├── ado_stock.json │ │ ├── aliexpress_true_api.json │ │ └── aliexpress_unofficial.json │ └── Gaming │ │ ├── csgo_matches_and_tournaments.json │ │ ├── demo_project_v2.json │ │ └── dice_roll_simulator.json │ └── tools │ ├── .DS_Store │ ├── Advertising │ ├── .DS_Store │ ├── bog_boi_api │ │ └── api.py │ ├── bty690warped │ │ └── api.py │ └── buy_gmail_accounts │ │ └── api.py │ ├── Artificial_Intelligence_Machine_Learning │ ├── .DS_Store │ ├── b2b_sales_forecasting │ │ └── api.py │ ├── bard │ │ └── api.py │ └── bard_api │ │ └── api.py │ ├── Business │ ├── .DS_Store │ ├── contacts_api │ │ └── api.py │ ├── contus_mirrorfly │ │ └── api.py │ └── crime_rate │ │ └── api.py │ ├── Commerce │ ├── .DS_Store │ ├── amazon_data_scapper │ │ └── api.py │ ├── api_shopping │ │ └── api.py │ └── codeepy_vispox │ │ └── api.py │ └── Music │ ├── .DS_Store │ ├── genius_song_lyrics │ └── api.py │ ├── getsongs │ └── api.py │ └── kooed │ └── api.py ├── docs └── index.html ├── ds_configs ├── stage2.json └── stage3.json ├── preprocess ├── preprocess_retriever_data.py └── preprocess_toolllama_data.py ├── requirements.txt ├── scripts ├── inference_chatgpt_pipeline.sh ├── inference_chatgpt_pipeline_w_rapidapi_key.sh ├── inference_davinci_pipeline.sh ├── inference_toolllama_lora_pipeline.sh ├── inference_toolllama_lora_pipeline_open_domain.sh ├── inference_toolllama_pipeline.sh ├── preprocess_retriever_data.sh ├── preprocess_toolllama_data.sh ├── train_retriever.sh ├── train_toolllama.sh └── train_toolllama_lora.sh └── toolbench ├── inference ├── Algorithms │ ├── DFS.py │ ├── __init__.py │ ├── base_search.py │ └── single_chain.py ├── Downstream_tasks │ ├── __init__.py │ ├── base_env.py │ └── rapidapi.py ├── LLM │ ├── __init__.py │ ├── base_io.py │ ├── chatgpt_function_model.py │ ├── davinci_model.py │ ├── llama_model.py │ ├── retriever.py │ ├── tool_llama_lora_model.py │ └── tool_llama_model.py ├── LLM_rank │ ├── __init__.py │ └── rank_candidate.py ├── Prompts │ ├── ReAct_prompts.py │ ├── Tree_search_prompts.py │ ├── __init__.py │ └── rank_prompts.py ├── Tree │ ├── Tree.py │ └── __init__.py ├── callbacks │ └── ServerEventCallback.py ├── qa_pipeline.py ├── qa_pipeline_open_domain.py ├── server.py ├── toolbench_server.py └── utils.py ├── model ├── __init__.py ├── apply_delta.py ├── compression.py ├── make_delta.py └── model_adapter.py ├── retrieval ├── api_evaluator.py ├── inference_example.py └── train.py ├── tool_conversation.py ├── tooleval ├── README.md ├── README_ZH.md ├── __init__.py ├── automatic_eval_sample.py ├── convert_answers.py ├── convert_to_answer_format.py ├── dataset │ └── __init__.py ├── eval_and_update_leaderboard.py ├── eval_pass_rate.py ├── eval_preference.py ├── evaluation │ ├── __init__.py │ ├── dataclass.py │ ├── methodcls.py │ └── usereval.py ├── evaluators │ ├── __init__.py │ ├── registered_cls │ │ ├── __init__.py │ │ ├── base.py │ │ ├── rtl.py │ │ ├── tooleval.py │ │ └── utils.py │ ├── tooleval_gpt-3.5-turbo_default │ │ ├── config.yaml │ │ └── template.txt │ ├── tooleval_gpt-3.5-turbo_fn │ │ ├── config.yaml │ │ └── template.txt │ └── tooleval_gpt-3.5-turbo_normalized │ │ ├── config.yaml │ │ └── template.txt ├── evaluators_comparison.py ├── requirements.txt ├── results │ ├── default_evalset │ │ ├── DFS │ │ │ └── win.csv │ │ └── gpt-3.5-turbo_CoT │ │ │ ├── G1_category.json │ │ │ ├── G1_instruction.json │ │ │ ├── G1_tool.json │ │ │ ├── G2_category.json │ │ │ ├── G2_instruction.json │ │ │ └── G3_instruction.json │ ├── leaderboard###default_evalset###tooleval_gpt-3.5-turbo_normalized###ChatGPT-DFSDT.csv │ └── leaderboard###default_evalset###tooleval_gpt-3.5-turbo_normalized###gpt-3.5-turbo_CoT.csv ├── run_convert_answer.sh ├── run_pass_rate.sh ├── run_preference.sh └── utils.py ├── train ├── llama_condense_monkey_patch.py ├── llama_flash_attn_monkey_patch.py ├── train.py ├── train_lora.py └── train_mem.py └── utils.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/README.md -------------------------------------------------------------------------------- /README_ZH.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/README_ZH.md -------------------------------------------------------------------------------- /assets/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/.DS_Store -------------------------------------------------------------------------------- /assets/ToolLLaMA-logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/ToolLLaMA-logo.png -------------------------------------------------------------------------------- /assets/ToolLLaMA.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/ToolLLaMA.png -------------------------------------------------------------------------------- /assets/answer_anno.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/answer_anno.png -------------------------------------------------------------------------------- /assets/comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/comparison.png -------------------------------------------------------------------------------- /assets/instructiongeneration.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/instructiongeneration.png -------------------------------------------------------------------------------- /assets/overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/overview.png -------------------------------------------------------------------------------- /assets/paper.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/paper.pdf -------------------------------------------------------------------------------- /assets/performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/performance.png -------------------------------------------------------------------------------- /assets/toolbench-demo.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/assets/toolbench-demo.mp4 -------------------------------------------------------------------------------- /data_example/answer/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/.DS_Store -------------------------------------------------------------------------------- /data_example/answer/G1_answer/10_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G1_answer/10_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G1_answer/11_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G1_answer/11_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G1_answer/57_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G1_answer/57_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G1_answer/59_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G1_answer/59_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G1_answer/69_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G1_answer/69_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G2_answer/102_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G2_answer/102_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G2_answer/10_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G2_answer/10_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G2_answer/119_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G2_answer/119_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G2_answer/127_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G2_answer/127_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G2_answer/52_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G2_answer/52_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G3_answer/13_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G3_answer/13_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G3_answer/15_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G3_answer/15_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G3_answer/21_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G3_answer/21_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G3_answer/3_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G3_answer/3_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/answer/G3_answer/8_ChatGPT_DFS_woFilter_w2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/answer/G3_answer/8_ChatGPT_DFS_woFilter_w2.json -------------------------------------------------------------------------------- /data_example/instruction/G1_query.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/instruction/G1_query.json -------------------------------------------------------------------------------- /data_example/instruction/G2_query.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/instruction/G2_query.json -------------------------------------------------------------------------------- /data_example/instruction/G3_query.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/instruction/G3_query.json -------------------------------------------------------------------------------- /data_example/instruction/inference_query_demo.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/instruction/inference_query_demo.json -------------------------------------------------------------------------------- /data_example/instruction/inference_query_demo_open_domain.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/instruction/inference_query_demo_open_domain.json -------------------------------------------------------------------------------- /data_example/toolenv/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/.DS_Store -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/.DS_Store -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Advertising/privatepublicapi.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/Advertising/privatepublicapi.json -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Advertising/publicapitestinginbox.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/Advertising/publicapitestinginbox.json -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Advertising/putreq.json: -------------------------------------------------------------------------------- 1 | { 2 | "api_list": [] 3 | } -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Artificial_Intelligence_Machine_Learning/speech_recognition.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/Artificial_Intelligence_Machine_Learning/speech_recognition.json -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Artificial_Intelligence_Machine_Learning/stable_diffusion_v2.json: -------------------------------------------------------------------------------- 1 | { 2 | "api_list": [] 3 | } -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Artificial_Intelligence_Machine_Learning/starpredictai_ai_powered_text_review_star_predictor.json: -------------------------------------------------------------------------------- 1 | { 2 | "api_list": [] 3 | } -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Business/abuse_ip_check.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/Business/abuse_ip_check.json -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Business/acopaer.json: -------------------------------------------------------------------------------- 1 | { 2 | "api_list": [] 3 | } -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Business/acrosuite_oauther.json: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Commerce/ado_stock.json: -------------------------------------------------------------------------------- 1 | { 2 | "api_list": [] 3 | } -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Commerce/aliexpress_true_api.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/Commerce/aliexpress_true_api.json -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Commerce/aliexpress_unofficial.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/Commerce/aliexpress_unofficial.json -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Gaming/csgo_matches_and_tournaments.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/Gaming/csgo_matches_and_tournaments.json -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Gaming/demo_project_v2.json: -------------------------------------------------------------------------------- 1 | { 2 | "api_list": [] 3 | } -------------------------------------------------------------------------------- /data_example/toolenv/response_examples/Gaming/dice_roll_simulator.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/response_examples/Gaming/dice_roll_simulator.json -------------------------------------------------------------------------------- /data_example/toolenv/tools/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/.DS_Store -------------------------------------------------------------------------------- /data_example/toolenv/tools/Advertising/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Advertising/.DS_Store -------------------------------------------------------------------------------- /data_example/toolenv/tools/Advertising/bog_boi_api/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Advertising/bog_boi_api/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Advertising/bty690warped/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Advertising/bty690warped/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Advertising/buy_gmail_accounts/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Advertising/buy_gmail_accounts/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Artificial_Intelligence_Machine_Learning/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Artificial_Intelligence_Machine_Learning/.DS_Store -------------------------------------------------------------------------------- /data_example/toolenv/tools/Artificial_Intelligence_Machine_Learning/b2b_sales_forecasting/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Artificial_Intelligence_Machine_Learning/b2b_sales_forecasting/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Artificial_Intelligence_Machine_Learning/bard/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Artificial_Intelligence_Machine_Learning/bard/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Artificial_Intelligence_Machine_Learning/bard_api/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Artificial_Intelligence_Machine_Learning/bard_api/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Business/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Business/.DS_Store -------------------------------------------------------------------------------- /data_example/toolenv/tools/Business/contacts_api/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Business/contacts_api/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Business/contus_mirrorfly/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Business/contus_mirrorfly/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Business/crime_rate/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Business/crime_rate/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Commerce/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Commerce/.DS_Store -------------------------------------------------------------------------------- /data_example/toolenv/tools/Commerce/amazon_data_scapper/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Commerce/amazon_data_scapper/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Commerce/api_shopping/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Commerce/api_shopping/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Commerce/codeepy_vispox/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Commerce/codeepy_vispox/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Music/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Music/.DS_Store -------------------------------------------------------------------------------- /data_example/toolenv/tools/Music/genius_song_lyrics/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Music/genius_song_lyrics/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Music/getsongs/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Music/getsongs/api.py -------------------------------------------------------------------------------- /data_example/toolenv/tools/Music/kooed/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/data_example/toolenv/tools/Music/kooed/api.py -------------------------------------------------------------------------------- /docs/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/docs/index.html -------------------------------------------------------------------------------- /ds_configs/stage2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/ds_configs/stage2.json -------------------------------------------------------------------------------- /ds_configs/stage3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/ds_configs/stage3.json -------------------------------------------------------------------------------- /preprocess/preprocess_retriever_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/preprocess/preprocess_retriever_data.py -------------------------------------------------------------------------------- /preprocess/preprocess_toolllama_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/preprocess/preprocess_toolllama_data.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/inference_chatgpt_pipeline.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/inference_chatgpt_pipeline.sh -------------------------------------------------------------------------------- /scripts/inference_chatgpt_pipeline_w_rapidapi_key.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/inference_chatgpt_pipeline_w_rapidapi_key.sh -------------------------------------------------------------------------------- /scripts/inference_davinci_pipeline.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/inference_davinci_pipeline.sh -------------------------------------------------------------------------------- /scripts/inference_toolllama_lora_pipeline.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/inference_toolllama_lora_pipeline.sh -------------------------------------------------------------------------------- /scripts/inference_toolllama_lora_pipeline_open_domain.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/inference_toolllama_lora_pipeline_open_domain.sh -------------------------------------------------------------------------------- /scripts/inference_toolllama_pipeline.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/inference_toolllama_pipeline.sh -------------------------------------------------------------------------------- /scripts/preprocess_retriever_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/preprocess_retriever_data.sh -------------------------------------------------------------------------------- /scripts/preprocess_toolllama_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/preprocess_toolllama_data.sh -------------------------------------------------------------------------------- /scripts/train_retriever.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/train_retriever.sh -------------------------------------------------------------------------------- /scripts/train_toolllama.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/train_toolllama.sh -------------------------------------------------------------------------------- /scripts/train_toolllama_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/scripts/train_toolllama_lora.sh -------------------------------------------------------------------------------- /toolbench/inference/Algorithms/DFS.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Algorithms/DFS.py -------------------------------------------------------------------------------- /toolbench/inference/Algorithms/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /toolbench/inference/Algorithms/base_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Algorithms/base_search.py -------------------------------------------------------------------------------- /toolbench/inference/Algorithms/single_chain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Algorithms/single_chain.py -------------------------------------------------------------------------------- /toolbench/inference/Downstream_tasks/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /toolbench/inference/Downstream_tasks/base_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Downstream_tasks/base_env.py -------------------------------------------------------------------------------- /toolbench/inference/Downstream_tasks/rapidapi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Downstream_tasks/rapidapi.py -------------------------------------------------------------------------------- /toolbench/inference/LLM/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /toolbench/inference/LLM/base_io.py: -------------------------------------------------------------------------------- 1 | import re 2 | 3 | def base_io(input_str): 4 | pass -------------------------------------------------------------------------------- /toolbench/inference/LLM/chatgpt_function_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/LLM/chatgpt_function_model.py -------------------------------------------------------------------------------- /toolbench/inference/LLM/davinci_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/LLM/davinci_model.py -------------------------------------------------------------------------------- /toolbench/inference/LLM/llama_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/LLM/llama_model.py -------------------------------------------------------------------------------- /toolbench/inference/LLM/retriever.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/LLM/retriever.py -------------------------------------------------------------------------------- /toolbench/inference/LLM/tool_llama_lora_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/LLM/tool_llama_lora_model.py -------------------------------------------------------------------------------- /toolbench/inference/LLM/tool_llama_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/LLM/tool_llama_model.py -------------------------------------------------------------------------------- /toolbench/inference/LLM_rank/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /toolbench/inference/LLM_rank/rank_candidate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/LLM_rank/rank_candidate.py -------------------------------------------------------------------------------- /toolbench/inference/Prompts/ReAct_prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Prompts/ReAct_prompts.py -------------------------------------------------------------------------------- /toolbench/inference/Prompts/Tree_search_prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Prompts/Tree_search_prompts.py -------------------------------------------------------------------------------- /toolbench/inference/Prompts/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /toolbench/inference/Prompts/rank_prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Prompts/rank_prompts.py -------------------------------------------------------------------------------- /toolbench/inference/Tree/Tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/Tree/Tree.py -------------------------------------------------------------------------------- /toolbench/inference/Tree/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /toolbench/inference/callbacks/ServerEventCallback.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/callbacks/ServerEventCallback.py -------------------------------------------------------------------------------- /toolbench/inference/qa_pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/qa_pipeline.py -------------------------------------------------------------------------------- /toolbench/inference/qa_pipeline_open_domain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/qa_pipeline_open_domain.py -------------------------------------------------------------------------------- /toolbench/inference/server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/server.py -------------------------------------------------------------------------------- /toolbench/inference/toolbench_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/toolbench_server.py -------------------------------------------------------------------------------- /toolbench/inference/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/inference/utils.py -------------------------------------------------------------------------------- /toolbench/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/model/__init__.py -------------------------------------------------------------------------------- /toolbench/model/apply_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/model/apply_delta.py -------------------------------------------------------------------------------- /toolbench/model/compression.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/model/compression.py -------------------------------------------------------------------------------- /toolbench/model/make_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/model/make_delta.py -------------------------------------------------------------------------------- /toolbench/model/model_adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/model/model_adapter.py -------------------------------------------------------------------------------- /toolbench/retrieval/api_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/retrieval/api_evaluator.py -------------------------------------------------------------------------------- /toolbench/retrieval/inference_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/retrieval/inference_example.py -------------------------------------------------------------------------------- /toolbench/retrieval/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/retrieval/train.py -------------------------------------------------------------------------------- /toolbench/tool_conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tool_conversation.py -------------------------------------------------------------------------------- /toolbench/tooleval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/README.md -------------------------------------------------------------------------------- /toolbench/tooleval/README_ZH.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/README_ZH.md -------------------------------------------------------------------------------- /toolbench/tooleval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /toolbench/tooleval/automatic_eval_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/automatic_eval_sample.py -------------------------------------------------------------------------------- /toolbench/tooleval/convert_answers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/convert_answers.py -------------------------------------------------------------------------------- /toolbench/tooleval/convert_to_answer_format.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/convert_to_answer_format.py -------------------------------------------------------------------------------- /toolbench/tooleval/dataset/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /toolbench/tooleval/eval_and_update_leaderboard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/eval_and_update_leaderboard.py -------------------------------------------------------------------------------- /toolbench/tooleval/eval_pass_rate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/eval_pass_rate.py -------------------------------------------------------------------------------- /toolbench/tooleval/eval_preference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/eval_preference.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluation/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluation/__init__.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluation/dataclass.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluation/dataclass.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluation/methodcls.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluation/methodcls.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluation/usereval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluation/usereval.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/__init__.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/registered_cls/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/registered_cls/__init__.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/registered_cls/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/registered_cls/base.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/registered_cls/rtl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/registered_cls/rtl.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/registered_cls/tooleval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/registered_cls/tooleval.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/registered_cls/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/registered_cls/utils.py -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_default/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_default/config.yaml -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_default/template.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_default/template.txt -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_fn/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_fn/config.yaml -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_fn/template.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_fn/template.txt -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_normalized/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_normalized/config.yaml -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_normalized/template.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators/tooleval_gpt-3.5-turbo_normalized/template.txt -------------------------------------------------------------------------------- /toolbench/tooleval/evaluators_comparison.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/evaluators_comparison.py -------------------------------------------------------------------------------- /toolbench/tooleval/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/requirements.txt -------------------------------------------------------------------------------- /toolbench/tooleval/results/default_evalset/DFS/win.csv: -------------------------------------------------------------------------------- 1 | ,Method,Win Rate,Std Error 2 | 0,DFS,, 3 | -------------------------------------------------------------------------------- /toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G1_category.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G1_category.json -------------------------------------------------------------------------------- /toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G1_instruction.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G1_instruction.json -------------------------------------------------------------------------------- /toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G1_tool.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G1_tool.json -------------------------------------------------------------------------------- /toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G2_category.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G2_category.json -------------------------------------------------------------------------------- /toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G2_instruction.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G2_instruction.json -------------------------------------------------------------------------------- /toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G3_instruction.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/results/default_evalset/gpt-3.5-turbo_CoT/G3_instruction.json -------------------------------------------------------------------------------- /toolbench/tooleval/results/leaderboard###default_evalset###tooleval_gpt-3.5-turbo_normalized###ChatGPT-DFSDT.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/results/leaderboard###default_evalset###tooleval_gpt-3.5-turbo_normalized###ChatGPT-DFSDT.csv -------------------------------------------------------------------------------- /toolbench/tooleval/results/leaderboard###default_evalset###tooleval_gpt-3.5-turbo_normalized###gpt-3.5-turbo_CoT.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/results/leaderboard###default_evalset###tooleval_gpt-3.5-turbo_normalized###gpt-3.5-turbo_CoT.csv -------------------------------------------------------------------------------- /toolbench/tooleval/run_convert_answer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/run_convert_answer.sh -------------------------------------------------------------------------------- /toolbench/tooleval/run_pass_rate.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/run_pass_rate.sh -------------------------------------------------------------------------------- /toolbench/tooleval/run_preference.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/run_preference.sh -------------------------------------------------------------------------------- /toolbench/tooleval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/tooleval/utils.py -------------------------------------------------------------------------------- /toolbench/train/llama_condense_monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/train/llama_condense_monkey_patch.py -------------------------------------------------------------------------------- /toolbench/train/llama_flash_attn_monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/train/llama_flash_attn_monkey_patch.py -------------------------------------------------------------------------------- /toolbench/train/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/train/train.py -------------------------------------------------------------------------------- /toolbench/train/train_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/train/train_lora.py -------------------------------------------------------------------------------- /toolbench/train/train_mem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/train/train_mem.py -------------------------------------------------------------------------------- /toolbench/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenBMB/ToolBench/HEAD/toolbench/utils.py --------------------------------------------------------------------------------