├── .gitignore ├── .gitmodules ├── LICENSE ├── README.md ├── docs ├── DATA_GENERATION.md ├── EVALUATION.md ├── KUBERNETES_DEPLOY.md └── MODEL_TRAINING.md ├── environment.yml ├── figures ├── codeact-comparison-perf.png ├── codeact-comparison-table.png ├── data-stats.png ├── json-text-comparison.png ├── model-performance.png └── overview.png ├── mint ├── agents │ ├── __init__.py │ ├── bard_agent.py │ ├── base.py │ ├── claude_agent.py │ ├── claude_feedback_agent.py │ ├── openai_feedback_agent.py │ ├── openai_lm_agent.py │ ├── vllm_agent.py │ └── vllm_feedback_agent.py ├── configs │ ├── __init__.py │ ├── config_variables.py │ └── generate_config.py ├── data_gen_configs │ ├── claude-2 │ │ └── F=None │ │ │ └── max5_p2+tool+cd │ │ │ ├── code_generation │ │ │ └── APPS │ │ │ │ └── train.json │ │ │ ├── decision_making │ │ │ └── alfworld │ │ │ │ └── train.json │ │ │ ├── reasoning │ │ │ ├── algebra │ │ │ │ └── train.json │ │ │ ├── counting_and_probability │ │ │ │ └── train.json │ │ │ ├── geometry │ │ │ │ └── train.json │ │ │ ├── hotpotqa │ │ │ │ └── train.json │ │ │ ├── intermediate_algebra │ │ │ │ └── train.json │ │ │ ├── number_theory │ │ │ │ └── train.json │ │ │ ├── prealgebra │ │ │ │ └── train.json │ │ │ ├── precalculus │ │ │ │ └── train.json │ │ │ └── strategyqa │ │ │ │ └── train.json │ │ │ └── tabular │ │ │ └── wiki_table_questions │ │ │ └── train.json │ ├── claude-instant-1 │ │ └── F=None │ │ │ └── max5_p2+tool+cd │ │ │ ├── code_generation │ │ │ └── APPS │ │ │ │ └── train.json │ │ │ ├── decision_making │ │ │ └── alfworld │ │ │ │ └── train.json │ │ │ ├── reasoning │ │ │ ├── algebra │ │ │ │ └── train.json │ │ │ ├── counting_and_probability │ │ │ │ └── train.json │ │ │ ├── geometry │ │ │ │ └── train.json │ │ │ ├── hotpotqa │ │ │ │ └── train.json │ │ │ ├── intermediate_algebra │ │ │ │ └── train.json │ │ │ ├── number_theory │ │ │ │ └── train.json │ │ │ ├── prealgebra │ │ │ │ └── train.json │ │ │ ├── precalculus │ │ │ │ └── train.json │ │ │ └── strategyqa │ │ │ │ └── train.json │ │ │ └── tabular │ │ │ └── wiki_table_questions │ │ │ └── train.json │ ├── gpt-3.5-turbo-0613 │ │ └── F=None │ │ │ └── max5_p2+tool+cd │ │ │ ├── code_generation │ │ │ └── APPS │ │ │ │ └── train.json │ │ │ ├── decision_making │ │ │ └── alfworld │ │ │ │ └── train.json │ │ │ ├── reasoning │ │ │ ├── algebra │ │ │ │ └── train.json │ │ │ ├── counting_and_probability │ │ │ │ └── train.json │ │ │ ├── geometry │ │ │ │ └── train.json │ │ │ ├── hotpotqa │ │ │ │ └── train.json │ │ │ ├── intermediate_algebra │ │ │ │ └── train.json │ │ │ ├── number_theory │ │ │ │ └── train.json │ │ │ ├── prealgebra │ │ │ │ └── train.json │ │ │ ├── precalculus │ │ │ │ └── train.json │ │ │ └── strategyqa │ │ │ │ └── train.json │ │ │ └── tabular │ │ │ └── wiki_table_questions │ │ │ └── train.json │ ├── gpt-3.5-turbo-16k-0613 │ │ └── F=None │ │ │ └── max5_p2+tool+cd │ │ │ ├── code_generation │ │ │ └── APPS │ │ │ │ └── train.json │ │ │ ├── decision_making │ │ │ └── alfworld │ │ │ │ └── train.json │ │ │ ├── reasoning │ │ │ ├── algebra │ │ │ │ └── train.json │ │ │ ├── counting_and_probability │ │ │ │ └── train.json │ │ │ ├── geometry │ │ │ │ └── train.json │ │ │ ├── hotpotqa │ │ │ │ └── train.json │ │ │ ├── intermediate_algebra │ │ │ │ └── train.json │ │ │ ├── number_theory │ │ │ │ └── train.json │ │ │ ├── prealgebra │ │ │ │ └── train.json │ │ │ ├── precalculus │ │ │ │ └── train.json │ │ │ └── strategyqa │ │ │ │ └── train.json │ │ │ └── tabular │ │ │ └── wiki_table_questions │ │ │ └── train.json │ └── gpt-4-0613 │ │ └── F=None │ │ └── max5_p2+tool+cd │ │ ├── code_generation │ │ └── APPS │ │ │ └── train.json │ │ ├── decision_making │ │ └── alfworld │ │ │ └── train.json │ │ ├── reasoning │ │ ├── algebra │ │ │ └── train.json │ │ ├── counting_and_probability │ │ │ └── train.json │ │ ├── geometry │ │ │ └── train.json │ │ ├── hotpotqa │ │ │ └── train.json │ │ ├── intermediate_algebra │ │ │ └── train.json │ │ ├── number_theory │ │ │ └── train.json │ │ ├── prealgebra │ │ │ └── train.json │ │ ├── precalculus │ │ │ └── train.json │ │ └── strategyqa │ │ │ └── train.json │ │ └── tabular │ │ └── wiki_table_questions │ │ └── train.json ├── datatypes.py ├── envs │ ├── __init__.py │ ├── alfworld_env.py │ ├── base.py │ └── general_env.py ├── main.py ├── prompt │ ├── __init__.py │ └── templates │ │ ├── template_feedback_agent.txt │ │ ├── template_with_tool.txt │ │ └── template_without_tool.txt ├── tasks │ ├── __init__.py │ ├── alfworld.py │ ├── base.py │ ├── codegen │ │ ├── APPS │ │ │ ├── __init__.py │ │ │ ├── testing_util.py │ │ │ └── utils.py │ │ └── __init__.py │ ├── in_context_examples │ │ ├── APPS │ │ │ ├── with_tool.txt │ │ │ └── with_tool_and_feedback.txt │ │ ├── README.md │ │ ├── alfworld │ │ │ ├── clean │ │ │ │ ├── with_tool.txt │ │ │ │ └── with_tool_and_feedback.txt │ │ │ ├── cool │ │ │ │ ├── with_tool.txt │ │ │ │ └── with_tool_and_feedback.txt │ │ │ ├── examine │ │ │ │ ├── with_tool.txt │ │ │ │ └── with_tool_and_feedback.txt │ │ │ ├── heat │ │ │ │ ├── with_tool.txt │ │ │ │ └── with_tool_and_feedback.txt │ │ │ ├── put │ │ │ │ ├── with_tool.txt │ │ │ │ └── with_tool_and_feedback.txt │ │ │ └── puttwo │ │ │ │ ├── with_tool.txt │ │ │ │ └── with_tool_and_feedback.txt │ │ ├── humaneval │ │ │ ├── with_tool.txt │ │ │ └── with_tool_and_feedback.txt │ │ ├── mbpp │ │ │ ├── with_tool.txt │ │ │ └── with_tool_and_feedback.txt │ │ ├── reasoning │ │ │ ├── with_tool.txt │ │ │ └── with_tool_and_feedback.txt │ │ └── tabular │ │ │ ├── with_tool.txt │ │ │ └── with_tool_and_feedback.txt │ ├── reasoning │ │ ├── __init__.py │ │ ├── grader.py │ │ └── math_normalize.py │ └── tabular │ │ ├── __init__.py │ │ └── evaluator.py ├── tools │ ├── __init__.py │ ├── alfworld.py │ ├── arxiv_search.py │ ├── base.py │ ├── python_tool.py │ ├── web_search.py │ └── wikipedia_search.py └── utils │ ├── __init__.py │ ├── exception.py │ └── exec.py ├── requirements.txt └── scripts ├── chat ├── code_execution │ ├── Dockerfile.api │ ├── Dockerfile.executor │ ├── api.py │ ├── jupyter.py │ └── start_jupyter_server.sh ├── demo.py ├── kubernetes │ ├── build_chat_ui_and_push.sh │ ├── build_code_execute_api_and_push.sh │ ├── build_code_executor_container_and_push.sh │ └── k8s.template.yml ├── run_chat_ui.sh ├── run_chat_ui_debug.sh ├── start_mongodb.sh └── start_vllm.sh ├── data ├── analyze_dataset.ipynb ├── create_hf_dataset.py ├── download_from_hf.py ├── general │ ├── process_capybara.py │ ├── process_general_traj.sh │ ├── process_openorca.py │ └── process_sharegpt.py ├── interaction │ ├── collection │ │ ├── convert_outputs.ipynb │ │ ├── process_trajectories.ipynb │ │ ├── run.sh │ │ └── run_mint_docker_interactive.sh │ ├── download_raw_data.sh │ ├── process_APPS.py │ ├── process_MATH.py │ ├── process_WikiTableQuestions.py │ └── process_hotpotQA.py └── megatron_conversion │ ├── process_mixture_llama.sh │ └── process_mixture_mistral.sh ├── docker ├── Dockerfile.megatron ├── Dockerfile.mint ├── run_megatron_interactive.sh └── run_megatron_interactive_slurm.sh ├── eval ├── aggregate_eval.py ├── api-bank │ ├── .gitignore │ ├── API-Bank-arxiv-version.pdf │ ├── LICENSE │ ├── README.md │ ├── api_bank_analysis.ipynb │ ├── api_call_extraction.py │ ├── apis │ │ ├── __init__.py │ │ ├── add_agenda.py │ │ ├── add_alarm.py │ │ ├── add_meeting.py │ │ ├── add_reminder.py │ │ ├── add_scene.py │ │ ├── api.py │ │ ├── appointment_registration.py │ │ ├── book_hotel.py │ │ ├── calculator.py │ │ ├── cancel_registration.py │ │ ├── cancel_timed_switch.py │ │ ├── check_token.py │ │ ├── delete_account.py │ │ ├── delete_agenda.py │ │ ├── delete_alarm.py │ │ ├── delete_meeting.py │ │ ├── delete_reminder.py │ │ ├── delete_scene.py │ │ ├── dictionary.py │ │ ├── document_qa.py │ │ ├── emergency_knowledge.py │ │ ├── forgot_password.py │ │ ├── get_today.py │ │ ├── get_user_token.py │ │ ├── image_caption.py │ │ ├── modify_agenda.py │ │ ├── modify_alarm.py │ │ ├── modify_meeting.py │ │ ├── modify_password.py │ │ ├── modify_registration.py │ │ ├── modify_reminder.py │ │ ├── modify_scene.py │ │ ├── open_bank_account.py │ │ ├── play_music.py │ │ ├── query_agenda.py │ │ ├── query_alarm.py │ │ ├── query_balance.py │ │ ├── query_health_data.py │ │ ├── query_history_today.py │ │ ├── query_meeting.py │ │ ├── query_registration.py │ │ ├── query_reminder.py │ │ ├── query_scene.py │ │ ├── query_stock.py │ │ ├── record_health_data.py │ │ ├── register_user.py │ │ ├── search_engine.py │ │ ├── send_email.py │ │ ├── speech_recognition.py │ │ ├── symptom_search.py │ │ ├── timed_switch.py │ │ ├── tool_search.py │ │ ├── translate.py │ │ └── wiki.py │ ├── data │ │ ├── all_apis.csv │ │ └── exceptions.json │ ├── demo.py │ ├── evaluator.py │ ├── evaluator_by_json.py │ ├── figures │ │ ├── multi-agent.png │ │ └── three_ability.png │ ├── init_database │ │ ├── Account.json │ │ ├── Agenda.json │ │ ├── Alarm.json │ │ ├── Appointments.json │ │ ├── Bank.json │ │ ├── HealthData.json │ │ ├── History.json │ │ ├── Hotel.json │ │ ├── ImageCaptioning.json │ │ ├── Meeting.json │ │ ├── QuestionAnswering.json │ │ ├── Reminder.json │ │ ├── Scenes.json │ │ ├── SearchEngine.json │ │ ├── SpeechRecognition.json │ │ ├── Stock.json │ │ ├── Symptom.json │ │ ├── TimeSwitch.json │ │ └── Wiki.json │ ├── lv1-lv2-samples │ │ ├── level-1-given-desc │ │ │ ├── AddAgenda-AddAlarm-GetUserToken-level-2-1.jsonl │ │ │ ├── AddAgenda-AddMeeting-GetUserToken-level-2-2.jsonl │ │ │ ├── AddAgenda-AddMeeting-GetUserToken-level-2-3.jsonl │ │ │ ├── AddAgenda-AddMeeting-GetUserToken-level-2-4.jsonl │ │ │ ├── AddAgenda-level-1-1.jsonl │ │ │ ├── AddAgenda-level-1-2.jsonl │ │ │ ├── AddAlarm-GetReminder-ModifyAgenda-GetUserToken-level-2-1.jsonl │ │ │ ├── AddAlarm-level-1-1.jsonl │ │ │ ├── AddMeeting-level-1-1.jsonl │ │ │ ├── AddReminder-level-1-1.jsonl │ │ │ ├── AddReminder-level-1-2.jsonl │ │ │ ├── AddReminder-level-1-3.jsonl │ │ │ ├── AppointmentRegistration-level-1-1.jsonl │ │ │ ├── AppointmentRegistration-level-1-2.jsonl │ │ │ ├── AppointmentRegistration-level-1-3.jsonl │ │ │ ├── BookHotel-level-1-1.jsonl │ │ │ ├── BookHotel-level-1-2.jsonl │ │ │ ├── BookHotel-level-1-3.jsonl │ │ │ ├── BookHotel-level-1-4.jsonl │ │ │ ├── BookHotel-level-1-5.jsonl │ │ │ ├── Calculator-QueryHistoryToday-level-2-1.jsonl │ │ │ ├── Calculator-QueryHistoryToday-level-2-2.jsonl │ │ │ ├── Calculator-level-1-1.jsonl │ │ │ ├── Calculator-level-1-2.jsonl │ │ │ ├── Calculator-level-1-3.jsonl │ │ │ ├── CancelRegistration-RecordHealthData-QueryRegistration-level-2-1.jsonl │ │ │ ├── CancelRegistration-RecordHealthData-QueryRegistration-level-2-2.jsonl │ │ │ ├── CancelRegistration-RecordHealthData-level-2-1.jsonl │ │ │ ├── CancelRegistration-RecordHealthData-level-2-2.jsonl │ │ │ ├── CancelRegistration-RecordHealthData-level-2-3.jsonl │ │ │ ├── CancelRegistration-RecordHealthData-level-2-4.jsonl │ │ │ ├── CancelRegistration-RecordHealthData-level-2-5.jsonl │ │ │ ├── CancelRegistration-level-1-1.jsonl │ │ │ ├── CancelRegistration-level-1-2.jsonl │ │ │ ├── CancelRegistration-level-1-3.jsonl │ │ │ ├── CancelTimedSwitch-level-1-1.jsonl │ │ │ ├── CancelTimedSwitch-level-1-2.jsonl │ │ │ ├── CancelTimedSwitch-level-1-3.jsonl │ │ │ ├── CancelTimedSwitch-level-1-4.jsonl │ │ │ ├── CancelTimedSwitch-level-1-5.jsonl │ │ │ ├── DeleteAccount-ModifyPassword-GetUserToken-level-2-1.jsonl │ │ │ ├── DeleteAccount-ModifyPassword-GetUserToken-level-2-2.jsonl │ │ │ ├── DeleteAccount-ModifyPassword-GetUserToken-level-2-3.jsonl │ │ │ ├── DeleteAccount-ModifyPassword-GetUserToken-level-2-4.jsonl │ │ │ ├── DeleteAccount-ModifyPassword-GetUserToken-level-2-5.jsonl │ │ │ ├── DeleteAccount-RegisterUser-ForgotPassword-GetUserToken-level-2-1.jsonl │ │ │ ├── DeleteAccount-RegisterUser-ForgotPassword-GetUserToken-level-2-2.jsonl │ │ │ ├── DeleteAccount-level-1-1.jsonl │ │ │ ├── DeleteAccount-level-1-2.jsonl │ │ │ ├── DeleteAccount-level-1-3.jsonl │ │ │ ├── DeleteAgenda-AddAlarm-DeleteMeeting-GetUserToken-level-2-1.jsonl │ │ │ ├── DeleteAgenda-AddAlarm-DeleteMeeting-GetUserToken-level-2-2.jsonl │ │ │ ├── DeleteAgenda-level-1-1.jsonl │ │ │ ├── DeleteAlarm-AddAgenda-GetUserToken-level-2-1.jsonl │ │ │ ├── DeleteAlarm-AddAgenda-GetUserToken-level-2-2.jsonl │ │ │ ├── DeleteAlarm-level-1-1.jsonl │ │ │ ├── DeleteAlarm-level-1-2.jsonl │ │ │ ├── DeleteMeeting-level-1-1.jsonl │ │ │ ├── DeleteReminder-level-1-1.jsonl │ │ │ ├── DeleteScene-level-1-1.jsonl │ │ │ ├── DeleteScene-level-1-2.jsonl │ │ │ ├── DeleteScene-level-1-3.jsonl │ │ │ ├── Dictionary-level-1-1.jsonl │ │ │ ├── Dictionary-level-1-2.jsonl │ │ │ ├── Dictionary-level-1-3.jsonl │ │ │ ├── Dictionary-level-1-4.jsonl │ │ │ ├── DocumentQA-level-1-1.jsonl │ │ │ ├── DocumentQA-level-1-2.jsonl │ │ │ ├── DocumentQA-level-1-3.jsonl │ │ │ ├── DocumentQA-level-1-4.jsonl │ │ │ ├── EmergencyKnowledge-ModifyRegistration-RecordHealthData-level-2-1.jsonl │ │ │ ├── EmergencyKnowledge-ModifyRegistration-RecordHealthData-level-2-2.jsonl │ │ │ ├── EmergencyKnowledge-ModifyRegistration-RecordHealthData-level-2-3.jsonl │ │ │ ├── EmergencyKnowledge-level-1-1.jsonl │ │ │ ├── EmergencyKnowledge-level-1-2.jsonl │ │ │ ├── ForgotPassword-ModifyPassword-GetUserToken-level-2-1.jsonl │ │ │ ├── ForgotPassword-RegisterUser-DeleteAccount-GetUserToken-level-2-1.jsonl │ │ │ ├── ForgotPassword-level-1-1.jsonl │ │ │ ├── GetMeeting-level-1-1.jsonl │ │ │ ├── GetMeeting-level-1-2.jsonl │ │ │ ├── GetReminder-level-1-1.jsonl │ │ │ ├── GetReminder-level-1-2.jsonl │ │ │ ├── GetToday-ModifyMeeting-ModifyAlarm-GetUserToken-level-2-1.jsonl │ │ │ ├── GetToday-ModifyMeeting-ModifyAlarm-GetUserToken-level-2-2.jsonl │ │ │ ├── GetToday-level-1-1.jsonl │ │ │ ├── GetToday-level-1-2.jsonl │ │ │ ├── GetToday-level-1-3.jsonl │ │ │ ├── GetToday-level-1-4.jsonl │ │ │ ├── ImageCaption-level-1-1.jsonl │ │ │ ├── ModifyAgenda-level-1-1.jsonl │ │ │ ├── ModifyAgenda-level-1-2.jsonl │ │ │ ├── ModifyAlarm-AddAgenda-GetUserToken-level-2-1.jsonl │ │ │ ├── ModifyAlarm-AddAgenda-GetUserToken-level-2-2.jsonl │ │ │ ├── ModifyAlarm-level-1-1.jsonl │ │ │ ├── ModifyAlarm-level-1-2.jsonl │ │ │ ├── ModifyMeeting-level-1-1.jsonl │ │ │ ├── ModifyMeeting-level-1-2.jsonl │ │ │ ├── ModifyMeeting-level-1-3.jsonl │ │ │ ├── ModifyPassword-ForgotPassword-DeleteAccount-GetUserToken-level-2-1.jsonl │ │ │ ├── ModifyPassword-ForgotPassword-DeleteAccount-GetUserToken-level-2-2.jsonl │ │ │ ├── ModifyPassword-ForgotPassword-DeleteAccount-GetUserToken-level-2-3.jsonl │ │ │ ├── ModifyPassword-ForgotPassword-DeleteAccount-GetUserToken-level-2-4.jsonl │ │ │ ├── ModifyPassword-RegisterUser-GetUserToken-level-2-1.jsonl │ │ │ ├── ModifyPassword-level-1-1.jsonl │ │ │ ├── ModifyPassword-level-1-2.jsonl │ │ │ ├── ModifyRegistration-EmergencyKnowledge-level-2-1.jsonl │ │ │ ├── ModifyRegistration-EmergencyKnowledge-level-2-2.jsonl │ │ │ ├── ModifyRegistration-EmergencyKnowledge-level-2-3.jsonl │ │ │ ├── ModifyRegistration-EmergencyKnowledge-level-2-4.jsonl │ │ │ ├── ModifyRegistration-QueryHealthData-CancelRegistration-level-2-1.jsonl │ │ │ ├── ModifyRegistration-QueryHealthData-CancelRegistration-level-2-2.jsonl │ │ │ ├── ModifyRegistration-level-1-1.jsonl │ │ │ ├── ModifyRegistration-level-1-2.jsonl │ │ │ ├── ModifyRegistration-level-1-3.jsonl │ │ │ ├── ModifyRegistration-level-1-4.jsonl │ │ │ ├── ModifyRegistration-level-1-5.jsonl │ │ │ ├── ModifyReminder-AddAgenda-DeleteAgenda-GetUserToken-level-2-1.jsonl │ │ │ ├── ModifyReminder-AddAgenda-DeleteAgenda-GetUserToken-level-2-2.jsonl │ │ │ ├── ModifyReminder-AddAgenda-GetUserToken-level-2-1.jsonl │ │ │ ├── ModifyReminder-AddAgenda-GetUserToken-level-2-2.jsonl │ │ │ ├── ModifyReminder-AddAgenda-GetUserToken-level-2-3.jsonl │ │ │ ├── ModifyReminder-level-1-1.jsonl │ │ │ ├── ModifyReminder-level-1-2.jsonl │ │ │ ├── ModifyReminder-level-1-3.jsonl │ │ │ ├── OpenBankAccount-QueryBalance-QueryStock-GetUserToken-level-2-2.jsonl │ │ │ ├── OpenBankAccount-QueryStock-QueryBalance-GetUserToken-level-2-1.jsonl │ │ │ ├── OpenBankAccount-QueryStock-level-2-1.jsonl │ │ │ ├── OpenBankAccount-level-1-1.jsonl │ │ │ ├── OpenBankAccount-level-1-2.jsonl │ │ │ ├── OpenBankAccount-level-1-3.jsonl │ │ │ ├── OpenBankAccount-level-1-4.jsonl │ │ │ ├── OpenBankAccount-level-1-5.jsonl │ │ │ ├── PlayMusic-level-1-1.jsonl │ │ │ ├── PlayMusic-level-1-2.jsonl │ │ │ ├── PlayMusic-level-1-3.jsonl │ │ │ ├── QueryAgenda-level-1-1.jsonl │ │ │ ├── QueryAlarm-level-1-1.jsonl │ │ │ ├── QueryBalance-OpenBankAccount-QueryStock-GetUserToken-level-2-1.jsonl │ │ │ ├── QueryBalance-QueryStock-OpenBankAccount-GetUserToken-level-2-1.jsonl │ │ │ ├── QueryBalance-QueryStock-OpenBankAccount-GetUserToken-level-2-2.jsonl │ │ │ ├── QueryBalance-level-1-1.jsonl │ │ │ ├── QueryBalance-level-1-2.jsonl │ │ │ ├── QueryHealthData-CancelRegistration-SymptomSearch-level-2-1.jsonl │ │ │ ├── QueryHealthData-level-1-1.jsonl │ │ │ ├── QueryHealthData-level-1-2.jsonl │ │ │ ├── QueryHistoryToday-Calculator-level-2-1.jsonl │ │ │ ├── QueryHistoryToday-Calculator-level-2-2.jsonl │ │ │ ├── QueryHistoryToday-Calculator-level-2-3.jsonl │ │ │ ├── QueryHistoryToday-Calculator-level-2-4.jsonl │ │ │ ├── QueryHistoryToday-level-1-1.jsonl │ │ │ ├── QueryHistoryToday-level-1-2.jsonl │ │ │ ├── QueryHistoryToday-level-1-3.jsonl │ │ │ ├── QueryMeeting-level-1-1.jsonl │ │ │ ├── QueryRegistration-AppointmentRegistration-level-2-1.jsonl │ │ │ ├── QueryRegistration-EmergencyKnowledge-level-2-1.jsonl │ │ │ ├── QueryRegistration-EmergencyKnowledge-level-2-2.jsonl │ │ │ ├── QueryRegistration-EmergencyKnowledge-level-2-3.jsonl │ │ │ ├── QueryRegistration-EmergencyKnowledge-level-2-4.jsonl │ │ │ ├── QueryRegistration-SymptomSearch-RecordHealthData-level-2-1.jsonl │ │ │ ├── QueryRegistration-SymptomSearch-RecordHealthData-level-2-2.jsonl │ │ │ ├── QueryRegistration-level-1-1.jsonl │ │ │ ├── QueryRegistration-level-1-2.jsonl │ │ │ ├── QueryRegistration-level-1-3.jsonl │ │ │ ├── QueryRegistration-level-1-4.jsonl │ │ │ ├── QueryRegistration-level-1-5.jsonl │ │ │ ├── QueryReminder-level-1-1.jsonl │ │ │ ├── QueryReminder-level-1-2.jsonl │ │ │ ├── QueryScene-level-1-1.jsonl │ │ │ ├── QueryScene-level-1-2.jsonl │ │ │ ├── QueryScene-level-1-3.jsonl │ │ │ ├── QueryScene-level-1-4.jsonl │ │ │ ├── QueryScene-level-1-5.jsonl │ │ │ ├── QueryStock-OpenBankAccount-QueryBalance-GetUserToken-level-2-1.jsonl │ │ │ ├── QueryStock-OpenBankAccount-QueryBalance-GetUserToken-level-2-2.jsonl │ │ │ ├── QueryStock-OpenBankAccount-level-2-1.jsonl │ │ │ ├── QueryStock-QueryBalance-GetUserToken-level-2-1.jsonl │ │ │ ├── QueryStock-QueryBalance-OpenBankAccount-GetUserToken-level-2-1.jsonl │ │ │ ├── QueryStock-QueryBalance-OpenBankAccount-GetUserToken-level-2-2.jsonl │ │ │ ├── QueryStock-level-1-1.jsonl │ │ │ ├── QueryStock-level-1-2.jsonl │ │ │ ├── QueryStock-level-1-3.jsonl │ │ │ ├── QueryStock-level-1-4.jsonl │ │ │ ├── QueryStock-level-1-5.jsonl │ │ │ ├── RecordHealthData-AppointmentRegistration-EmergencyKnowledge-level-2-1.jsonl │ │ │ ├── RecordHealthData-AppointmentRegistration-EmergencyKnowledge-level-2-2.jsonl │ │ │ ├── RecordHealthData-AppointmentRegistration-EmergencyKnowledge-level-2-3.jsonl │ │ │ ├── RecordHealthData-AppointmentRegistration-EmergencyKnowledge-level-2-4.jsonl │ │ │ ├── RecordHealthData-AppointmentRegistration-EmergencyKnowledge-level-2-5.jsonl │ │ │ ├── RecordHealthData-AppointmentRegistration-QueryRegistration-level-2-1.jsonl │ │ │ ├── RecordHealthData-AppointmentRegistration-QueryRegistration-level-2-2.jsonl │ │ │ ├── RecordHealthData-level-1-1.jsonl │ │ │ ├── RecordHealthData-level-1-2.jsonl │ │ │ ├── RegisterUser-ForgotPassword-DeleteAccount-GetUserToken-level-2-1.jsonl │ │ │ ├── RegisterUser-ForgotPassword-level-2-1.jsonl │ │ │ ├── RegisterUser-ForgotPassword-level-2-2.jsonl │ │ │ ├── RegisterUser-ForgotPassword-level-2-3.jsonl │ │ │ ├── RegisterUser-level-1-1.jsonl │ │ │ ├── RegisterUser-level-1-2.jsonl │ │ │ ├── RegisterUser-level-1-3.jsonl │ │ │ ├── SearchEngine-level-1-1.jsonl │ │ │ ├── SearchEngine-level-1-2.jsonl │ │ │ ├── SendEmail-level-1-1.jsonl │ │ │ ├── SpeechRecognition-level-1-1.jsonl │ │ │ ├── SymptomSearch-AppointmentRegistration-level-2-1.jsonl │ │ │ ├── SymptomSearch-level-1-1.jsonl │ │ │ ├── SymptomSearch-level-1-2.jsonl │ │ │ ├── TimedSwitch-level-1-1.jsonl │ │ │ ├── TimedSwitch-level-1-2.jsonl │ │ │ ├── TimedSwitch-level-1-3.jsonl │ │ │ ├── Translate-level-1-1.jsonl │ │ │ ├── Translate-level-1-2.jsonl │ │ │ ├── Translate-level-1-3.jsonl │ │ │ ├── Translate-level-1-4.jsonl │ │ │ └── Wiki-level-1-1.jsonl │ │ └── level-2-toolsearcher │ │ │ ├── AddAgenda-level-3-1.jsonl │ │ │ ├── AddAgenda-level-3-2.jsonl │ │ │ ├── AddAlarm-level-3-1.jsonl │ │ │ ├── AddAlarm-level-3-2.jsonl │ │ │ ├── AddMeeting-level-3-1.jsonl │ │ │ ├── AddMeeting-level-3-2.jsonl │ │ │ ├── AddReminder-level-3-1.jsonl │ │ │ ├── AppointmentRegistration-level-3-1.jsonl │ │ │ ├── BookHotel-level-3-1.jsonl │ │ │ ├── BookHotel-level-3-2.jsonl │ │ │ ├── BookHotel-level-3-3.jsonl │ │ │ ├── Calculator-level-3-1.jsonl │ │ │ ├── Calculator-level-3-2.jsonl │ │ │ ├── DeleteAccount-level-3-1.jsonl │ │ │ ├── DeleteAccount-level-3-2.jsonl │ │ │ ├── DeleteAccount-level-3-3.jsonl │ │ │ ├── DeleteAgenda-level-3-1.jsonl │ │ │ ├── DeleteAgenda-level-3-2.jsonl │ │ │ ├── DeleteAlarm-level-3-1.jsonl │ │ │ ├── DeleteMeeting-level-3-1.jsonl │ │ │ ├── DeleteMeeting-level-3-2.jsonl │ │ │ ├── DeleteReminder-level-3-1.jsonl │ │ │ ├── EmergencyKnowledge-level-3-1.jsonl │ │ │ ├── GetToday-level-3-1.jsonl │ │ │ ├── ModifyAgenda-level-3-1.jsonl │ │ │ ├── ModifyMeeting-level-3-1.jsonl │ │ │ ├── ModifyRegistration-level-3-1.jsonl │ │ │ ├── ModifyReminder-level-3-1.jsonl │ │ │ ├── QueryAlarm-level-3-1.jsonl │ │ │ ├── QueryBalance-level-3-1.jsonl │ │ │ ├── QueryBalance-level-3-2.jsonl │ │ │ ├── QueryHealthData-level-3-1.jsonl │ │ │ ├── QueryHistoryToday-level-3-2.jsonl │ │ │ ├── QueryHistoryToday-level-3-3.jsonl │ │ │ ├── QueryMeeting-level-3-1.jsonl │ │ │ ├── QueryMeeting-level-3-2.jsonl │ │ │ ├── QueryRegistration-level-3-1.jsonl │ │ │ ├── QueryRegistration-level-3-2.jsonl │ │ │ ├── QueryReminder-level-3-1.jsonl │ │ │ ├── QueryReminder-level-3-2.jsonl │ │ │ ├── QueryReminder-level-3-3.jsonl │ │ │ ├── QueryStock-level-3-1.jsonl │ │ │ ├── RecordHealthData-level-3-1.jsonl │ │ │ ├── RecordHealthData-level-3-2.jsonl │ │ │ ├── RecordHealthData-level-3-3.jsonl │ │ │ ├── SymptomSearch-level-3-1.jsonl │ │ │ ├── SymptomSearch-level-3-2.jsonl │ │ │ ├── SymptomSearch-level-3-3.jsonl │ │ │ ├── SymptomSearch-level-3-4.jsonl │ │ │ └── SymptomSearch-level-3-5.jsonl │ ├── lv3-samples │ │ ├── Financial Management.txt │ │ ├── Health Management.txt │ │ ├── Hospital.txt │ │ ├── Hotel Booking.txt │ │ ├── Meeting Schedule.txt │ │ ├── Personal Assistant.txt │ │ ├── Reminder.txt │ │ └── Shopping.txt │ ├── lv3_apis │ │ ├── account_info.py │ │ ├── add_meeting.py │ │ ├── calculator.py │ │ ├── clothing_recommandation.py │ │ ├── email_reminder.py │ │ ├── flight_search.py │ │ ├── geocoding.py │ │ ├── get_occupation_salary.py │ │ ├── get_weather.py │ │ ├── hotel_availability.py │ │ ├── like_count.py │ │ ├── movie_recommandation.py │ │ ├── nearby_restaurants.py │ │ ├── organization_members.py │ │ ├── query_meeting.py │ │ ├── tax_calculator.py │ │ ├── tool_search.py │ │ ├── travel_status.py │ │ ├── update_account_info.py │ │ ├── user_posts.py │ │ ├── user_watched_movies.py │ │ └── users_movie_preference.py │ ├── lv3_evaluator.py │ ├── requirements.txt │ ├── run.sh │ ├── simulator.py │ ├── tool_manager.py │ └── utils.py ├── gsm8k │ ├── evaluate_gsm8k.py │ └── gsm8k.sh ├── human_eval │ ├── HumanEval.jsonl │ ├── evaluate_human_eval.py │ └── human_eval.sh ├── m3tooleval │ ├── m3tooleval_analysis.ipynb │ ├── main.py │ ├── run.sh │ └── tasks │ │ ├── __init__.py │ │ ├── base.py │ │ ├── impl │ │ ├── __init__.py │ │ ├── dna_sequencer.py │ │ ├── message_decoder.py │ │ ├── trade_calculator.py │ │ ├── travel_itinerary_planning.py │ │ └── web_browsing │ │ │ ├── __init__.py │ │ │ ├── generate_web_pages.py │ │ │ ├── metadata.json │ │ │ └── web_pages.jsonl │ │ └── repl.py ├── miniwob++ │ ├── .gitignore │ ├── LICENSE │ ├── README.md │ ├── available_tasks.txt │ ├── computergym │ │ ├── .gitignore │ │ ├── README.md │ │ ├── computergym │ │ │ ├── __init__.py │ │ │ └── miniwob │ │ │ │ ├── base_env.py │ │ │ │ └── miniwob_interface │ │ │ │ ├── __init__.py │ │ │ │ ├── action.py │ │ │ │ ├── environment.py │ │ │ │ ├── fields.py │ │ │ │ ├── html │ │ │ │ ├── .gitignore │ │ │ │ ├── common │ │ │ │ │ ├── shapes.js │ │ │ │ │ ├── special │ │ │ │ │ │ ├── book-flight │ │ │ │ │ │ │ └── domestic.js │ │ │ │ │ │ ├── checkbox-numbers │ │ │ │ │ │ │ ├── ch_0.png │ │ │ │ │ │ │ ├── ch_1.png │ │ │ │ │ │ │ ├── ch_2.png │ │ │ │ │ │ │ ├── ch_3.png │ │ │ │ │ │ │ ├── ch_4.png │ │ │ │ │ │ │ ├── ch_5.png │ │ │ │ │ │ │ ├── ch_6.png │ │ │ │ │ │ │ ├── ch_7.png │ │ │ │ │ │ │ ├── ch_8.png │ │ │ │ │ │ │ └── ch_9.png │ │ │ │ │ │ ├── click-pie │ │ │ │ │ │ │ ├── raphael.icons.min.js │ │ │ │ │ │ │ ├── raphael.min.js │ │ │ │ │ │ │ └── wheelnav.min.js │ │ │ │ │ │ ├── drag-cube │ │ │ │ │ │ │ ├── blank.png │ │ │ │ │ │ │ ├── cube.css │ │ │ │ │ │ │ └── cube.js │ │ │ │ │ │ ├── email-inbox-nl │ │ │ │ │ │ │ └── templates.js │ │ │ │ │ │ ├── email-inbox │ │ │ │ │ │ │ ├── delete.png │ │ │ │ │ │ │ ├── email-inbox.css │ │ │ │ │ │ │ ├── forward.png │ │ │ │ │ │ │ ├── left-arrow-white.png │ │ │ │ │ │ │ ├── left-arrow.png │ │ │ │ │ │ │ ├── reply.png │ │ │ │ │ │ │ ├── search.png │ │ │ │ │ │ │ ├── send.png │ │ │ │ │ │ │ ├── star-clicked.png │ │ │ │ │ │ │ └── star.png │ │ │ │ │ │ ├── navigate-tree │ │ │ │ │ │ │ ├── images │ │ │ │ │ │ │ │ ├── ajax-loader.gif │ │ │ │ │ │ │ │ ├── file.gif │ │ │ │ │ │ │ │ ├── folder-closed.gif │ │ │ │ │ │ │ │ ├── folder.gif │ │ │ │ │ │ │ │ ├── minus.gif │ │ │ │ │ │ │ │ ├── plus.gif │ │ │ │ │ │ │ │ ├── treeview-black-line.gif │ │ │ │ │ │ │ │ ├── treeview-black.gif │ │ │ │ │ │ │ │ ├── treeview-default-line.gif │ │ │ │ │ │ │ │ ├── treeview-default.gif │ │ │ │ │ │ │ │ ├── treeview-famfamfam-line.gif │ │ │ │ │ │ │ │ ├── treeview-famfamfam.gif │ │ │ │ │ │ │ │ ├── treeview-gray-line.gif │ │ │ │ │ │ │ │ ├── treeview-gray.gif │ │ │ │ │ │ │ │ ├── treeview-red-line.gif │ │ │ │ │ │ │ │ └── treeview-red.gif │ │ │ │ │ │ │ ├── jquery.treeview.css │ │ │ │ │ │ │ └── jquery.treeview.min.js │ │ │ │ │ │ ├── search-engine │ │ │ │ │ │ │ └── jquery.twbsPagination.min.js │ │ │ │ │ │ ├── social-media │ │ │ │ │ │ │ ├── like-hover.png │ │ │ │ │ │ │ ├── like.png │ │ │ │ │ │ │ ├── more-hover.png │ │ │ │ │ │ │ ├── more.png │ │ │ │ │ │ │ ├── reply-hover.png │ │ │ │ │ │ │ ├── reply.png │ │ │ │ │ │ │ ├── retweet-hover.png │ │ │ │ │ │ │ ├── retweet.png │ │ │ │ │ │ │ ├── share-hover.png │ │ │ │ │ │ │ └── share.png │ │ │ │ │ │ ├── text-editor │ │ │ │ │ │ │ ├── quill.min.js │ │ │ │ │ │ │ └── quill.snow.css │ │ │ │ │ │ └── tic-tac-toe │ │ │ │ │ │ │ ├── o.png │ │ │ │ │ │ │ └── x.png │ │ │ │ │ └── ui_utils.js │ │ │ │ ├── core │ │ │ │ │ ├── core.css │ │ │ │ │ ├── core.js │ │ │ │ │ ├── d3.v3.min.js │ │ │ │ │ ├── jquery-ui │ │ │ │ │ │ ├── external │ │ │ │ │ │ │ └── jquery │ │ │ │ │ │ │ │ └── jquery.js │ │ │ │ │ │ ├── images │ │ │ │ │ │ │ ├── ui-icons_444444_256x240.png │ │ │ │ │ │ │ ├── ui-icons_555555_256x240.png │ │ │ │ │ │ │ ├── ui-icons_777620_256x240.png │ │ │ │ │ │ │ ├── ui-icons_777777_256x240.png │ │ │ │ │ │ │ ├── ui-icons_cc0000_256x240.png │ │ │ │ │ │ │ └── ui-icons_ffffff_256x240.png │ │ │ │ │ │ ├── jquery-ui.min.css │ │ │ │ │ │ ├── jquery-ui.min.js │ │ │ │ │ │ ├── jquery-ui.structure.min.css │ │ │ │ │ │ └── jquery-ui.theme.min.css │ │ │ │ │ ├── jscolor.min.js │ │ │ │ │ └── record.js │ │ │ │ ├── flight │ │ │ │ │ ├── AA │ │ │ │ │ │ ├── apps │ │ │ │ │ │ │ └── common │ │ │ │ │ │ │ │ └── js │ │ │ │ │ │ │ │ ├── aacom.js │ │ │ │ │ │ │ │ ├── aacomDevice.js │ │ │ │ │ │ │ │ ├── airportcode.js │ │ │ │ │ │ │ │ ├── cookieconsent.js │ │ │ │ │ │ │ │ ├── jquery │ │ │ │ │ │ │ │ └── aacom │ │ │ │ │ │ │ │ │ ├── plugins │ │ │ │ │ │ │ │ │ ├── aaAirportAutoComplete.js │ │ │ │ │ │ │ │ │ ├── aaCache.js │ │ │ │ │ │ │ │ │ ├── aaCookie.js │ │ │ │ │ │ │ │ │ ├── aaCountryLanSelect.js │ │ │ │ │ │ │ │ │ ├── aaDropdownPanel.js │ │ │ │ │ │ │ │ │ ├── aaFooterAds.js │ │ │ │ │ │ │ │ │ └── aaTextBoxMessage.js │ │ │ │ │ │ │ │ │ └── utilities │ │ │ │ │ │ │ │ │ ├── aaUtilities-2.1.js │ │ │ │ │ │ │ │ │ └── aaUtils.js │ │ │ │ │ │ │ │ └── wa.js │ │ │ │ │ │ ├── content │ │ │ │ │ │ │ ├── common │ │ │ │ │ │ │ │ └── css │ │ │ │ │ │ │ │ │ └── v3 │ │ │ │ │ │ │ │ │ ├── core.css │ │ │ │ │ │ │ │ │ ├── jquery-ui-1.10-aa.css │ │ │ │ │ │ │ │ │ ├── reservation │ │ │ │ │ │ │ │ │ └── findFlights │ │ │ │ │ │ │ │ │ │ └── mobile │ │ │ │ │ │ │ │ │ │ └── findFlights.css │ │ │ │ │ │ │ │ │ └── responsive.css │ │ │ │ │ │ │ ├── fonts │ │ │ │ │ │ │ │ ├── american-v2 │ │ │ │ │ │ │ │ │ ├── americansans-bold.woff │ │ │ │ │ │ │ │ │ ├── americansans-light.woff │ │ │ │ │ │ │ │ │ ├── americansans-medium.woff │ │ │ │ │ │ │ │ │ └── americansans-regular.woff │ │ │ │ │ │ │ │ └── icons │ │ │ │ │ │ │ │ │ └── american-icons-v4-4.woff │ │ │ │ │ │ │ └── images │ │ │ │ │ │ │ │ ├── chrome │ │ │ │ │ │ │ │ ├── icons │ │ │ │ │ │ │ │ │ └── loading.gif │ │ │ │ │ │ │ │ └── rebrand │ │ │ │ │ │ │ │ │ ├── aa-flight-icon.png │ │ │ │ │ │ │ │ │ ├── aa-icons-flags-sprite.png │ │ │ │ │ │ │ │ │ ├── aa-logo.png │ │ │ │ │ │ │ │ │ ├── down-arrow.png │ │ │ │ │ │ │ │ │ ├── favicon.png │ │ │ │ │ │ │ │ │ ├── oneworld.png │ │ │ │ │ │ │ │ │ ├── shadow-down.png │ │ │ │ │ │ │ │ │ ├── shadow-vertical-150.png │ │ │ │ │ │ │ │ │ ├── shadow12-down.png │ │ │ │ │ │ │ │ │ ├── shadow12-up.png │ │ │ │ │ │ │ │ │ └── shadow3-down.png │ │ │ │ │ │ │ │ └── graphics │ │ │ │ │ │ │ │ └── icons │ │ │ │ │ │ │ │ └── aa-jqueryUIicons-sprite.png │ │ │ │ │ │ ├── dataset-AA.js │ │ │ │ │ │ ├── index.html │ │ │ │ │ │ ├── js │ │ │ │ │ │ │ ├── aa │ │ │ │ │ │ │ │ ├── common │ │ │ │ │ │ │ │ │ ├── aa-utility-menu.js │ │ │ │ │ │ │ │ │ ├── aacom-ui-1.0.0.js │ │ │ │ │ │ │ │ │ └── core-2.0.0.js │ │ │ │ │ │ │ │ ├── modules │ │ │ │ │ │ │ │ │ ├── airportLookup.js │ │ │ │ │ │ │ │ │ ├── ajax.js │ │ │ │ │ │ │ │ │ ├── browserdetect.js │ │ │ │ │ │ │ │ │ ├── commonsetup.js │ │ │ │ │ │ │ │ │ ├── mobileDatePicker.js │ │ │ │ │ │ │ │ │ ├── utilities.js │ │ │ │ │ │ │ │ │ └── widgets.js │ │ │ │ │ │ │ │ ├── plugins │ │ │ │ │ │ │ │ │ └── noBounce.js │ │ │ │ │ │ │ │ └── shopping │ │ │ │ │ │ │ │ │ └── mobileSearchFlights.js │ │ │ │ │ │ │ └── libs │ │ │ │ │ │ │ │ ├── jquery │ │ │ │ │ │ │ │ ├── jquery-1.11.1.min.js │ │ │ │ │ │ │ │ ├── jquery-migrate-1.2.1.min.js │ │ │ │ │ │ │ │ └── ui │ │ │ │ │ │ │ │ │ └── 1.10 │ │ │ │ │ │ │ │ │ ├── i18n │ │ │ │ │ │ │ │ │ └── jquery.ui.datepicker-en-aa.js │ │ │ │ │ │ │ │ │ └── jquery-ui.min.js │ │ │ │ │ │ │ │ └── modernizr-2.8.1.js │ │ │ │ │ │ ├── original.html │ │ │ │ │ │ ├── surrogate │ │ │ │ │ │ │ ├── airportLookup.js │ │ │ │ │ │ │ └── airports.json │ │ │ │ │ │ └── wrapper.html │ │ │ │ │ ├── Alaska-auto-medium │ │ │ │ │ │ ├── images │ │ │ │ │ │ │ ├── aura.png │ │ │ │ │ │ │ ├── cal3.png │ │ │ │ │ │ │ ├── chkboxes3.png │ │ │ │ │ │ │ ├── clear_text2.png │ │ │ │ │ │ │ ├── collapse.png │ │ │ │ │ │ │ ├── expand.png │ │ │ │ │ │ │ ├── flight_arrow.png │ │ │ │ │ │ │ ├── geo.png │ │ │ │ │ │ │ ├── home.png │ │ │ │ │ │ │ ├── info2.png │ │ │ │ │ │ │ ├── leftright.png │ │ │ │ │ │ │ ├── logo2.png │ │ │ │ │ │ │ └── logos │ │ │ │ │ │ │ │ ├── AA.png │ │ │ │ │ │ │ │ ├── AS.png │ │ │ │ │ │ │ │ ├── DL.png │ │ │ │ │ │ │ │ └── VX.png │ │ │ │ │ │ ├── index.html │ │ │ │ │ │ ├── mobileweb-v3-28-6227-21813.css │ │ │ │ │ │ ├── scripts │ │ │ │ │ │ │ ├── datepickr.js │ │ │ │ │ │ │ ├── main.js │ │ │ │ │ │ │ └── shopbook.js │ │ │ │ │ │ ├── stylesheets │ │ │ │ │ │ │ └── circular │ │ │ │ │ │ │ │ ├── ASCircularWeb-Bold.woff │ │ │ │ │ │ │ │ └── ASCircularWeb-Book.woff │ │ │ │ │ │ ├── surrogate │ │ │ │ │ │ │ ├── airportLookup.js │ │ │ │ │ │ │ └── airports.json │ │ │ │ │ │ └── wrapper.html │ │ │ │ │ ├── Alaska-auto │ │ │ │ │ │ ├── images │ │ │ │ │ │ │ ├── aura.png │ │ │ │ │ │ │ ├── cal3.png │ │ │ │ │ │ │ ├── chkboxes3.png │ │ │ │ │ │ │ ├── clear_text2.png │ │ │ │ │ │ │ ├── collapse.png │ │ │ │ │ │ │ ├── expand.png │ │ │ │ │ │ │ ├── flight_arrow.png │ │ │ │ │ │ │ ├── geo.png │ │ │ │ │ │ │ ├── home.png │ │ │ │ │ │ │ ├── info2.png │ │ │ │ │ │ │ ├── leftright.png │ │ │ │ │ │ │ ├── logo2.png │ │ │ │ │ │ │ └── logos │ │ │ │ │ │ │ │ ├── AA.png │ │ │ │ │ │ │ │ ├── AS.png │ │ │ │ │ │ │ │ ├── DL.png │ │ │ │ │ │ │ │ └── VX.png │ │ │ │ │ │ ├── index.html │ │ │ │ │ │ ├── mobileweb-v3-28-6227-21813.css │ │ │ │ │ │ ├── scripts │ │ │ │ │ │ │ ├── datepickr.js │ │ │ │ │ │ │ ├── main.js │ │ │ │ │ │ │ └── shopbook.js │ │ │ │ │ │ ├── stylesheets │ │ │ │ │ │ │ └── circular │ │ │ │ │ │ │ │ ├── ASCircularWeb-Bold.woff │ │ │ │ │ │ │ │ └── ASCircularWeb-Book.woff │ │ │ │ │ │ ├── surrogate │ │ │ │ │ │ │ ├── airportLookup.js │ │ │ │ │ │ │ └── airports.json │ │ │ │ │ │ └── wrapper.html │ │ │ │ │ ├── Alaska │ │ │ │ │ │ ├── dataset-Alaska.js │ │ │ │ │ │ ├── images │ │ │ │ │ │ │ ├── aura.png │ │ │ │ │ │ │ ├── cal3.png │ │ │ │ │ │ │ ├── chkboxes3.png │ │ │ │ │ │ │ ├── clear_text2.png │ │ │ │ │ │ │ ├── collapse.png │ │ │ │ │ │ │ ├── expand.png │ │ │ │ │ │ │ ├── flight_arrow.png │ │ │ │ │ │ │ ├── geo.png │ │ │ │ │ │ │ ├── home.png │ │ │ │ │ │ │ ├── info2.png │ │ │ │ │ │ │ ├── leftright.png │ │ │ │ │ │ │ ├── logo2.png │ │ │ │ │ │ │ └── logos │ │ │ │ │ │ │ │ ├── AA.png │ │ │ │ │ │ │ │ ├── AS.png │ │ │ │ │ │ │ │ ├── DL.png │ │ │ │ │ │ │ │ └── VX.png │ │ │ │ │ │ ├── index.html │ │ │ │ │ │ ├── mobileweb-v3-28-6227-21813.css │ │ │ │ │ │ ├── original.html │ │ │ │ │ │ ├── scripts │ │ │ │ │ │ │ ├── datepickr.js │ │ │ │ │ │ │ ├── main.js │ │ │ │ │ │ │ └── shopbook.js │ │ │ │ │ │ ├── stylesheets │ │ │ │ │ │ │ └── circular │ │ │ │ │ │ │ │ ├── ASCircularWeb-Bold.woff │ │ │ │ │ │ │ │ └── ASCircularWeb-Book.woff │ │ │ │ │ │ ├── surrogate │ │ │ │ │ │ │ ├── airportLookup.js │ │ │ │ │ │ │ └── airports.json │ │ │ │ │ │ └── wrapper.html │ │ │ │ │ └── flight-common │ │ │ │ │ │ ├── inject.js │ │ │ │ │ │ ├── wrapper.css │ │ │ │ │ │ └── wrapper.js │ │ │ │ └── miniwob │ │ │ │ │ ├── bisect-angle.html │ │ │ │ │ ├── book-flight-nodelay.html │ │ │ │ │ ├── book-flight.html │ │ │ │ │ ├── chase-circle.html │ │ │ │ │ ├── choose-date-easy.html │ │ │ │ │ ├── choose-date-medium.html │ │ │ │ │ ├── choose-date-nodelay.html │ │ │ │ │ ├── choose-date.html │ │ │ │ │ ├── choose-list.html │ │ │ │ │ ├── circle-center.html │ │ │ │ │ ├── click-button-sequence.html │ │ │ │ │ ├── click-button.html │ │ │ │ │ ├── click-checkboxes-large.html │ │ │ │ │ ├── click-checkboxes-soft.html │ │ │ │ │ ├── click-checkboxes-transfer.html │ │ │ │ │ ├── click-checkboxes.html │ │ │ │ │ ├── click-collapsible-2-nodelay.html │ │ │ │ │ ├── click-collapsible-2.html │ │ │ │ │ ├── click-collapsible-nodelay.html │ │ │ │ │ ├── click-collapsible.html │ │ │ │ │ ├── click-color.html │ │ │ │ │ ├── click-dialog-2.html │ │ │ │ │ ├── click-dialog.html │ │ │ │ │ ├── click-link.html │ │ │ │ │ ├── click-menu-2.html │ │ │ │ │ ├── click-menu.html │ │ │ │ │ ├── click-option.html │ │ │ │ │ ├── click-pie-nodelay.html │ │ │ │ │ ├── click-pie.html │ │ │ │ │ ├── click-scroll-list.html │ │ │ │ │ ├── click-shades.html │ │ │ │ │ ├── click-shape.html │ │ │ │ │ ├── click-tab-2-easy.html │ │ │ │ │ ├── click-tab-2-hard.html │ │ │ │ │ ├── click-tab-2-medium.html │ │ │ │ │ ├── click-tab-2.html │ │ │ │ │ ├── click-tab.html │ │ │ │ │ ├── click-test-2.html │ │ │ │ │ ├── click-test-transfer.html │ │ │ │ │ ├── click-test.html │ │ │ │ │ ├── click-widget.html │ │ │ │ │ ├── copy-paste-2.html │ │ │ │ │ ├── copy-paste.html │ │ │ │ │ ├── count-shape.html │ │ │ │ │ ├── count-sides.html │ │ │ │ │ ├── drag-box.html │ │ │ │ │ ├── drag-cube.html │ │ │ │ │ ├── drag-item.html │ │ │ │ │ ├── drag-items-grid.html │ │ │ │ │ ├── drag-items.html │ │ │ │ │ ├── drag-shapes.html │ │ │ │ │ ├── drag-sort-numbers.html │ │ │ │ │ ├── email-inbox-delete.html │ │ │ │ │ ├── email-inbox-forward-nl-turk.html │ │ │ │ │ ├── email-inbox-forward-nl.html │ │ │ │ │ ├── email-inbox-forward.html │ │ │ │ │ ├── email-inbox-important.html │ │ │ │ │ ├── email-inbox-nl-turk.html │ │ │ │ │ ├── email-inbox-noscroll.html │ │ │ │ │ ├── email-inbox-reply.html │ │ │ │ │ ├── email-inbox-star-reply.html │ │ │ │ │ ├── email-inbox.html │ │ │ │ │ ├── enter-date.html │ │ │ │ │ ├── enter-password.html │ │ │ │ │ ├── enter-text-2.html │ │ │ │ │ ├── enter-text-dynamic.html │ │ │ │ │ ├── enter-text.html │ │ │ │ │ ├── enter-time.html │ │ │ │ │ ├── find-midpoint.html │ │ │ │ │ ├── find-word.html │ │ │ │ │ ├── focus-text-2.html │ │ │ │ │ ├── focus-text.html │ │ │ │ │ ├── grid-coordinate.html │ │ │ │ │ ├── guess-number.html │ │ │ │ │ ├── highlight-text-2.html │ │ │ │ │ ├── highlight-text.html │ │ │ │ │ ├── identify-shape.html │ │ │ │ │ ├── login-user-popup.html │ │ │ │ │ ├── login-user.html │ │ │ │ │ ├── moving-items.html │ │ │ │ │ ├── multi-layouts.html │ │ │ │ │ ├── multi-orderings.html │ │ │ │ │ ├── navigate-tree.html │ │ │ │ │ ├── number-checkboxes.html │ │ │ │ │ ├── read-table-2.html │ │ │ │ │ ├── read-table.html │ │ │ │ │ ├── resize-textarea.html │ │ │ │ │ ├── right-angle.html │ │ │ │ │ ├── scroll-text-2.html │ │ │ │ │ ├── scroll-text.html │ │ │ │ │ ├── search-engine.html │ │ │ │ │ ├── simon-says.html │ │ │ │ │ ├── simple-algebra.html │ │ │ │ │ ├── simple-arithmetic.html │ │ │ │ │ ├── social-media-all.html │ │ │ │ │ ├── social-media-some.html │ │ │ │ │ ├── social-media.html │ │ │ │ │ ├── terminal.html │ │ │ │ │ ├── terminal_reproduce.html │ │ │ │ │ ├── text-editor.html │ │ │ │ │ ├── text-transform.html │ │ │ │ │ ├── tic-tac-toe.html │ │ │ │ │ ├── unicode-test.html │ │ │ │ │ ├── use-autocomplete-nodelay.html │ │ │ │ │ ├── use-autocomplete.html │ │ │ │ │ ├── use-colorwheel-2.html │ │ │ │ │ ├── use-colorwheel.html │ │ │ │ │ ├── use-slider-2.html │ │ │ │ │ ├── use-slider.html │ │ │ │ │ ├── use-spinner.html │ │ │ │ │ └── visual-addition.html │ │ │ │ ├── instance.py │ │ │ │ ├── reward.py │ │ │ │ ├── screenshot.py │ │ │ │ ├── state.py │ │ │ │ └── utils.py │ │ └── setup.py │ ├── llm_agent.py │ ├── main.py │ ├── metrics.py │ ├── miniwob++.sh │ ├── prompt.py │ ├── prompt │ │ ├── action.txt │ │ ├── base.txt │ │ ├── choose-list │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-button-sequence │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-button │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-checkboxes-large │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-checkboxes-soft │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-checkboxes-transfer │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-checkboxes │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-collapsible-2 │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-collapsible │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-dialog-2 │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-dialog │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-menu │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-option │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-scroll-list │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-shades │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-shape │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-tab-2-hard │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-tab-2 │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-tab │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-test │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── click-widget │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── count-shape │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── email-inbox-forward-nl-turk │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── email-inbox-forward-nl │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── email-inbox-nl-turk │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── email-inbox │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── enter-date │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── enter-time │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── example.txt │ │ ├── few-shot.json │ │ ├── first_action.txt │ │ ├── focus-text │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── grid-coordinate │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── check_finish.txt │ │ │ ├── done.txt │ │ │ ├── edit_plan.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── new_plan.txt │ │ │ ├── rci_action.txt │ │ │ ├── rci_answer.txt │ │ │ └── update_action.txt │ │ ├── identify-shape │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── initialize_plan.txt │ │ ├── login-user-popup │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── multi-layouts │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── navigate-tree │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── rci_action.txt │ │ ├── search-engine │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── simple-algebra │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── check_finish.txt │ │ │ ├── done.txt │ │ │ ├── edit_plan.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── new_plan.txt │ │ │ ├── rci_action.txt │ │ │ ├── rci_answer.txt │ │ │ └── update_action.txt │ │ ├── social-media-all │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── social-media-some │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── social-media │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── terminal │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── tic-tac-toe │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ ├── update_action.txt │ │ ├── use-autocomplete │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ │ └── use-spinner │ │ │ ├── action.txt │ │ │ ├── base.txt │ │ │ ├── example.txt │ │ │ ├── first_action.txt │ │ │ ├── initialize_plan.txt │ │ │ ├── rci_action.txt │ │ │ └── update_action.txt │ └── requirements.txt ├── mint-bench │ ├── config_variables.py │ ├── convert_outputs.py │ ├── mint-bench-run.sh │ ├── mint.sh │ └── remove_dups.py ├── mmlu │ ├── evaluate_mmlu.py │ └── mmlu.sh ├── mt-bench │ ├── mt-bench.sh │ └── process_micro_avg.py ├── run_all.sh ├── science-world │ ├── .gitignore │ ├── README.md │ ├── code_actions.py │ ├── data_utils │ │ ├── READMD.md │ │ ├── __init__.py │ │ ├── data_convert.py │ │ ├── data_utils.py │ │ ├── demos.json │ │ └── goldpaths-all.zip │ ├── eval.py │ ├── eval_code_as_action.py │ ├── eval_utils.py │ ├── fast_agent │ │ ├── deepspeed_reqs.txt │ │ ├── ds_train.py │ │ ├── ds_train.sh │ │ └── zero_2_bf16.json │ ├── metrics.py │ ├── prompts │ │ ├── README.md │ │ ├── convert.py │ │ ├── prompt.json │ │ ├── prompt_code_action.json │ │ └── prompt_orig.json │ ├── science-world.sh │ └── slow_agent │ │ ├── local_llm.py │ │ ├── run_gradio.py │ │ └── utils.py ├── serve │ └── serve_ckpt.sh ├── setup_data.sh ├── setup_env.sh └── source.sh ├── models ├── add_chat_format.py └── megatron │ ├── convert_llama.sh │ ├── convert_mistral.sh │ ├── convert_sharded_to_hf.sh │ ├── finetune_4xA100_4tp_mixture_llama.sh │ ├── finetune_4xA100_4tp_mixture_mistral.sh │ ├── shard_model_4tp.sh │ └── source.sh └── slurm ├── configs ├── eval_2xA100.slurm └── finetune_4xA100_4tp.slurm ├── run_4gpu_interactive.sh ├── run_gpu_interactive.sh ├── run_gpu_interactive_A100.sh └── run_megatron_gpu_interactive.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/.gitmodules -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/README.md -------------------------------------------------------------------------------- /docs/DATA_GENERATION.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/docs/DATA_GENERATION.md -------------------------------------------------------------------------------- /docs/EVALUATION.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/docs/EVALUATION.md -------------------------------------------------------------------------------- /docs/KUBERNETES_DEPLOY.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/docs/KUBERNETES_DEPLOY.md -------------------------------------------------------------------------------- /docs/MODEL_TRAINING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/docs/MODEL_TRAINING.md -------------------------------------------------------------------------------- /environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/environment.yml -------------------------------------------------------------------------------- /figures/codeact-comparison-perf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/figures/codeact-comparison-perf.png -------------------------------------------------------------------------------- /figures/codeact-comparison-table.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/figures/codeact-comparison-table.png -------------------------------------------------------------------------------- /figures/data-stats.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/figures/data-stats.png -------------------------------------------------------------------------------- /figures/json-text-comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/figures/json-text-comparison.png -------------------------------------------------------------------------------- /figures/model-performance.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/figures/model-performance.png -------------------------------------------------------------------------------- /figures/overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/figures/overview.png -------------------------------------------------------------------------------- /mint/agents/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/__init__.py -------------------------------------------------------------------------------- /mint/agents/bard_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/bard_agent.py -------------------------------------------------------------------------------- /mint/agents/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/base.py -------------------------------------------------------------------------------- /mint/agents/claude_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/claude_agent.py -------------------------------------------------------------------------------- /mint/agents/claude_feedback_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/claude_feedback_agent.py -------------------------------------------------------------------------------- /mint/agents/openai_feedback_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/openai_feedback_agent.py -------------------------------------------------------------------------------- /mint/agents/openai_lm_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/openai_lm_agent.py -------------------------------------------------------------------------------- /mint/agents/vllm_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/vllm_agent.py -------------------------------------------------------------------------------- /mint/agents/vllm_feedback_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/agents/vllm_feedback_agent.py -------------------------------------------------------------------------------- /mint/configs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mint/configs/config_variables.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/configs/config_variables.py -------------------------------------------------------------------------------- /mint/configs/generate_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/configs/generate_config.py -------------------------------------------------------------------------------- /mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/code_generation/APPS/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/code_generation/APPS/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/algebra/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/algebra/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/geometry/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/geometry/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/hotpotqa/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/hotpotqa/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/prealgebra/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/prealgebra/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/precalculus/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/precalculus/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/strategyqa/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/claude-2/F=None/max5_p2+tool+cd/reasoning/strategyqa/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/code_generation/APPS/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/code_generation/APPS/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/algebra/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/algebra/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/geometry/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/geometry/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/hotpotqa/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/hotpotqa/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/prealgebra/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/prealgebra/train.json -------------------------------------------------------------------------------- /mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/strategyqa/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/data_gen_configs/gpt-4-0613/F=None/max5_p2+tool+cd/reasoning/strategyqa/train.json -------------------------------------------------------------------------------- /mint/datatypes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/datatypes.py -------------------------------------------------------------------------------- /mint/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/envs/__init__.py -------------------------------------------------------------------------------- /mint/envs/alfworld_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/envs/alfworld_env.py -------------------------------------------------------------------------------- /mint/envs/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/envs/base.py -------------------------------------------------------------------------------- /mint/envs/general_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/envs/general_env.py -------------------------------------------------------------------------------- /mint/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/main.py -------------------------------------------------------------------------------- /mint/prompt/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/prompt/__init__.py -------------------------------------------------------------------------------- /mint/prompt/templates/template_feedback_agent.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/prompt/templates/template_feedback_agent.txt -------------------------------------------------------------------------------- /mint/prompt/templates/template_with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/prompt/templates/template_with_tool.txt -------------------------------------------------------------------------------- /mint/prompt/templates/template_without_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/prompt/templates/template_without_tool.txt -------------------------------------------------------------------------------- /mint/tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/__init__.py -------------------------------------------------------------------------------- /mint/tasks/alfworld.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/alfworld.py -------------------------------------------------------------------------------- /mint/tasks/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/base.py -------------------------------------------------------------------------------- /mint/tasks/codegen/APPS/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mint/tasks/codegen/APPS/testing_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/codegen/APPS/testing_util.py -------------------------------------------------------------------------------- /mint/tasks/codegen/APPS/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/codegen/APPS/utils.py -------------------------------------------------------------------------------- /mint/tasks/codegen/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/codegen/__init__.py -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/APPS/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/APPS/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/APPS/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/APPS/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/README.md -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/clean/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/clean/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/clean/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/clean/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/cool/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/cool/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/cool/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/cool/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/examine/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/examine/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/examine/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/examine/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/heat/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/heat/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/heat/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/heat/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/put/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/put/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/put/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/put/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/puttwo/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/puttwo/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/alfworld/puttwo/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/alfworld/puttwo/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/humaneval/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/humaneval/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/humaneval/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/humaneval/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/mbpp/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/mbpp/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/mbpp/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/mbpp/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/reasoning/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/reasoning/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/reasoning/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/reasoning/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/tabular/with_tool.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/tabular/with_tool.txt -------------------------------------------------------------------------------- /mint/tasks/in_context_examples/tabular/with_tool_and_feedback.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/in_context_examples/tabular/with_tool_and_feedback.txt -------------------------------------------------------------------------------- /mint/tasks/reasoning/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/reasoning/__init__.py -------------------------------------------------------------------------------- /mint/tasks/reasoning/grader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/reasoning/grader.py -------------------------------------------------------------------------------- /mint/tasks/reasoning/math_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/reasoning/math_normalize.py -------------------------------------------------------------------------------- /mint/tasks/tabular/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/tabular/__init__.py -------------------------------------------------------------------------------- /mint/tasks/tabular/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tasks/tabular/evaluator.py -------------------------------------------------------------------------------- /mint/tools/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tools/__init__.py -------------------------------------------------------------------------------- /mint/tools/alfworld.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tools/alfworld.py -------------------------------------------------------------------------------- /mint/tools/arxiv_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tools/arxiv_search.py -------------------------------------------------------------------------------- /mint/tools/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tools/base.py -------------------------------------------------------------------------------- /mint/tools/python_tool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tools/python_tool.py -------------------------------------------------------------------------------- /mint/tools/web_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tools/web_search.py -------------------------------------------------------------------------------- /mint/tools/wikipedia_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/tools/wikipedia_search.py -------------------------------------------------------------------------------- /mint/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/utils/__init__.py -------------------------------------------------------------------------------- /mint/utils/exception.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/utils/exception.py -------------------------------------------------------------------------------- /mint/utils/exec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/mint/utils/exec.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/chat/code_execution/Dockerfile.api: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/code_execution/Dockerfile.api -------------------------------------------------------------------------------- /scripts/chat/code_execution/Dockerfile.executor: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/code_execution/Dockerfile.executor -------------------------------------------------------------------------------- /scripts/chat/code_execution/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/code_execution/api.py -------------------------------------------------------------------------------- /scripts/chat/code_execution/jupyter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/code_execution/jupyter.py -------------------------------------------------------------------------------- /scripts/chat/code_execution/start_jupyter_server.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/code_execution/start_jupyter_server.sh -------------------------------------------------------------------------------- /scripts/chat/demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/demo.py -------------------------------------------------------------------------------- /scripts/chat/kubernetes/build_chat_ui_and_push.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/kubernetes/build_chat_ui_and_push.sh -------------------------------------------------------------------------------- /scripts/chat/kubernetes/build_code_execute_api_and_push.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/kubernetes/build_code_execute_api_and_push.sh -------------------------------------------------------------------------------- /scripts/chat/kubernetes/build_code_executor_container_and_push.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/kubernetes/build_code_executor_container_and_push.sh -------------------------------------------------------------------------------- /scripts/chat/kubernetes/k8s.template.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/kubernetes/k8s.template.yml -------------------------------------------------------------------------------- /scripts/chat/run_chat_ui.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/run_chat_ui.sh -------------------------------------------------------------------------------- /scripts/chat/run_chat_ui_debug.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/run_chat_ui_debug.sh -------------------------------------------------------------------------------- /scripts/chat/start_mongodb.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/start_mongodb.sh -------------------------------------------------------------------------------- /scripts/chat/start_vllm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/chat/start_vllm.sh -------------------------------------------------------------------------------- /scripts/data/analyze_dataset.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/analyze_dataset.ipynb -------------------------------------------------------------------------------- /scripts/data/create_hf_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/create_hf_dataset.py -------------------------------------------------------------------------------- /scripts/data/download_from_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/download_from_hf.py -------------------------------------------------------------------------------- /scripts/data/general/process_capybara.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/general/process_capybara.py -------------------------------------------------------------------------------- /scripts/data/general/process_general_traj.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/general/process_general_traj.sh -------------------------------------------------------------------------------- /scripts/data/general/process_openorca.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/general/process_openorca.py -------------------------------------------------------------------------------- /scripts/data/general/process_sharegpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/general/process_sharegpt.py -------------------------------------------------------------------------------- /scripts/data/interaction/collection/convert_outputs.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/collection/convert_outputs.ipynb -------------------------------------------------------------------------------- /scripts/data/interaction/collection/process_trajectories.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/collection/process_trajectories.ipynb -------------------------------------------------------------------------------- /scripts/data/interaction/collection/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/collection/run.sh -------------------------------------------------------------------------------- /scripts/data/interaction/collection/run_mint_docker_interactive.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/collection/run_mint_docker_interactive.sh -------------------------------------------------------------------------------- /scripts/data/interaction/download_raw_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/download_raw_data.sh -------------------------------------------------------------------------------- /scripts/data/interaction/process_APPS.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/process_APPS.py -------------------------------------------------------------------------------- /scripts/data/interaction/process_MATH.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/process_MATH.py -------------------------------------------------------------------------------- /scripts/data/interaction/process_WikiTableQuestions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/process_WikiTableQuestions.py -------------------------------------------------------------------------------- /scripts/data/interaction/process_hotpotQA.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/interaction/process_hotpotQA.py -------------------------------------------------------------------------------- /scripts/data/megatron_conversion/process_mixture_llama.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/megatron_conversion/process_mixture_llama.sh -------------------------------------------------------------------------------- /scripts/data/megatron_conversion/process_mixture_mistral.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/data/megatron_conversion/process_mixture_mistral.sh -------------------------------------------------------------------------------- /scripts/docker/Dockerfile.megatron: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/docker/Dockerfile.megatron -------------------------------------------------------------------------------- /scripts/docker/Dockerfile.mint: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/docker/Dockerfile.mint -------------------------------------------------------------------------------- /scripts/docker/run_megatron_interactive.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/docker/run_megatron_interactive.sh -------------------------------------------------------------------------------- /scripts/docker/run_megatron_interactive_slurm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/docker/run_megatron_interactive_slurm.sh -------------------------------------------------------------------------------- /scripts/eval/aggregate_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/aggregate_eval.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/.gitignore: -------------------------------------------------------------------------------- 1 | prompt\ examples/ 2 | __pycache__/ 3 | .vscode 4 | .DS_Store -------------------------------------------------------------------------------- /scripts/eval/api-bank/API-Bank-arxiv-version.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/API-Bank-arxiv-version.pdf -------------------------------------------------------------------------------- /scripts/eval/api-bank/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/LICENSE -------------------------------------------------------------------------------- /scripts/eval/api-bank/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/README.md -------------------------------------------------------------------------------- /scripts/eval/api-bank/api_bank_analysis.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/api_bank_analysis.ipynb -------------------------------------------------------------------------------- /scripts/eval/api-bank/api_call_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/api_call_extraction.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/__init__.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/add_agenda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/add_agenda.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/add_alarm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/add_alarm.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/add_meeting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/add_meeting.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/add_reminder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/add_reminder.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/add_scene.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/add_scene.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/api.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/appointment_registration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/appointment_registration.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/book_hotel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/book_hotel.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/calculator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/calculator.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/cancel_registration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/cancel_registration.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/cancel_timed_switch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/cancel_timed_switch.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/check_token.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/check_token.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/delete_account.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/delete_account.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/delete_agenda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/delete_agenda.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/delete_alarm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/delete_alarm.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/delete_meeting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/delete_meeting.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/delete_reminder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/delete_reminder.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/delete_scene.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/delete_scene.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/dictionary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/dictionary.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/document_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/document_qa.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/emergency_knowledge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/emergency_knowledge.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/forgot_password.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/forgot_password.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/get_today.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/get_today.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/get_user_token.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/get_user_token.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/image_caption.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/image_caption.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/modify_agenda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/modify_agenda.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/modify_alarm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/modify_alarm.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/modify_meeting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/modify_meeting.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/modify_password.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/modify_password.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/modify_registration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/modify_registration.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/modify_reminder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/modify_reminder.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/modify_scene.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/modify_scene.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/open_bank_account.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/open_bank_account.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/play_music.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/play_music.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_agenda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_agenda.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_alarm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_alarm.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_balance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_balance.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_health_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_health_data.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_history_today.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_history_today.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_meeting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_meeting.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_registration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_registration.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_reminder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_reminder.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_scene.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_scene.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/query_stock.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/query_stock.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/record_health_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/record_health_data.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/register_user.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/register_user.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/search_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/search_engine.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/send_email.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/send_email.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/speech_recognition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/speech_recognition.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/symptom_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/symptom_search.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/timed_switch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/timed_switch.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/tool_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/tool_search.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/translate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/translate.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/apis/wiki.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/apis/wiki.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/data/all_apis.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/data/all_apis.csv -------------------------------------------------------------------------------- /scripts/eval/api-bank/data/exceptions.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/data/exceptions.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/demo.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/evaluator.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/evaluator_by_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/evaluator_by_json.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/figures/multi-agent.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/figures/multi-agent.png -------------------------------------------------------------------------------- /scripts/eval/api-bank/figures/three_ability.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/figures/three_ability.png -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Account.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Account.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Agenda.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Agenda.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Alarm.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Alarm.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Appointments.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Appointments.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Bank.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Bank.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/HealthData.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/HealthData.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/History.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/History.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Hotel.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Hotel.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/ImageCaptioning.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/ImageCaptioning.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Meeting.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Meeting.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/QuestionAnswering.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/QuestionAnswering.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Reminder.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Reminder.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Scenes.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Scenes.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/SearchEngine.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/SearchEngine.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/SpeechRecognition.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/SpeechRecognition.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Stock.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Stock.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Symptom.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Symptom.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/TimeSwitch.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/TimeSwitch.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/init_database/Wiki.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/init_database/Wiki.json -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddAgenda-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddAgenda-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddAgenda-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddAgenda-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddAlarm-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddAlarm-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddMeeting-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddMeeting-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddReminder-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddReminder-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddReminder-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddReminder-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddReminder-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/AddReminder-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-4.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-4.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-5.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/BookHotel-level-1-5.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Calculator-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Calculator-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Calculator-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Calculator-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Calculator-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Calculator-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAccount-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAccount-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAccount-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAccount-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAccount-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAccount-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAgenda-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAgenda-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAlarm-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAlarm-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAlarm-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteAlarm-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteMeeting-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteMeeting-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteReminder-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteReminder-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteScene-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteScene-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteScene-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteScene-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteScene-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DeleteScene-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Dictionary-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Dictionary-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Dictionary-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Dictionary-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Dictionary-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Dictionary-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Dictionary-level-1-4.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Dictionary-level-1-4.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DocumentQA-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DocumentQA-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DocumentQA-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DocumentQA-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DocumentQA-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DocumentQA-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DocumentQA-level-1-4.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/DocumentQA-level-1-4.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ForgotPassword-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ForgotPassword-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetMeeting-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetMeeting-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetMeeting-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetMeeting-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetReminder-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetReminder-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetReminder-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetReminder-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetToday-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetToday-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetToday-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetToday-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetToday-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetToday-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetToday-level-1-4.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/GetToday-level-1-4.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ImageCaption-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ImageCaption-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyAgenda-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyAgenda-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyAgenda-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyAgenda-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyAlarm-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyAlarm-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyAlarm-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyAlarm-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyMeeting-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyMeeting-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyMeeting-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyMeeting-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyMeeting-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyMeeting-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyPassword-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyPassword-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyPassword-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyPassword-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyReminder-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyReminder-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyReminder-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyReminder-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyReminder-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/ModifyReminder-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/PlayMusic-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/PlayMusic-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/PlayMusic-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/PlayMusic-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/PlayMusic-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/PlayMusic-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryAgenda-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryAgenda-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryAlarm-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryAlarm-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryBalance-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryBalance-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryBalance-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryBalance-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryMeeting-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryMeeting-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryReminder-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryReminder-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryReminder-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryReminder-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-4.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-4.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-5.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryScene-level-1-5.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-4.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-4.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-5.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/QueryStock-level-1-5.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/RegisterUser-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/RegisterUser-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/RegisterUser-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/RegisterUser-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/RegisterUser-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/RegisterUser-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SearchEngine-level-1-1.jsonl: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SearchEngine-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SearchEngine-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SendEmail-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SendEmail-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SymptomSearch-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SymptomSearch-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SymptomSearch-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/SymptomSearch-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/TimedSwitch-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/TimedSwitch-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/TimedSwitch-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/TimedSwitch-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/TimedSwitch-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/TimedSwitch-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Translate-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Translate-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Translate-level-1-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Translate-level-1-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Translate-level-1-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Translate-level-1-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Translate-level-1-4.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Translate-level-1-4.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Wiki-level-1-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-1-given-desc/Wiki-level-1-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddAgenda-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddAgenda-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddAgenda-level-3-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddAgenda-level-3-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddAlarm-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddAlarm-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddAlarm-level-3-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddAlarm-level-3-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddMeeting-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddMeeting-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddMeeting-level-3-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddMeeting-level-3-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddReminder-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/AddReminder-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/BookHotel-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/BookHotel-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/BookHotel-level-3-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/BookHotel-level-3-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/BookHotel-level-3-3.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/BookHotel-level-3-3.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/Calculator-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/Calculator-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/Calculator-level-3-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/Calculator-level-3-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/DeleteAgenda-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/DeleteAgenda-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/DeleteAgenda-level-3-2.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/DeleteAgenda-level-3-2.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/DeleteAlarm-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/DeleteAlarm-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/GetToday-level-3-1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv1-lv2-samples/level-2-toolsearcher/GetToday-level-3-1.jsonl -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3-samples/Financial Management.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3-samples/Financial Management.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3-samples/Health Management.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3-samples/Health Management.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3-samples/Hospital.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3-samples/Hospital.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3-samples/Hotel Booking.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3-samples/Hotel Booking.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3-samples/Meeting Schedule.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3-samples/Meeting Schedule.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3-samples/Personal Assistant.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3-samples/Personal Assistant.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3-samples/Reminder.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3-samples/Reminder.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3-samples/Shopping.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3-samples/Shopping.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/account_info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/account_info.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/add_meeting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/add_meeting.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/calculator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/calculator.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/clothing_recommandation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/clothing_recommandation.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/email_reminder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/email_reminder.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/flight_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/flight_search.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/geocoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/geocoding.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/get_occupation_salary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/get_occupation_salary.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/get_weather.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/get_weather.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/hotel_availability.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/hotel_availability.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/like_count.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/like_count.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/movie_recommandation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/movie_recommandation.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/nearby_restaurants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/nearby_restaurants.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/organization_members.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/organization_members.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/query_meeting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/query_meeting.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/tax_calculator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/tax_calculator.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/tool_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/tool_search.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/travel_status.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/travel_status.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/update_account_info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/update_account_info.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/user_posts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/user_posts.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/user_watched_movies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/user_watched_movies.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_apis/users_movie_preference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_apis/users_movie_preference.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/lv3_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/lv3_evaluator.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/requirements.txt -------------------------------------------------------------------------------- /scripts/eval/api-bank/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/run.sh -------------------------------------------------------------------------------- /scripts/eval/api-bank/simulator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/simulator.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/tool_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/tool_manager.py -------------------------------------------------------------------------------- /scripts/eval/api-bank/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/api-bank/utils.py -------------------------------------------------------------------------------- /scripts/eval/gsm8k/evaluate_gsm8k.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/gsm8k/evaluate_gsm8k.py -------------------------------------------------------------------------------- /scripts/eval/gsm8k/gsm8k.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/gsm8k/gsm8k.sh -------------------------------------------------------------------------------- /scripts/eval/human_eval/HumanEval.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/human_eval/HumanEval.jsonl -------------------------------------------------------------------------------- /scripts/eval/human_eval/evaluate_human_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/human_eval/evaluate_human_eval.py -------------------------------------------------------------------------------- /scripts/eval/human_eval/human_eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/human_eval/human_eval.sh -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/m3tooleval_analysis.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/m3tooleval_analysis.ipynb -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/main.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/run.sh -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/__init__.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/base.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/dna_sequencer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/impl/dna_sequencer.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/message_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/impl/message_decoder.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/trade_calculator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/impl/trade_calculator.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/travel_itinerary_planning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/impl/travel_itinerary_planning.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/web_browsing/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/impl/web_browsing/__init__.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/web_browsing/generate_web_pages.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/impl/web_browsing/generate_web_pages.py -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/web_browsing/metadata.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/impl/web_browsing/metadata.json -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/impl/web_browsing/web_pages.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/impl/web_browsing/web_pages.jsonl -------------------------------------------------------------------------------- /scripts/eval/m3tooleval/tasks/repl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/m3tooleval/tasks/repl.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/.gitignore -------------------------------------------------------------------------------- /scripts/eval/miniwob++/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/LICENSE -------------------------------------------------------------------------------- /scripts/eval/miniwob++/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/README.md -------------------------------------------------------------------------------- /scripts/eval/miniwob++/available_tasks.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/available_tasks.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/.gitignore -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/README.md -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/computergym/__init__.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/base_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/computergym/miniwob/base_env.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/action.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/action.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/fields.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/fields.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/html/.gitignore: -------------------------------------------------------------------------------- 1 | twistd.pid 2 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/html/flight/AA/js/aa/modules/commonsetup.js: -------------------------------------------------------------------------------- 1 | AAcom.modules.commonsetup=function(AAUI){/* NOT NEEDED */}; 2 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/instance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/instance.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/reward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/reward.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/state.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/state.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/computergym/miniwob/miniwob_interface/utils.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/computergym/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/computergym/setup.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/llm_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/llm_agent.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/main.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/metrics.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/miniwob++.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/miniwob++.sh -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt.py -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/choose-list/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/choose-list/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/choose-list/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/choose-list/example.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/choose-list/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/choose-list/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/choose-list/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/choose-list/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/choose-list/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button-sequence/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button-sequence/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-button-sequence/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button-sequence/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-button-sequence/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button-sequence/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button-sequence/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button-sequence/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-button-sequence/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button-sequence/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-button-sequence/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-button/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-button/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-button/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-button/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-button/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-large/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-large/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-large/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-large/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-large/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-large/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-large/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-large/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-large/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-large/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-large/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-soft/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-soft/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-soft/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-soft/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-soft/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-soft/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-soft/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-soft/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-soft/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-soft/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-soft/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-transfer/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-transfer/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-transfer/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-transfer/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-transfer/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-transfer/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-transfer/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-transfer/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-transfer/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes-transfer/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes-transfer/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-checkboxes/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-checkboxes/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible-2/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible-2/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-collapsible-2/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible-2/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-collapsible-2/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible-2/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible-2/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible-2/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-collapsible-2/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible-2/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-collapsible-2/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-collapsible/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-collapsible/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-collapsible/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-collapsible/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-collapsible/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog-2/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog-2/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-dialog-2/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog-2/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-dialog-2/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog-2/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog-2/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog-2/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-dialog-2/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog-2/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-dialog/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-dialog/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-dialog/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-dialog/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-menu/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-menu/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-menu/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-menu/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-menu/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-menu/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-menu/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-menu/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-menu/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-menu/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-option/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-option/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-option/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-option/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-option/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-option/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-option/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-option/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-option/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-option/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-option/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-scroll-list/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-scroll-list/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-scroll-list/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-scroll-list/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-scroll-list/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-scroll-list/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-scroll-list/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-scroll-list/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-scroll-list/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-scroll-list/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-scroll-list/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shades/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shades/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-shades/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shades/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-shades/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shades/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shades/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shades/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-shades/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shades/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-shades/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shape/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shape/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-shape/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shape/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-shape/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shape/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shape/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shape/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-shape/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-shape/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-shape/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2-hard/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2-hard/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab-2-hard/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2-hard/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab-2-hard/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2-hard/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2-hard/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2-hard/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab-2-hard/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2-hard/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab-2-hard/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab-2/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab-2/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab-2/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab-2/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab-2/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-tab/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-tab/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-test/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-test/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-test/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-test/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-test/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-test/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-test/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-test/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-test/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-test/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-test/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-widget/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-widget/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-widget/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-widget/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-widget/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-widget/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-widget/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-widget/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-widget/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/click-widget/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/click-widget/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/count-shape/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/count-shape/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/count-shape/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/count-shape/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/count-shape/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/count-shape/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/count-shape/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/count-shape/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/count-shape/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/count-shape/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/count-shape/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl-turk/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl/action.txt: -------------------------------------------------------------------------------- 1 | the next instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-forward-nl/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-forward-nl/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-forward-nl/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-forward-nl/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-nl-turk/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-nl-turk/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-nl-turk/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-nl-turk/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-nl-turk/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-nl-turk/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-nl-turk/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-nl-turk/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox-nl-turk/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox-nl-turk/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/email-inbox/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/email-inbox/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-date/action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-date/action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-date/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-date/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-date/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-date/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-date/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-date/initialize_plan.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-date/initialize_plan.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-date/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-date/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-date/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-date/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-time/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-time/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-time/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-time/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-time/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-time/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-time/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-time/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/enter-time/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/enter-time/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/example.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/few-shot.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/few-shot.json -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/focus-text/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/focus-text/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/focus-text/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/focus-text/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/focus-text/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/focus-text/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/focus-text/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/focus-text/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/focus-text/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/focus-text/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/grid-coordinate/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/check_finish.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/grid-coordinate/check_finish.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/done.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/grid-coordinate/done.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/edit_plan.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/grid-coordinate/edit_plan.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/grid-coordinate/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/new_plan.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/grid-coordinate/new_plan.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/grid-coordinate/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/rci_answer.txt: -------------------------------------------------------------------------------- 1 | Answer Yes or No. -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/grid-coordinate/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/identify-shape/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/identify-shape/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/identify-shape/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/identify-shape/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/identify-shape/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/identify-shape/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/identify-shape/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/identify-shape/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/identify-shape/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/identify-shape/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/login-user-popup/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/login-user-popup/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/login-user-popup/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/login-user-popup/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/login-user-popup/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/login-user-popup/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/login-user-popup/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/login-user-popup/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/login-user-popup/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/login-user-popup/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/multi-layouts/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/multi-layouts/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/multi-layouts/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/multi-layouts/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/multi-layouts/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/multi-layouts/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/multi-layouts/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/multi-layouts/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/multi-layouts/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/multi-layouts/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/navigate-tree/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/navigate-tree/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/navigate-tree/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/navigate-tree/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/navigate-tree/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/navigate-tree/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/navigate-tree/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/navigate-tree/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/navigate-tree/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/navigate-tree/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/search-engine/action.txt: -------------------------------------------------------------------------------- 1 | the next instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/search-engine/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/search-engine/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/search-engine/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/search-engine/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/search-engine/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/search-engine/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/search-engine/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/search-engine/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/search-engine/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/search-engine/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/action.txt: -------------------------------------------------------------------------------- 1 | the next instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/simple-algebra/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/check_finish.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/simple-algebra/check_finish.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/done.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/simple-algebra/done.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/edit_plan.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/simple-algebra/edit_plan.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/simple-algebra/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/new_plan.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/simple-algebra/new_plan.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/simple-algebra/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/rci_answer.txt: -------------------------------------------------------------------------------- 1 | Answer Yes or No. -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/simple-algebra/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-all/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-all/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media-all/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-all/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media-all/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-all/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-all/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-all/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media-all/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-all/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media-all/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-some/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-some/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media-some/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-some/example.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-some/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-some/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-some/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media-some/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media-some/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/social-media/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/social-media/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/terminal/action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/terminal/action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/terminal/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/terminal/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/terminal/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/terminal/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/terminal/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/terminal/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/terminal/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/terminal/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/terminal/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/terminal/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/tic-tac-toe/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/tic-tac-toe/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/tic-tac-toe/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/tic-tac-toe/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/tic-tac-toe/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/tic-tac-toe/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/tic-tac-toe/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/tic-tac-toe/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/tic-tac-toe/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/tic-tac-toe/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/update_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/update_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-autocomplete/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-autocomplete/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/use-autocomplete/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-autocomplete/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/use-autocomplete/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-autocomplete/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-autocomplete/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-autocomplete/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/use-autocomplete/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-autocomplete/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-spinner/action.txt: -------------------------------------------------------------------------------- 1 | the next proper instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-spinner/base.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/use-spinner/base.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-spinner/example.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/use-spinner/example.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-spinner/first_action.txt: -------------------------------------------------------------------------------- 1 | the first instruction should be ` -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-spinner/initialize_plan.txt: -------------------------------------------------------------------------------- 1 | plan: -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-spinner/rci_action.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/prompt/use-spinner/rci_action.txt -------------------------------------------------------------------------------- /scripts/eval/miniwob++/prompt/use-spinner/update_action.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/miniwob++/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/miniwob++/requirements.txt -------------------------------------------------------------------------------- /scripts/eval/mint-bench/config_variables.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mint-bench/config_variables.py -------------------------------------------------------------------------------- /scripts/eval/mint-bench/convert_outputs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mint-bench/convert_outputs.py -------------------------------------------------------------------------------- /scripts/eval/mint-bench/mint-bench-run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mint-bench/mint-bench-run.sh -------------------------------------------------------------------------------- /scripts/eval/mint-bench/mint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mint-bench/mint.sh -------------------------------------------------------------------------------- /scripts/eval/mint-bench/remove_dups.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mint-bench/remove_dups.py -------------------------------------------------------------------------------- /scripts/eval/mmlu/evaluate_mmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mmlu/evaluate_mmlu.py -------------------------------------------------------------------------------- /scripts/eval/mmlu/mmlu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mmlu/mmlu.sh -------------------------------------------------------------------------------- /scripts/eval/mt-bench/mt-bench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mt-bench/mt-bench.sh -------------------------------------------------------------------------------- /scripts/eval/mt-bench/process_micro_avg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/mt-bench/process_micro_avg.py -------------------------------------------------------------------------------- /scripts/eval/run_all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/run_all.sh -------------------------------------------------------------------------------- /scripts/eval/science-world/.gitignore: -------------------------------------------------------------------------------- 1 | .env 2 | .DS_Store 3 | logs/ 4 | *.pyc 5 | .vscode/ 6 | __pycache__/ -------------------------------------------------------------------------------- /scripts/eval/science-world/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/README.md -------------------------------------------------------------------------------- /scripts/eval/science-world/code_actions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/code_actions.py -------------------------------------------------------------------------------- /scripts/eval/science-world/data_utils/READMD.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/data_utils/READMD.md -------------------------------------------------------------------------------- /scripts/eval/science-world/data_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/eval/science-world/data_utils/data_convert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/data_utils/data_convert.py -------------------------------------------------------------------------------- /scripts/eval/science-world/data_utils/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/data_utils/data_utils.py -------------------------------------------------------------------------------- /scripts/eval/science-world/data_utils/demos.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/data_utils/demos.json -------------------------------------------------------------------------------- /scripts/eval/science-world/data_utils/goldpaths-all.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/data_utils/goldpaths-all.zip -------------------------------------------------------------------------------- /scripts/eval/science-world/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/eval.py -------------------------------------------------------------------------------- /scripts/eval/science-world/eval_code_as_action.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/eval_code_as_action.py -------------------------------------------------------------------------------- /scripts/eval/science-world/eval_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/eval_utils.py -------------------------------------------------------------------------------- /scripts/eval/science-world/fast_agent/deepspeed_reqs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/fast_agent/deepspeed_reqs.txt -------------------------------------------------------------------------------- /scripts/eval/science-world/fast_agent/ds_train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/fast_agent/ds_train.py -------------------------------------------------------------------------------- /scripts/eval/science-world/fast_agent/ds_train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/fast_agent/ds_train.sh -------------------------------------------------------------------------------- /scripts/eval/science-world/fast_agent/zero_2_bf16.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/fast_agent/zero_2_bf16.json -------------------------------------------------------------------------------- /scripts/eval/science-world/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/metrics.py -------------------------------------------------------------------------------- /scripts/eval/science-world/prompts/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/prompts/README.md -------------------------------------------------------------------------------- /scripts/eval/science-world/prompts/convert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/prompts/convert.py -------------------------------------------------------------------------------- /scripts/eval/science-world/prompts/prompt.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/prompts/prompt.json -------------------------------------------------------------------------------- /scripts/eval/science-world/prompts/prompt_code_action.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/prompts/prompt_code_action.json -------------------------------------------------------------------------------- /scripts/eval/science-world/prompts/prompt_orig.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/prompts/prompt_orig.json -------------------------------------------------------------------------------- /scripts/eval/science-world/science-world.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/science-world.sh -------------------------------------------------------------------------------- /scripts/eval/science-world/slow_agent/local_llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/slow_agent/local_llm.py -------------------------------------------------------------------------------- /scripts/eval/science-world/slow_agent/run_gradio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/slow_agent/run_gradio.py -------------------------------------------------------------------------------- /scripts/eval/science-world/slow_agent/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/science-world/slow_agent/utils.py -------------------------------------------------------------------------------- /scripts/eval/serve/serve_ckpt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/serve/serve_ckpt.sh -------------------------------------------------------------------------------- /scripts/eval/setup_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/setup_data.sh -------------------------------------------------------------------------------- /scripts/eval/setup_env.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/setup_env.sh -------------------------------------------------------------------------------- /scripts/eval/source.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/eval/source.sh -------------------------------------------------------------------------------- /scripts/models/add_chat_format.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/models/add_chat_format.py -------------------------------------------------------------------------------- /scripts/models/megatron/convert_llama.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/models/megatron/convert_llama.sh -------------------------------------------------------------------------------- /scripts/models/megatron/convert_mistral.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/models/megatron/convert_mistral.sh -------------------------------------------------------------------------------- /scripts/models/megatron/convert_sharded_to_hf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/models/megatron/convert_sharded_to_hf.sh -------------------------------------------------------------------------------- /scripts/models/megatron/finetune_4xA100_4tp_mixture_llama.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/models/megatron/finetune_4xA100_4tp_mixture_llama.sh -------------------------------------------------------------------------------- /scripts/models/megatron/finetune_4xA100_4tp_mixture_mistral.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/models/megatron/finetune_4xA100_4tp_mixture_mistral.sh -------------------------------------------------------------------------------- /scripts/models/megatron/shard_model_4tp.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/models/megatron/shard_model_4tp.sh -------------------------------------------------------------------------------- /scripts/models/megatron/source.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/models/megatron/source.sh -------------------------------------------------------------------------------- /scripts/slurm/configs/eval_2xA100.slurm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/slurm/configs/eval_2xA100.slurm -------------------------------------------------------------------------------- /scripts/slurm/configs/finetune_4xA100_4tp.slurm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/slurm/configs/finetune_4xA100_4tp.slurm -------------------------------------------------------------------------------- /scripts/slurm/run_4gpu_interactive.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/slurm/run_4gpu_interactive.sh -------------------------------------------------------------------------------- /scripts/slurm/run_gpu_interactive.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/slurm/run_gpu_interactive.sh -------------------------------------------------------------------------------- /scripts/slurm/run_gpu_interactive_A100.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/slurm/run_gpu_interactive_A100.sh -------------------------------------------------------------------------------- /scripts/slurm/run_megatron_gpu_interactive.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xingyaoww/code-act/HEAD/scripts/slurm/run_megatron_gpu_interactive.sh --------------------------------------------------------------------------------