├── .gitignore ├── README.md ├── __init__.py ├── assets ├── aime_fewshot.jsonl ├── cipher_fewshot.jsonl ├── cn_exam_step_fewshot.jsonl └── math_fewstep_fewshot.jsonl ├── components.py ├── data ├── aime │ └── input │ │ └── aime_random_300.jsonl └── arrowmaze │ └── input │ └── arrowmaze.jsonl ├── figs ├── fastmcts_new_01.png ├── intro_fig_cn_01.png ├── mcts_v2_2018-II-3 └── mcts_v2_2018-II-3.png ├── requirements.txt ├── task_configs ├── fastmcts │ └── aime.py └── rejection_sampling │ └── arrowmaze.py ├── tools ├── process_tree_data_to_dpo.py ├── serialize_tree_data_to_sft.py ├── test_server.py └── visualize.py ├── training_scripts ├── dpo_example.sh ├── dpo_train_qwen_base.py ├── dpo_trainer.py ├── ds_config_zero2.json ├── ds_config_zero3.json ├── ds_config_zero3_trl_fix.json ├── finetune_example.sh ├── finetune_qwen_base.py └── finetune_qwen_instruct.py └── utils ├── __init__.py ├── eval_func.py ├── prompt_func.py ├── score_visualize.py └── tree.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/README.md -------------------------------------------------------------------------------- /__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assets/aime_fewshot.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/assets/aime_fewshot.jsonl -------------------------------------------------------------------------------- /assets/cipher_fewshot.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/assets/cipher_fewshot.jsonl -------------------------------------------------------------------------------- /assets/cn_exam_step_fewshot.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/assets/cn_exam_step_fewshot.jsonl -------------------------------------------------------------------------------- /assets/math_fewstep_fewshot.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/assets/math_fewstep_fewshot.jsonl -------------------------------------------------------------------------------- /components.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/components.py -------------------------------------------------------------------------------- /data/aime/input/aime_random_300.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/data/aime/input/aime_random_300.jsonl -------------------------------------------------------------------------------- /data/arrowmaze/input/arrowmaze.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/data/arrowmaze/input/arrowmaze.jsonl -------------------------------------------------------------------------------- /figs/fastmcts_new_01.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/figs/fastmcts_new_01.png -------------------------------------------------------------------------------- /figs/intro_fig_cn_01.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/figs/intro_fig_cn_01.png -------------------------------------------------------------------------------- /figs/mcts_v2_2018-II-3: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/figs/mcts_v2_2018-II-3 -------------------------------------------------------------------------------- /figs/mcts_v2_2018-II-3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/figs/mcts_v2_2018-II-3.png -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/requirements.txt -------------------------------------------------------------------------------- /task_configs/fastmcts/aime.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/task_configs/fastmcts/aime.py -------------------------------------------------------------------------------- /task_configs/rejection_sampling/arrowmaze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/task_configs/rejection_sampling/arrowmaze.py -------------------------------------------------------------------------------- /tools/process_tree_data_to_dpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/tools/process_tree_data_to_dpo.py -------------------------------------------------------------------------------- /tools/serialize_tree_data_to_sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/tools/serialize_tree_data_to_sft.py -------------------------------------------------------------------------------- /tools/test_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/tools/test_server.py -------------------------------------------------------------------------------- /tools/visualize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/tools/visualize.py -------------------------------------------------------------------------------- /training_scripts/dpo_example.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/dpo_example.sh -------------------------------------------------------------------------------- /training_scripts/dpo_train_qwen_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/dpo_train_qwen_base.py -------------------------------------------------------------------------------- /training_scripts/dpo_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/dpo_trainer.py -------------------------------------------------------------------------------- /training_scripts/ds_config_zero2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/ds_config_zero2.json -------------------------------------------------------------------------------- /training_scripts/ds_config_zero3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/ds_config_zero3.json -------------------------------------------------------------------------------- /training_scripts/ds_config_zero3_trl_fix.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/ds_config_zero3_trl_fix.json -------------------------------------------------------------------------------- /training_scripts/finetune_example.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/finetune_example.sh -------------------------------------------------------------------------------- /training_scripts/finetune_qwen_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/finetune_qwen_base.py -------------------------------------------------------------------------------- /training_scripts/finetune_qwen_instruct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/training_scripts/finetune_qwen_instruct.py -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /utils/eval_func.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/utils/eval_func.py -------------------------------------------------------------------------------- /utils/prompt_func.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/utils/prompt_func.py -------------------------------------------------------------------------------- /utils/score_visualize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/utils/score_visualize.py -------------------------------------------------------------------------------- /utils/tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FlyingDutchman26/FastMCTS/HEAD/utils/tree.py --------------------------------------------------------------------------------