├── README.md ├── dataset_collect ├── README.md ├── evaluate │ ├── __init__.py │ ├── data_processing │ │ ├── answer_extraction.py │ │ └── process_utils.py │ ├── eval_deepseek │ │ ├── eval_script.py │ │ ├── eval_utils.py │ │ ├── ocwcourses_eval_utils.py │ │ ├── python_executor.py │ │ └── utils.py │ ├── evaluate.sh │ └── evaluate_utils │ │ ├── __init__.py │ │ ├── grader.py │ │ └── math_normalize.py ├── gpt_access.py ├── interpolate.py ├── requirements.txt ├── scripts │ ├── gpt_sample.sh │ ├── interpolate.sh │ ├── sample_solution.sh │ └── sgl_model.sh └── tora_sample.py ├── finetune_code ├── LICENSE ├── README.md ├── convert_checkpoint_to_hf.py ├── data_utils │ ├── common_utils.py │ ├── data_utils_rm_pointwise.py │ ├── data_utils_sft.py │ └── tokenizer_utils.py ├── finetune.py ├── finetune_rm.py ├── models │ ├── model.py │ ├── quantize.py │ ├── reward_model.py │ ├── rl_model.py │ ├── rl_trainer.py │ └── tp.py ├── requirements.txt ├── scripts │ ├── convert_hf_checkpoint.py │ └── download.py ├── scripts_aimo │ ├── convert_checkpoint_to_hf.sh │ ├── finetune_policy.sh │ ├── finetune_reward.sh │ └── prepare_deepseek_rl.sh └── training_utils │ ├── checkpoint_hook.py │ ├── fsdp_utils.py │ ├── hf_argparser.py │ ├── memory_efficient_adam.py │ ├── trainer_utils.py │ └── training_args.py ├── finetune_dataset ├── policy_train.json └── reward_train.json ├── image └── CMU_AIMO.png ├── problem_set ├── AIME.json ├── AMC_10.json ├── AMC_12.json └── odyssey.json └── validation_set └── validation.json /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/README.md -------------------------------------------------------------------------------- /dataset_collect/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/README.md -------------------------------------------------------------------------------- /dataset_collect/evaluate/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dataset_collect/evaluate/data_processing/answer_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/data_processing/answer_extraction.py -------------------------------------------------------------------------------- /dataset_collect/evaluate/data_processing/process_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/data_processing/process_utils.py -------------------------------------------------------------------------------- /dataset_collect/evaluate/eval_deepseek/eval_script.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/eval_deepseek/eval_script.py -------------------------------------------------------------------------------- /dataset_collect/evaluate/eval_deepseek/eval_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/eval_deepseek/eval_utils.py -------------------------------------------------------------------------------- /dataset_collect/evaluate/eval_deepseek/ocwcourses_eval_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/eval_deepseek/ocwcourses_eval_utils.py -------------------------------------------------------------------------------- /dataset_collect/evaluate/eval_deepseek/python_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/eval_deepseek/python_executor.py -------------------------------------------------------------------------------- /dataset_collect/evaluate/eval_deepseek/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/eval_deepseek/utils.py -------------------------------------------------------------------------------- /dataset_collect/evaluate/evaluate.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/evaluate.sh -------------------------------------------------------------------------------- /dataset_collect/evaluate/evaluate_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /dataset_collect/evaluate/evaluate_utils/grader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/evaluate_utils/grader.py -------------------------------------------------------------------------------- /dataset_collect/evaluate/evaluate_utils/math_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/evaluate/evaluate_utils/math_normalize.py -------------------------------------------------------------------------------- /dataset_collect/gpt_access.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/gpt_access.py -------------------------------------------------------------------------------- /dataset_collect/interpolate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/interpolate.py -------------------------------------------------------------------------------- /dataset_collect/requirements.txt: -------------------------------------------------------------------------------- 1 | torch 2 | transformers 3 | datasets 4 | openai 5 | sglang -------------------------------------------------------------------------------- /dataset_collect/scripts/gpt_sample.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/scripts/gpt_sample.sh -------------------------------------------------------------------------------- /dataset_collect/scripts/interpolate.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/scripts/interpolate.sh -------------------------------------------------------------------------------- /dataset_collect/scripts/sample_solution.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/scripts/sample_solution.sh -------------------------------------------------------------------------------- /dataset_collect/scripts/sgl_model.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/scripts/sgl_model.sh -------------------------------------------------------------------------------- /dataset_collect/tora_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/dataset_collect/tora_sample.py -------------------------------------------------------------------------------- /finetune_code/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/LICENSE -------------------------------------------------------------------------------- /finetune_code/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/README.md -------------------------------------------------------------------------------- /finetune_code/convert_checkpoint_to_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/convert_checkpoint_to_hf.py -------------------------------------------------------------------------------- /finetune_code/data_utils/common_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/data_utils/common_utils.py -------------------------------------------------------------------------------- /finetune_code/data_utils/data_utils_rm_pointwise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/data_utils/data_utils_rm_pointwise.py -------------------------------------------------------------------------------- /finetune_code/data_utils/data_utils_sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/data_utils/data_utils_sft.py -------------------------------------------------------------------------------- /finetune_code/data_utils/tokenizer_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/data_utils/tokenizer_utils.py -------------------------------------------------------------------------------- /finetune_code/finetune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/finetune.py -------------------------------------------------------------------------------- /finetune_code/finetune_rm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/finetune_rm.py -------------------------------------------------------------------------------- /finetune_code/models/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/models/model.py -------------------------------------------------------------------------------- /finetune_code/models/quantize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/models/quantize.py -------------------------------------------------------------------------------- /finetune_code/models/reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/models/reward_model.py -------------------------------------------------------------------------------- /finetune_code/models/rl_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/models/rl_model.py -------------------------------------------------------------------------------- /finetune_code/models/rl_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/models/rl_trainer.py -------------------------------------------------------------------------------- /finetune_code/models/tp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/models/tp.py -------------------------------------------------------------------------------- /finetune_code/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/requirements.txt -------------------------------------------------------------------------------- /finetune_code/scripts/convert_hf_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/scripts/convert_hf_checkpoint.py -------------------------------------------------------------------------------- /finetune_code/scripts/download.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/scripts/download.py -------------------------------------------------------------------------------- /finetune_code/scripts_aimo/convert_checkpoint_to_hf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/scripts_aimo/convert_checkpoint_to_hf.sh -------------------------------------------------------------------------------- /finetune_code/scripts_aimo/finetune_policy.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/scripts_aimo/finetune_policy.sh -------------------------------------------------------------------------------- /finetune_code/scripts_aimo/finetune_reward.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/scripts_aimo/finetune_reward.sh -------------------------------------------------------------------------------- /finetune_code/scripts_aimo/prepare_deepseek_rl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/scripts_aimo/prepare_deepseek_rl.sh -------------------------------------------------------------------------------- /finetune_code/training_utils/checkpoint_hook.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/training_utils/checkpoint_hook.py -------------------------------------------------------------------------------- /finetune_code/training_utils/fsdp_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/training_utils/fsdp_utils.py -------------------------------------------------------------------------------- /finetune_code/training_utils/hf_argparser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/training_utils/hf_argparser.py -------------------------------------------------------------------------------- /finetune_code/training_utils/memory_efficient_adam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/training_utils/memory_efficient_adam.py -------------------------------------------------------------------------------- /finetune_code/training_utils/trainer_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/training_utils/trainer_utils.py -------------------------------------------------------------------------------- /finetune_code/training_utils/training_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_code/training_utils/training_args.py -------------------------------------------------------------------------------- /finetune_dataset/policy_train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_dataset/policy_train.json -------------------------------------------------------------------------------- /finetune_dataset/reward_train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/finetune_dataset/reward_train.json -------------------------------------------------------------------------------- /image/CMU_AIMO.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/image/CMU_AIMO.png -------------------------------------------------------------------------------- /problem_set/AIME.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/problem_set/AIME.json -------------------------------------------------------------------------------- /problem_set/AMC_10.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/problem_set/AMC_10.json -------------------------------------------------------------------------------- /problem_set/AMC_12.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/problem_set/AMC_12.json -------------------------------------------------------------------------------- /problem_set/odyssey.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/problem_set/odyssey.json -------------------------------------------------------------------------------- /validation_set/validation.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AIMO-CMU-MATH/CMU_MATH-AIMO/HEAD/validation_set/validation.json --------------------------------------------------------------------------------