├── .gitignore ├── LICENSE ├── README.md ├── docker └── Dockerfile ├── img ├── method.png └── results.png ├── requirements.txt ├── samples └── samples.jsonl └── src ├── data_generation ├── gen.py ├── question_filtering │ ├── generate_difficulty_score.py │ ├── language_solvability_check.py │ └── vllm_gen.py ├── reward_filtering │ └── rm_score.py ├── run.sh └── vllm_gen.py └── train_question_generator ├── qft_train └── train.py ├── qpo_train ├── dpo.py └── train.py ├── question_optim ├── openai_gen.py ├── optim_difficulty.py ├── optim_solvability.py └── prompts.py └── scripts ├── run_dscode_qft.sh ├── run_dsmath_qft.sh ├── run_qwen2code_qft.sh ├── run_qwen2math_qft.sh └── zero3.yaml /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/README.md -------------------------------------------------------------------------------- /docker/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/docker/Dockerfile -------------------------------------------------------------------------------- /img/method.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/img/method.png -------------------------------------------------------------------------------- /img/results.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/img/results.png -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/requirements.txt -------------------------------------------------------------------------------- /samples/samples.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/samples/samples.jsonl -------------------------------------------------------------------------------- /src/data_generation/gen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/data_generation/gen.py -------------------------------------------------------------------------------- /src/data_generation/question_filtering/generate_difficulty_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/data_generation/question_filtering/generate_difficulty_score.py -------------------------------------------------------------------------------- /src/data_generation/question_filtering/language_solvability_check.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/data_generation/question_filtering/language_solvability_check.py -------------------------------------------------------------------------------- /src/data_generation/question_filtering/vllm_gen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/data_generation/question_filtering/vllm_gen.py -------------------------------------------------------------------------------- /src/data_generation/reward_filtering/rm_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/data_generation/reward_filtering/rm_score.py -------------------------------------------------------------------------------- /src/data_generation/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/data_generation/run.sh -------------------------------------------------------------------------------- /src/data_generation/vllm_gen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/data_generation/vllm_gen.py -------------------------------------------------------------------------------- /src/train_question_generator/qft_train/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/qft_train/train.py -------------------------------------------------------------------------------- /src/train_question_generator/qpo_train/dpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/qpo_train/dpo.py -------------------------------------------------------------------------------- /src/train_question_generator/qpo_train/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/qpo_train/train.py -------------------------------------------------------------------------------- /src/train_question_generator/question_optim/openai_gen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/question_optim/openai_gen.py -------------------------------------------------------------------------------- /src/train_question_generator/question_optim/optim_difficulty.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/question_optim/optim_difficulty.py -------------------------------------------------------------------------------- /src/train_question_generator/question_optim/optim_solvability.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/question_optim/optim_solvability.py -------------------------------------------------------------------------------- /src/train_question_generator/question_optim/prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/question_optim/prompts.py -------------------------------------------------------------------------------- /src/train_question_generator/scripts/run_dscode_qft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/scripts/run_dscode_qft.sh -------------------------------------------------------------------------------- /src/train_question_generator/scripts/run_dsmath_qft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/scripts/run_dsmath_qft.sh -------------------------------------------------------------------------------- /src/train_question_generator/scripts/run_qwen2code_qft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/scripts/run_qwen2code_qft.sh -------------------------------------------------------------------------------- /src/train_question_generator/scripts/run_qwen2math_qft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/scripts/run_qwen2math_qft.sh -------------------------------------------------------------------------------- /src/train_question_generator/scripts/zero3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yyDing1/ScaleQuest/HEAD/src/train_question_generator/scripts/zero3.yaml --------------------------------------------------------------------------------