├── .gitignore ├── README.md ├── accelerate_configs ├── deepspeed_zero2.yaml ├── deepspeed_zero3.yaml ├── fsdp.yaml └── multi_gpu.yaml ├── eval ├── alpacaeval │ └── alpaca_eval.json ├── api_request_parallel_processor.py ├── build_evaluation.py ├── evol-instruct │ └── evol_inst_eval.json ├── grading.py ├── reference_answer.py ├── run.sh └── ultrafeedback │ └── ultrafeedback_eval.json ├── generate ├── generate.py ├── generate_humaneval.py ├── generate_vllm.py ├── generate_vllm_vlm.py └── reformat.py ├── setup.cfg ├── setup.py ├── src ├── alignment │ ├── __init__.py │ ├── configs.py │ ├── data.py │ ├── decontaminate.py │ ├── model_utils.py │ └── release.py ├── distillm_trainer.py ├── run_distillm.py ├── run_distivlm.py └── run_sft.py ├── training_configs ├── deepseek-coder-1.3b-distillm2.yaml ├── deepseek-coder-1.3b-sft.yaml ├── qwen2.5-1.5b-distillm2.yaml ├── qwen2.5-1.5b-sft.yaml └── vlm.yaml └── utils ├── merging.py └── resize_embedding.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/README.md -------------------------------------------------------------------------------- /accelerate_configs/deepspeed_zero2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/accelerate_configs/deepspeed_zero2.yaml -------------------------------------------------------------------------------- /accelerate_configs/deepspeed_zero3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/accelerate_configs/deepspeed_zero3.yaml -------------------------------------------------------------------------------- /accelerate_configs/fsdp.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/accelerate_configs/fsdp.yaml -------------------------------------------------------------------------------- /accelerate_configs/multi_gpu.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/accelerate_configs/multi_gpu.yaml -------------------------------------------------------------------------------- /eval/alpacaeval/alpaca_eval.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/eval/alpacaeval/alpaca_eval.json -------------------------------------------------------------------------------- /eval/api_request_parallel_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/eval/api_request_parallel_processor.py -------------------------------------------------------------------------------- /eval/build_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/eval/build_evaluation.py -------------------------------------------------------------------------------- /eval/evol-instruct/evol_inst_eval.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/eval/evol-instruct/evol_inst_eval.json -------------------------------------------------------------------------------- /eval/grading.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/eval/grading.py -------------------------------------------------------------------------------- /eval/reference_answer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/eval/reference_answer.py -------------------------------------------------------------------------------- /eval/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/eval/run.sh -------------------------------------------------------------------------------- /eval/ultrafeedback/ultrafeedback_eval.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/eval/ultrafeedback/ultrafeedback_eval.json -------------------------------------------------------------------------------- /generate/generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/generate/generate.py -------------------------------------------------------------------------------- /generate/generate_humaneval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/generate/generate_humaneval.py -------------------------------------------------------------------------------- /generate/generate_vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/generate/generate_vllm.py -------------------------------------------------------------------------------- /generate/generate_vllm_vlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/generate/generate_vllm_vlm.py -------------------------------------------------------------------------------- /generate/reformat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/generate/reformat.py -------------------------------------------------------------------------------- /setup.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/setup.cfg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/setup.py -------------------------------------------------------------------------------- /src/alignment/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/alignment/__init__.py -------------------------------------------------------------------------------- /src/alignment/configs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/alignment/configs.py -------------------------------------------------------------------------------- /src/alignment/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/alignment/data.py -------------------------------------------------------------------------------- /src/alignment/decontaminate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/alignment/decontaminate.py -------------------------------------------------------------------------------- /src/alignment/model_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/alignment/model_utils.py -------------------------------------------------------------------------------- /src/alignment/release.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/alignment/release.py -------------------------------------------------------------------------------- /src/distillm_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/distillm_trainer.py -------------------------------------------------------------------------------- /src/run_distillm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/run_distillm.py -------------------------------------------------------------------------------- /src/run_distivlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/run_distivlm.py -------------------------------------------------------------------------------- /src/run_sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/src/run_sft.py -------------------------------------------------------------------------------- /training_configs/deepseek-coder-1.3b-distillm2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/training_configs/deepseek-coder-1.3b-distillm2.yaml -------------------------------------------------------------------------------- /training_configs/deepseek-coder-1.3b-sft.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/training_configs/deepseek-coder-1.3b-sft.yaml -------------------------------------------------------------------------------- /training_configs/qwen2.5-1.5b-distillm2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/training_configs/qwen2.5-1.5b-distillm2.yaml -------------------------------------------------------------------------------- /training_configs/qwen2.5-1.5b-sft.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/training_configs/qwen2.5-1.5b-sft.yaml -------------------------------------------------------------------------------- /training_configs/vlm.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/training_configs/vlm.yaml -------------------------------------------------------------------------------- /utils/merging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/utils/merging.py -------------------------------------------------------------------------------- /utils/resize_embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jongwooko/distillm-2/HEAD/utils/resize_embedding.py --------------------------------------------------------------------------------