├── LICENSE ├── README.md ├── examples └── talk_like_a_pirate │ ├── README.md │ └── pirate.yaml ├── grpo ├── README.md ├── assets │ └── wandb.png ├── cloud.yaml ├── gsm8k.yaml ├── gsm8k_grpo.py └── stats.py ├── lambda ├── configs │ ├── llama-3_1-405b-fft.yaml │ ├── llama-3_1-405b-qlora.yaml │ ├── llama-3_1-70b-fft.yaml │ └── llama-3_1-8b.yaml ├── setup.sh └── train.sh └── prm ├── README.md ├── bon.py ├── bon_qwen1.5B-instruct_n=16_results.txt ├── bon_qwen1.5B-instruct_n=1_results.txt ├── eval_process_bench.py └── prm.yaml /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # axolotl-cookbook -------------------------------------------------------------------------------- /examples/talk_like_a_pirate/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/examples/talk_like_a_pirate/README.md -------------------------------------------------------------------------------- /examples/talk_like_a_pirate/pirate.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/examples/talk_like_a_pirate/pirate.yaml -------------------------------------------------------------------------------- /grpo/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/grpo/README.md -------------------------------------------------------------------------------- /grpo/assets/wandb.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/grpo/assets/wandb.png -------------------------------------------------------------------------------- /grpo/cloud.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/grpo/cloud.yaml -------------------------------------------------------------------------------- /grpo/gsm8k.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/grpo/gsm8k.yaml -------------------------------------------------------------------------------- /grpo/gsm8k_grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/grpo/gsm8k_grpo.py -------------------------------------------------------------------------------- /grpo/stats.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/grpo/stats.py -------------------------------------------------------------------------------- /lambda/configs/llama-3_1-405b-fft.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/lambda/configs/llama-3_1-405b-fft.yaml -------------------------------------------------------------------------------- /lambda/configs/llama-3_1-405b-qlora.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/lambda/configs/llama-3_1-405b-qlora.yaml -------------------------------------------------------------------------------- /lambda/configs/llama-3_1-70b-fft.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/lambda/configs/llama-3_1-70b-fft.yaml -------------------------------------------------------------------------------- /lambda/configs/llama-3_1-8b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/lambda/configs/llama-3_1-8b.yaml -------------------------------------------------------------------------------- /lambda/setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/lambda/setup.sh -------------------------------------------------------------------------------- /lambda/train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/lambda/train.sh -------------------------------------------------------------------------------- /prm/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/prm/README.md -------------------------------------------------------------------------------- /prm/bon.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/prm/bon.py -------------------------------------------------------------------------------- /prm/bon_qwen1.5B-instruct_n=16_results.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/prm/bon_qwen1.5B-instruct_n=16_results.txt -------------------------------------------------------------------------------- /prm/bon_qwen1.5B-instruct_n=1_results.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/prm/bon_qwen1.5B-instruct_n=1_results.txt -------------------------------------------------------------------------------- /prm/eval_process_bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/prm/eval_process_bench.py -------------------------------------------------------------------------------- /prm/prm.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/axolotl-ai-cloud/axolotl-cookbook/HEAD/prm/prm.yaml --------------------------------------------------------------------------------