├── .gitignore ├── LICENSE ├── README.md ├── _eval ├── [24_07_05]dfurman_qwen2_hf_leaderboard.zsh └── setup.zsh ├── _merge └── LazyMergekit_HermesBagel_34B_v0.1.ipynb ├── _peft ├── calme │ ├── v1 │ │ ├── [24_09_23]basic_usage.ipynb │ │ ├── [24_09_23]merge_and_upload.ipynb │ │ ├── [24_09_23]train_calme_78b_orpo.py │ │ └── train_setup.zsh │ └── v2 │ │ ├── [24_09_23]basic_usage.ipynb │ │ ├── [24_09_23]merge_and_upload.ipynb │ │ ├── [24_09_23]train_calme_78b_orpo.py │ │ └── train_setup.zsh ├── falcon │ ├── peft_falcon_180b_instruct.py │ └── postprocessing_falcon_180b_instruct.ipynb ├── llama-2 │ ├── peft_Llama_2_13B_Instruct_v0_2.ipynb │ ├── peft_Llama_2_70B_Instruct_v0_1.py │ └── postprocessing_Llama_2_70B_Instruct_v0_1.ipynb ├── llama-3 │ ├── [24_04_25]llama_3_70b_orpo.py │ ├── [24_04_25]llama_3_8b_orpo.ipynb │ └── [24_04_26]llama_3_8b_orpo.py ├── mistral │ ├── peft_Mistral_7B_Instruct_v0_1.ipynb │ └── peft_Mistral_7B_Instruct_v0_2.ipynb ├── mixtral │ ├── basic_usage_Mixtral_8x7B_Instruct_v0_1.ipynb │ └── peft_Mixtral_8x7B_Instruct_v0_1.py └── qwen-2 │ ├── [24_07_03]train_qwen_2_72b_orpo.py │ ├── [24_07_05]basic_usage.ipynb │ ├── [24_07_05]merge_and_upload.ipynb │ └── train_setup.zsh ├── _quantize ├── mlx_bnb_4bit_quantize.ipynb └── mlx_inference_example.ipynb ├── _sft ├── assets │ └── mid_training_GPU_usage.png ├── phi-2 │ └── sft_phi_2_base_v0_1.ipynb └── text-classification │ └── imdb │ ├── [24_03_27]text_classification_deberta_large_v02_imdb.ipynb │ └── [24_03_30]text_classification_deberta_xxl_v01_boilerplate.ipynb └── requirements.txt /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/README.md -------------------------------------------------------------------------------- /_eval/[24_07_05]dfurman_qwen2_hf_leaderboard.zsh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_eval/[24_07_05]dfurman_qwen2_hf_leaderboard.zsh -------------------------------------------------------------------------------- /_eval/setup.zsh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_eval/setup.zsh -------------------------------------------------------------------------------- /_merge/LazyMergekit_HermesBagel_34B_v0.1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_merge/LazyMergekit_HermesBagel_34B_v0.1.ipynb -------------------------------------------------------------------------------- /_peft/calme/v1/[24_09_23]basic_usage.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/calme/v1/[24_09_23]basic_usage.ipynb -------------------------------------------------------------------------------- /_peft/calme/v1/[24_09_23]merge_and_upload.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/calme/v1/[24_09_23]merge_and_upload.ipynb -------------------------------------------------------------------------------- /_peft/calme/v1/[24_09_23]train_calme_78b_orpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/calme/v1/[24_09_23]train_calme_78b_orpo.py -------------------------------------------------------------------------------- /_peft/calme/v1/train_setup.zsh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/calme/v1/train_setup.zsh -------------------------------------------------------------------------------- /_peft/calme/v2/[24_09_23]basic_usage.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/calme/v2/[24_09_23]basic_usage.ipynb -------------------------------------------------------------------------------- /_peft/calme/v2/[24_09_23]merge_and_upload.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/calme/v2/[24_09_23]merge_and_upload.ipynb -------------------------------------------------------------------------------- /_peft/calme/v2/[24_09_23]train_calme_78b_orpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/calme/v2/[24_09_23]train_calme_78b_orpo.py -------------------------------------------------------------------------------- /_peft/calme/v2/train_setup.zsh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/calme/v2/train_setup.zsh -------------------------------------------------------------------------------- /_peft/falcon/peft_falcon_180b_instruct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/falcon/peft_falcon_180b_instruct.py -------------------------------------------------------------------------------- /_peft/falcon/postprocessing_falcon_180b_instruct.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/falcon/postprocessing_falcon_180b_instruct.ipynb -------------------------------------------------------------------------------- /_peft/llama-2/peft_Llama_2_13B_Instruct_v0_2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/llama-2/peft_Llama_2_13B_Instruct_v0_2.ipynb -------------------------------------------------------------------------------- /_peft/llama-2/peft_Llama_2_70B_Instruct_v0_1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/llama-2/peft_Llama_2_70B_Instruct_v0_1.py -------------------------------------------------------------------------------- /_peft/llama-2/postprocessing_Llama_2_70B_Instruct_v0_1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/llama-2/postprocessing_Llama_2_70B_Instruct_v0_1.ipynb -------------------------------------------------------------------------------- /_peft/llama-3/[24_04_25]llama_3_70b_orpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/llama-3/[24_04_25]llama_3_70b_orpo.py -------------------------------------------------------------------------------- /_peft/llama-3/[24_04_25]llama_3_8b_orpo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/llama-3/[24_04_25]llama_3_8b_orpo.ipynb -------------------------------------------------------------------------------- /_peft/llama-3/[24_04_26]llama_3_8b_orpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/llama-3/[24_04_26]llama_3_8b_orpo.py -------------------------------------------------------------------------------- /_peft/mistral/peft_Mistral_7B_Instruct_v0_1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/mistral/peft_Mistral_7B_Instruct_v0_1.ipynb -------------------------------------------------------------------------------- /_peft/mistral/peft_Mistral_7B_Instruct_v0_2.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/mistral/peft_Mistral_7B_Instruct_v0_2.ipynb -------------------------------------------------------------------------------- /_peft/mixtral/basic_usage_Mixtral_8x7B_Instruct_v0_1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/mixtral/basic_usage_Mixtral_8x7B_Instruct_v0_1.ipynb -------------------------------------------------------------------------------- /_peft/mixtral/peft_Mixtral_8x7B_Instruct_v0_1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/mixtral/peft_Mixtral_8x7B_Instruct_v0_1.py -------------------------------------------------------------------------------- /_peft/qwen-2/[24_07_03]train_qwen_2_72b_orpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/qwen-2/[24_07_03]train_qwen_2_72b_orpo.py -------------------------------------------------------------------------------- /_peft/qwen-2/[24_07_05]basic_usage.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/qwen-2/[24_07_05]basic_usage.ipynb -------------------------------------------------------------------------------- /_peft/qwen-2/[24_07_05]merge_and_upload.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/qwen-2/[24_07_05]merge_and_upload.ipynb -------------------------------------------------------------------------------- /_peft/qwen-2/train_setup.zsh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_peft/qwen-2/train_setup.zsh -------------------------------------------------------------------------------- /_quantize/mlx_bnb_4bit_quantize.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_quantize/mlx_bnb_4bit_quantize.ipynb -------------------------------------------------------------------------------- /_quantize/mlx_inference_example.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_quantize/mlx_inference_example.ipynb -------------------------------------------------------------------------------- /_sft/assets/mid_training_GPU_usage.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_sft/assets/mid_training_GPU_usage.png -------------------------------------------------------------------------------- /_sft/phi-2/sft_phi_2_base_v0_1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_sft/phi-2/sft_phi_2_base_v0_1.ipynb -------------------------------------------------------------------------------- /_sft/text-classification/imdb/[24_03_27]text_classification_deberta_large_v02_imdb.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_sft/text-classification/imdb/[24_03_27]text_classification_deberta_large_v02_imdb.ipynb -------------------------------------------------------------------------------- /_sft/text-classification/imdb/[24_03_30]text_classification_deberta_xxl_v01_boilerplate.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/_sft/text-classification/imdb/[24_03_30]text_classification_deberta_xxl_v01_boilerplate.ipynb -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/daniel-furman/sft-demos/HEAD/requirements.txt --------------------------------------------------------------------------------