├── .gitignore ├── .pre-commit-config.yaml ├── LICENSE ├── README.md ├── configs ├── accelerate_config_ddp.yaml ├── accelerate_config_zero1.4node.yaml ├── accelerate_config_zero1.8node.yaml ├── accelerate_config_zero1.yaml ├── accelerate_config_zero2.8node.yaml ├── accelerate_config_zero2.yaml ├── accelerate_config_zero3.16node.yaml ├── accelerate_config_zero3.8node.yaml └── accelerate_config_zero3.yaml ├── converter └── gptq_converter.py ├── data └── example.jsonl ├── mdx ├── README.md ├── dataset_dolly_oasst.sh ├── dataset_gpt4_self_inst_ja.sh ├── dataset_jaster.sh ├── dataset_jaster_dolly_oasst.sh ├── train_full_multi_node.sh ├── train_full_multi_node_gradient_checkpointing.sh ├── train_full_single_node.sh ├── train_full_single_node_gradient_checkpointing.sh ├── train_peft_multi_gpu.sh ├── train_peft_multi_gpu_gradient_checkpointing.sh ├── train_peft_multi_node.sh ├── train_peft_single_gpu.sh └── train_peft_single_gpu_gradient_checkpointing.sh ├── requirements.in ├── requirements.txt └── train.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/.gitignore -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/README.md -------------------------------------------------------------------------------- /configs/accelerate_config_ddp.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_ddp.yaml -------------------------------------------------------------------------------- /configs/accelerate_config_zero1.4node.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_zero1.4node.yaml -------------------------------------------------------------------------------- /configs/accelerate_config_zero1.8node.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_zero1.8node.yaml -------------------------------------------------------------------------------- /configs/accelerate_config_zero1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_zero1.yaml -------------------------------------------------------------------------------- /configs/accelerate_config_zero2.8node.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_zero2.8node.yaml -------------------------------------------------------------------------------- /configs/accelerate_config_zero2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_zero2.yaml -------------------------------------------------------------------------------- /configs/accelerate_config_zero3.16node.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_zero3.16node.yaml -------------------------------------------------------------------------------- /configs/accelerate_config_zero3.8node.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_zero3.8node.yaml -------------------------------------------------------------------------------- /configs/accelerate_config_zero3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/configs/accelerate_config_zero3.yaml -------------------------------------------------------------------------------- /converter/gptq_converter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/converter/gptq_converter.py -------------------------------------------------------------------------------- /data/example.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/data/example.jsonl -------------------------------------------------------------------------------- /mdx/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/README.md -------------------------------------------------------------------------------- /mdx/dataset_dolly_oasst.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/dataset_dolly_oasst.sh -------------------------------------------------------------------------------- /mdx/dataset_gpt4_self_inst_ja.sh: -------------------------------------------------------------------------------- 1 | #!/bin/sh 2 | echo $1/gpt4_self_inst_ja.json 3 | -------------------------------------------------------------------------------- /mdx/dataset_jaster.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/dataset_jaster.sh -------------------------------------------------------------------------------- /mdx/dataset_jaster_dolly_oasst.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/dataset_jaster_dolly_oasst.sh -------------------------------------------------------------------------------- /mdx/train_full_multi_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_full_multi_node.sh -------------------------------------------------------------------------------- /mdx/train_full_multi_node_gradient_checkpointing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_full_multi_node_gradient_checkpointing.sh -------------------------------------------------------------------------------- /mdx/train_full_single_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_full_single_node.sh -------------------------------------------------------------------------------- /mdx/train_full_single_node_gradient_checkpointing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_full_single_node_gradient_checkpointing.sh -------------------------------------------------------------------------------- /mdx/train_peft_multi_gpu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_peft_multi_gpu.sh -------------------------------------------------------------------------------- /mdx/train_peft_multi_gpu_gradient_checkpointing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_peft_multi_gpu_gradient_checkpointing.sh -------------------------------------------------------------------------------- /mdx/train_peft_multi_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_peft_multi_node.sh -------------------------------------------------------------------------------- /mdx/train_peft_single_gpu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_peft_single_gpu.sh -------------------------------------------------------------------------------- /mdx/train_peft_single_gpu_gradient_checkpointing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/mdx/train_peft_single_gpu_gradient_checkpointing.sh -------------------------------------------------------------------------------- /requirements.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/requirements.in -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/requirements.txt -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/llm-jp/llm-jp-sft/HEAD/train.py --------------------------------------------------------------------------------