├── .gitignore ├── README.md └── chs ├── ch10-optimization └── vLLM │ ├── README.md │ ├── main.py │ └── requirements.txt ├── ch11-evaluation └── McNemarTest │ ├── README.md │ ├── main.py │ └── requirements.txt ├── ch2-foundations ├── PreTrain │ ├── README.md │ ├── main.py │ ├── pretrained-bert │ │ ├── config.json │ │ └── vocab.txt │ └── requirements.txt └── Transformer │ ├── README.md │ ├── batch.py │ ├── embed.py │ ├── layers.py │ ├── main.py │ ├── models.py │ ├── process.py │ ├── requirements.txt │ ├── sublayers.py │ └── tokenizer.py ├── ch3-pretrain-data ├── DataProcess │ ├── README.md │ ├── __init__.py │ ├── dedup │ │ ├── __init__.py │ │ ├── dedup_train.py │ │ ├── generate_connected_components.py │ │ ├── generate_duplicate_pairs.py │ │ ├── generate_duplicates_dict.py │ │ └── to_hash.py │ ├── main.ipynb │ ├── main.py │ ├── preprocessing │ │ ├── __init__.py │ │ ├── datasets.py │ │ ├── filter.py │ │ ├── normalize_text.py │ │ └── shuffle_holdout.py │ ├── requirements.txt │ ├── split_dataset.py │ └── utils.py └── Tokenization │ ├── README.md │ ├── main.py │ └── requirements.txt ├── ch4-distributed ├── CollectiveCommunication │ ├── README.md │ ├── all_reduce.py │ └── requirements.txt ├── DeepSpeed │ ├── README.md │ ├── dschat │ │ └── utils │ │ │ ├── data │ │ │ ├── data_utils.py │ │ │ └── raw_datasets.py │ │ │ ├── ds_utils.py │ │ │ ├── model │ │ │ ├── model_utils.py │ │ │ └── reward_model.py │ │ │ ├── module │ │ │ └── lora.py │ │ │ ├── perf.py │ │ │ └── utils.py │ ├── main.py │ ├── requirements.txt │ └── run_llama2_7b.sh ├── DistributedDataParallel │ ├── README.md │ ├── dataset.py │ ├── main.py │ ├── models.py │ └── requirements.txt ├── ModelParallel │ ├── README.md │ ├── pipeline_parallel.py │ ├── requirements.txt │ └── tensor_parallel.py └── ZeRO │ ├── README.md │ ├── optimizer.py │ └── requirements.txt ├── ch5-finetuning ├── DeepSpeedChatSFT │ ├── README.md │ ├── chat.py │ ├── dschat │ │ ├── rlhf │ │ │ ├── ppo_trainer.py │ │ │ └── rlhf_engine.py │ │ └── utils │ │ │ ├── data │ │ │ ├── data_utils.py │ │ │ └── raw_datasets.py │ │ │ ├── ds_utils.py │ │ │ ├── model │ │ │ ├── model_utils.py │ │ │ └── reward_model.py │ │ │ ├── module │ │ │ └── lora.py │ │ │ ├── perf.py │ │ │ └── utils.py │ ├── e2e_rlhf.py │ ├── inference │ │ └── chatbot.py │ ├── main.py │ ├── requirements.txt │ ├── setup.py │ ├── tests │ │ └── test_training.py │ └── training │ │ ├── README.md │ │ ├── step1_supervised_finetuning │ │ ├── README.md │ │ ├── evaluation_scripts │ │ │ └── run_prompt.sh │ │ ├── main.py │ │ ├── prompt_eval.py │ │ └── training_scripts │ │ │ ├── README.md │ │ │ ├── baichuan │ │ │ └── run_baichuan_7b.sh │ │ │ ├── llama2 │ │ │ ├── run_llama2_7b.sh │ │ │ └── run_llama2_7b_lora.sh │ │ │ ├── opt │ │ │ ├── multi_node │ │ │ │ └── run_66b.sh │ │ │ ├── single_gpu │ │ │ │ ├── run_1.3b.sh │ │ │ │ └── run_6.7b_lora.sh │ │ │ └── single_node │ │ │ │ ├── run_1.3b.sh │ │ │ │ ├── run_1.3b_lora.sh │ │ │ │ ├── run_13b.sh │ │ │ │ ├── run_30b_lora.sh │ │ │ │ ├── run_6.7b.sh │ │ │ │ └── sweep │ │ │ │ ├── README.md │ │ │ │ ├── run_single.sh │ │ │ │ └── run_step1_sweep.sh │ │ │ └── other_language │ │ │ ├── run_chinese.sh │ │ │ └── run_japanese.sh │ │ ├── step2_dpo_finetuning │ │ ├── README.md │ │ ├── main.py │ │ └── training_scripts │ │ │ ├── README.md │ │ │ ├── llama2 │ │ │ ├── run_llama2_7b.sh │ │ │ └── run_llama2_7b_lora.sh │ │ │ └── opt │ │ │ ├── multi_node │ │ │ └── run_350m.sh │ │ │ ├── single_gpu │ │ │ └── run_350m.sh │ │ │ └── single_node │ │ │ ├── run_350m.sh │ │ │ └── sweep │ │ │ ├── README.md │ │ │ ├── run_single.sh │ │ │ └── run_step2_sweep.sh │ │ ├── step2_reward_model_finetuning │ │ ├── README.md │ │ ├── evaluation_scripts │ │ │ └── run_eval.sh │ │ ├── main.py │ │ ├── rw_eval.py │ │ └── training_scripts │ │ │ ├── README.md │ │ │ ├── llama2 │ │ │ ├── run_llama2_7b.sh │ │ │ └── run_llama2_7b_lora.sh │ │ │ └── opt │ │ │ ├── multi_node │ │ │ └── run_350m.sh │ │ │ ├── single_gpu │ │ │ └── run_350m.sh │ │ │ └── single_node │ │ │ ├── run_350m.sh │ │ │ └── sweep │ │ │ ├── README.md │ │ │ ├── run_single.sh │ │ │ └── run_step2_sweep.sh │ │ └── step3_rlhf_finetuning │ │ ├── BenckmarkSetting.md │ │ ├── README.md │ │ ├── main.py │ │ └── training_scripts │ │ ├── README.md │ │ ├── llama2 │ │ ├── run_llama2_7b.sh │ │ ├── run_llama2_7b_lora.sh │ │ └── run_llama2_7b_mixz.sh │ │ └── opt │ │ ├── multi_node │ │ └── run_66b.sh │ │ ├── single_gpu │ │ ├── run_1.3b.sh │ │ └── run_6.7b_lora.sh │ │ └── single_node │ │ ├── run_1.3b.sh │ │ ├── run_1.3b_lora.sh │ │ ├── run_13b.sh │ │ ├── run_30b_lora.sh │ │ ├── run_6.7b.sh │ │ └── sweep │ │ ├── README.md │ │ ├── run_single.sh │ │ └── run_step3_sweep.sh └── LoRA │ ├── README.md │ ├── main.py │ └── requirements.txt ├── ch6-rl ├── README.md ├── config │ └── ppo_megatron_trainer.yaml ├── dataset.py ├── requirements.txt └── verl_train_script.sh ├── ch7-multimodal └── MiniGPT-4 │ ├── README.md │ ├── blip2.py │ ├── blip_processor.py │ ├── conversation.py │ ├── eva_vit.py │ ├── icbm_bicycle.png │ ├── llama.py │ ├── main.py │ ├── minigpt4.py │ ├── qformer.py │ └── requirements.txt ├── ch8-agents ├── Debate │ ├── README.md │ ├── main.py │ └── requirements.txt ├── LangChain │ ├── README.md │ ├── callback.py │ ├── chain.py │ ├── data_connection.py │ ├── memory.py │ ├── model_io.py │ ├── rag.py │ └── requirements.txt └── RolePlaying │ ├── README.md │ ├── main.py │ └── requirements.txt └── ch9-rag └── RAG ├── README.md ├── base_rag.py ├── multi_query_rag.py └── requirements.txt /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/README.md -------------------------------------------------------------------------------- /chs/ch10-optimization/vLLM/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch10-optimization/vLLM/README.md -------------------------------------------------------------------------------- /chs/ch10-optimization/vLLM/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch10-optimization/vLLM/main.py -------------------------------------------------------------------------------- /chs/ch10-optimization/vLLM/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | vllm==0.7.2 -------------------------------------------------------------------------------- /chs/ch11-evaluation/McNemarTest/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch11-evaluation/McNemarTest/README.md -------------------------------------------------------------------------------- /chs/ch11-evaluation/McNemarTest/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch11-evaluation/McNemarTest/main.py -------------------------------------------------------------------------------- /chs/ch11-evaluation/McNemarTest/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | mlxtend==0.23.4 3 | numpy==2.2.3 -------------------------------------------------------------------------------- /chs/ch2-foundations/PreTrain/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/PreTrain/README.md -------------------------------------------------------------------------------- /chs/ch2-foundations/PreTrain/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/PreTrain/main.py -------------------------------------------------------------------------------- /chs/ch2-foundations/PreTrain/pretrained-bert/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/PreTrain/pretrained-bert/config.json -------------------------------------------------------------------------------- /chs/ch2-foundations/PreTrain/pretrained-bert/vocab.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/PreTrain/pretrained-bert/vocab.txt -------------------------------------------------------------------------------- /chs/ch2-foundations/PreTrain/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/PreTrain/requirements.txt -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/README.md -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/batch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/batch.py -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/embed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/embed.py -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/layers.py -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/main.py -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/models.py -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/process.py -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/requirements.txt -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/sublayers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/sublayers.py -------------------------------------------------------------------------------- /chs/ch2-foundations/Transformer/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch2-foundations/Transformer/tokenizer.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/README.md -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/dedup/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/dedup/dedup_train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/dedup/dedup_train.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/dedup/generate_connected_components.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/dedup/generate_connected_components.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/dedup/generate_duplicate_pairs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/dedup/generate_duplicate_pairs.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/dedup/generate_duplicates_dict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/dedup/generate_duplicates_dict.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/dedup/to_hash.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/dedup/to_hash.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/main.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/main.ipynb -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/main.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/preprocessing/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/preprocessing/datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/preprocessing/datasets.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/preprocessing/filter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/preprocessing/filter.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/preprocessing/normalize_text.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/preprocessing/normalize_text.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/preprocessing/shuffle_holdout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/preprocessing/shuffle_holdout.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/requirements.txt -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/split_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/split_dataset.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/DataProcess/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/DataProcess/utils.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/Tokenization/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/Tokenization/README.md -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/Tokenization/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch3-pretrain-data/Tokenization/main.py -------------------------------------------------------------------------------- /chs/ch3-pretrain-data/Tokenization/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | torch==2.5.1 3 | transformers==4.45.2 -------------------------------------------------------------------------------- /chs/ch4-distributed/CollectiveCommunication/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/CollectiveCommunication/README.md -------------------------------------------------------------------------------- /chs/ch4-distributed/CollectiveCommunication/all_reduce.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/CollectiveCommunication/all_reduce.py -------------------------------------------------------------------------------- /chs/ch4-distributed/CollectiveCommunication/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | torch==2.6.0+cu118 3 | typing==3.7.4.3 -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/README.md -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/dschat/utils/data/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/dschat/utils/data/data_utils.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/dschat/utils/data/raw_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/dschat/utils/data/raw_datasets.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/dschat/utils/ds_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/dschat/utils/ds_utils.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/dschat/utils/model/model_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/dschat/utils/model/model_utils.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/dschat/utils/model/reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/dschat/utils/model/reward_model.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/dschat/utils/module/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/dschat/utils/module/lora.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/dschat/utils/perf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/dschat/utils/perf.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/dschat/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/dschat/utils/utils.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/main.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/requirements.txt -------------------------------------------------------------------------------- /chs/ch4-distributed/DeepSpeed/run_llama2_7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DeepSpeed/run_llama2_7b.sh -------------------------------------------------------------------------------- /chs/ch4-distributed/DistributedDataParallel/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DistributedDataParallel/README.md -------------------------------------------------------------------------------- /chs/ch4-distributed/DistributedDataParallel/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DistributedDataParallel/dataset.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DistributedDataParallel/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DistributedDataParallel/main.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DistributedDataParallel/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DistributedDataParallel/models.py -------------------------------------------------------------------------------- /chs/ch4-distributed/DistributedDataParallel/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/DistributedDataParallel/requirements.txt -------------------------------------------------------------------------------- /chs/ch4-distributed/ModelParallel/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/ModelParallel/README.md -------------------------------------------------------------------------------- /chs/ch4-distributed/ModelParallel/pipeline_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/ModelParallel/pipeline_parallel.py -------------------------------------------------------------------------------- /chs/ch4-distributed/ModelParallel/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | torch==2.6.0+cu118 -------------------------------------------------------------------------------- /chs/ch4-distributed/ModelParallel/tensor_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/ModelParallel/tensor_parallel.py -------------------------------------------------------------------------------- /chs/ch4-distributed/ZeRO/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/ZeRO/README.md -------------------------------------------------------------------------------- /chs/ch4-distributed/ZeRO/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch4-distributed/ZeRO/optimizer.py -------------------------------------------------------------------------------- /chs/ch4-distributed/ZeRO/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | torch==2.6.0+cu118 -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/chat.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/rlhf/ppo_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/rlhf/ppo_trainer.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/rlhf/rlhf_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/rlhf/rlhf_engine.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/data/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/data/data_utils.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/data/raw_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/data/raw_datasets.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/ds_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/ds_utils.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/model/model_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/model/model_utils.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/model/reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/model/reward_model.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/module/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/module/lora.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/perf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/perf.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/dschat/utils/utils.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/e2e_rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/e2e_rlhf.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/inference/chatbot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/inference/chatbot.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/main.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/requirements.txt -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/setup.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/tests/test_training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/tests/test_training.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/evaluation_scripts/run_prompt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/evaluation_scripts/run_prompt.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/main.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/prompt_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/prompt_eval.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/baichuan/run_baichuan_7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/baichuan/run_baichuan_7b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/llama2/run_llama2_7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/llama2/run_llama2_7b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/llama2/run_llama2_7b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/llama2/run_llama2_7b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/multi_node/run_66b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/multi_node/run_66b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_gpu/run_1.3b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_gpu/run_1.3b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_gpu/run_6.7b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_gpu/run_6.7b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_1.3b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_1.3b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_1.3b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_1.3b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_13b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_13b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_30b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_30b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_6.7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/run_6.7b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/sweep/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/sweep/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/sweep/run_single.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/sweep/run_single.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/sweep/run_step1_sweep.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/opt/single_node/sweep/run_step1_sweep.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/other_language/run_chinese.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/other_language/run_chinese.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/other_language/run_japanese.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step1_supervised_finetuning/training_scripts/other_language/run_japanese.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/main.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/llama2/run_llama2_7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/llama2/run_llama2_7b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/llama2/run_llama2_7b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/llama2/run_llama2_7b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/multi_node/run_350m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/multi_node/run_350m.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_gpu/run_350m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_gpu/run_350m.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_node/run_350m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_node/run_350m.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_node/sweep/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_node/sweep/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_node/sweep/run_single.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_node/sweep/run_single.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_node/sweep/run_step2_sweep.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_dpo_finetuning/training_scripts/opt/single_node/sweep/run_step2_sweep.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/evaluation_scripts/run_eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/evaluation_scripts/run_eval.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/main.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/rw_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/rw_eval.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/llama2/run_llama2_7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/llama2/run_llama2_7b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/llama2/run_llama2_7b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/llama2/run_llama2_7b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/multi_node/run_350m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/multi_node/run_350m.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_gpu/run_350m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_gpu/run_350m.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_node/run_350m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_node/run_350m.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_node/sweep/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_node/sweep/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_node/sweep/run_single.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_node/sweep/run_single.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_node/sweep/run_step2_sweep.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step2_reward_model_finetuning/training_scripts/opt/single_node/sweep/run_step2_sweep.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/BenckmarkSetting.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/BenckmarkSetting.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/main.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/llama2/run_llama2_7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/llama2/run_llama2_7b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/llama2/run_llama2_7b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/llama2/run_llama2_7b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/llama2/run_llama2_7b_mixz.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/llama2/run_llama2_7b_mixz.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/multi_node/run_66b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/multi_node/run_66b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_gpu/run_1.3b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_gpu/run_1.3b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_gpu/run_6.7b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_gpu/run_6.7b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_1.3b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_1.3b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_1.3b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_1.3b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_13b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_13b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_30b_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_30b_lora.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_6.7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/run_6.7b.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/sweep/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/sweep/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/sweep/run_single.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/sweep/run_single.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/sweep/run_step3_sweep.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/DeepSpeedChatSFT/training/step3_rlhf_finetuning/training_scripts/opt/single_node/sweep/run_step3_sweep.sh -------------------------------------------------------------------------------- /chs/ch5-finetuning/LoRA/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/LoRA/README.md -------------------------------------------------------------------------------- /chs/ch5-finetuning/LoRA/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch5-finetuning/LoRA/main.py -------------------------------------------------------------------------------- /chs/ch5-finetuning/LoRA/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | torch==2.6.0 3 | transformers==4.45.2 4 | peft==0.14.0 -------------------------------------------------------------------------------- /chs/ch6-rl/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch6-rl/README.md -------------------------------------------------------------------------------- /chs/ch6-rl/config/ppo_megatron_trainer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch6-rl/config/ppo_megatron_trainer.yaml -------------------------------------------------------------------------------- /chs/ch6-rl/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch6-rl/dataset.py -------------------------------------------------------------------------------- /chs/ch6-rl/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch6-rl/requirements.txt -------------------------------------------------------------------------------- /chs/ch6-rl/verl_train_script.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch6-rl/verl_train_script.sh -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/README.md -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/blip2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/blip2.py -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/blip_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/blip_processor.py -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/conversation.py -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/eva_vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/eva_vit.py -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/icbm_bicycle.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/icbm_bicycle.png -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/llama.py -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/main.py -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/minigpt4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/minigpt4.py -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/qformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/qformer.py -------------------------------------------------------------------------------- /chs/ch7-multimodal/MiniGPT-4/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch7-multimodal/MiniGPT-4/requirements.txt -------------------------------------------------------------------------------- /chs/ch8-agents/Debate/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/Debate/README.md -------------------------------------------------------------------------------- /chs/ch8-agents/Debate/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/Debate/main.py -------------------------------------------------------------------------------- /chs/ch8-agents/Debate/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | openai==1.63.2 -------------------------------------------------------------------------------- /chs/ch8-agents/LangChain/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/LangChain/README.md -------------------------------------------------------------------------------- /chs/ch8-agents/LangChain/callback.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/LangChain/callback.py -------------------------------------------------------------------------------- /chs/ch8-agents/LangChain/chain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/LangChain/chain.py -------------------------------------------------------------------------------- /chs/ch8-agents/LangChain/data_connection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/LangChain/data_connection.py -------------------------------------------------------------------------------- /chs/ch8-agents/LangChain/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/LangChain/memory.py -------------------------------------------------------------------------------- /chs/ch8-agents/LangChain/model_io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/LangChain/model_io.py -------------------------------------------------------------------------------- /chs/ch8-agents/LangChain/rag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/LangChain/rag.py -------------------------------------------------------------------------------- /chs/ch8-agents/LangChain/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/LangChain/requirements.txt -------------------------------------------------------------------------------- /chs/ch8-agents/RolePlaying/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/RolePlaying/README.md -------------------------------------------------------------------------------- /chs/ch8-agents/RolePlaying/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch8-agents/RolePlaying/main.py -------------------------------------------------------------------------------- /chs/ch8-agents/RolePlaying/requirements.txt: -------------------------------------------------------------------------------- 1 | python==3.10.16 2 | 'camel-ai[all]' -------------------------------------------------------------------------------- /chs/ch9-rag/RAG/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch9-rag/RAG/README.md -------------------------------------------------------------------------------- /chs/ch9-rag/RAG/base_rag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch9-rag/RAG/base_rag.py -------------------------------------------------------------------------------- /chs/ch9-rag/RAG/multi_query_rag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch9-rag/RAG/multi_query_rag.py -------------------------------------------------------------------------------- /chs/ch9-rag/RAG/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/intro-llm/intro-llm-code/HEAD/chs/ch9-rag/RAG/requirements.txt --------------------------------------------------------------------------------