├── .gitignore ├── LICENSE ├── README.md ├── assets ├── hf-logo.pdf ├── method.pdf └── overview.png ├── dataset └── transfer_text2token.py ├── demo_dLLM-var.py ├── evaluation ├── accelerate_config.yaml ├── eval_model │ ├── Dream.py │ ├── LLaDA.py │ └── __init__.py ├── evaluation_script.py ├── requirements.txt ├── run_batch.sh ├── run_eval_block_diffusion_no_template.sh ├── run_eval_block_diffusion_template.sh └── utils │ ├── __init__.py │ ├── generate_function.py │ └── utils.py ├── install.sh ├── requirements.txt └── sft_training ├── argsparser ├── __init__.py └── argsparser.py ├── config ├── CONFIG.md ├── accelerate │ ├── config_zero1.yaml │ ├── config_zero2.yaml │ ├── config_zero3.yaml │ ├── fp8_config_zero1.yaml │ ├── fp8_config_zero2.yaml │ ├── fp8_config_zero3.yaml │ └── fp8_fsdp_config.yaml ├── deepspeed │ ├── ds_config_zero2.json │ └── ds_config_zero3.json ├── lora │ └── default_config.yaml └── sft │ └── default_config.yaml ├── data ├── __init__.py ├── dataloader.py └── dataset.py ├── run_training.sh ├── run_training_fp8.sh ├── sft.py ├── trainer ├── __init__.py └── trainer.py └── utils ├── __init__.py ├── lora_builder ├── __init__.py └── lora_builder.py ├── model_loader ├── __init__.py ├── model_loder.py └── transformers_loader.py ├── rl └── __init__.py └── sampling ├── __init__.py └── generate_slow_fast_sampling.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/README.md -------------------------------------------------------------------------------- /assets/hf-logo.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/assets/hf-logo.pdf -------------------------------------------------------------------------------- /assets/method.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/assets/method.pdf -------------------------------------------------------------------------------- /assets/overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/assets/overview.png -------------------------------------------------------------------------------- /dataset/transfer_text2token.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/dataset/transfer_text2token.py -------------------------------------------------------------------------------- /demo_dLLM-var.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/demo_dLLM-var.py -------------------------------------------------------------------------------- /evaluation/accelerate_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/accelerate_config.yaml -------------------------------------------------------------------------------- /evaluation/eval_model/Dream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/eval_model/Dream.py -------------------------------------------------------------------------------- /evaluation/eval_model/LLaDA.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/eval_model/LLaDA.py -------------------------------------------------------------------------------- /evaluation/eval_model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/eval_model/__init__.py -------------------------------------------------------------------------------- /evaluation/evaluation_script.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/evaluation_script.py -------------------------------------------------------------------------------- /evaluation/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/requirements.txt -------------------------------------------------------------------------------- /evaluation/run_batch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/run_batch.sh -------------------------------------------------------------------------------- /evaluation/run_eval_block_diffusion_no_template.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/run_eval_block_diffusion_no_template.sh -------------------------------------------------------------------------------- /evaluation/run_eval_block_diffusion_template.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/run_eval_block_diffusion_template.sh -------------------------------------------------------------------------------- /evaluation/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/utils/__init__.py -------------------------------------------------------------------------------- /evaluation/utils/generate_function.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/utils/generate_function.py -------------------------------------------------------------------------------- /evaluation/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/evaluation/utils/utils.py -------------------------------------------------------------------------------- /install.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/install.sh -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/requirements.txt -------------------------------------------------------------------------------- /sft_training/argsparser/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/argsparser/__init__.py -------------------------------------------------------------------------------- /sft_training/argsparser/argsparser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/argsparser/argsparser.py -------------------------------------------------------------------------------- /sft_training/config/CONFIG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/CONFIG.md -------------------------------------------------------------------------------- /sft_training/config/accelerate/config_zero1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/accelerate/config_zero1.yaml -------------------------------------------------------------------------------- /sft_training/config/accelerate/config_zero2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/accelerate/config_zero2.yaml -------------------------------------------------------------------------------- /sft_training/config/accelerate/config_zero3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/accelerate/config_zero3.yaml -------------------------------------------------------------------------------- /sft_training/config/accelerate/fp8_config_zero1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/accelerate/fp8_config_zero1.yaml -------------------------------------------------------------------------------- /sft_training/config/accelerate/fp8_config_zero2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/accelerate/fp8_config_zero2.yaml -------------------------------------------------------------------------------- /sft_training/config/accelerate/fp8_config_zero3.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/accelerate/fp8_config_zero3.yaml -------------------------------------------------------------------------------- /sft_training/config/accelerate/fp8_fsdp_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/accelerate/fp8_fsdp_config.yaml -------------------------------------------------------------------------------- /sft_training/config/deepspeed/ds_config_zero2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/deepspeed/ds_config_zero2.json -------------------------------------------------------------------------------- /sft_training/config/deepspeed/ds_config_zero3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/deepspeed/ds_config_zero3.json -------------------------------------------------------------------------------- /sft_training/config/lora/default_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/lora/default_config.yaml -------------------------------------------------------------------------------- /sft_training/config/sft/default_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/config/sft/default_config.yaml -------------------------------------------------------------------------------- /sft_training/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/data/__init__.py -------------------------------------------------------------------------------- /sft_training/data/dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/data/dataloader.py -------------------------------------------------------------------------------- /sft_training/data/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/data/dataset.py -------------------------------------------------------------------------------- /sft_training/run_training.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/run_training.sh -------------------------------------------------------------------------------- /sft_training/run_training_fp8.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/run_training_fp8.sh -------------------------------------------------------------------------------- /sft_training/sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/sft.py -------------------------------------------------------------------------------- /sft_training/trainer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/trainer/__init__.py -------------------------------------------------------------------------------- /sft_training/trainer/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/trainer/trainer.py -------------------------------------------------------------------------------- /sft_training/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/__init__.py -------------------------------------------------------------------------------- /sft_training/utils/lora_builder/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/lora_builder/__init__.py -------------------------------------------------------------------------------- /sft_training/utils/lora_builder/lora_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/lora_builder/lora_builder.py -------------------------------------------------------------------------------- /sft_training/utils/model_loader/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/model_loader/__init__.py -------------------------------------------------------------------------------- /sft_training/utils/model_loader/model_loder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/model_loader/model_loder.py -------------------------------------------------------------------------------- /sft_training/utils/model_loader/transformers_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/model_loader/transformers_loader.py -------------------------------------------------------------------------------- /sft_training/utils/rl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/rl/__init__.py -------------------------------------------------------------------------------- /sft_training/utils/sampling/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/sampling/__init__.py -------------------------------------------------------------------------------- /sft_training/utils/sampling/generate_slow_fast_sampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maomaocun/dLLM-Var/HEAD/sft_training/utils/sampling/generate_slow_fast_sampling.py --------------------------------------------------------------------------------