├── .gitignore ├── LICENSE ├── LLaMA-Factory ├── .dockerignore ├── .gitattributes ├── .gitignore ├── CITATION.cff ├── Dockerfile ├── LICENSE ├── Makefile ├── README.md ├── README_zh.md ├── assets │ ├── benchmark.svg │ ├── logo.png │ └── wechat.jpg ├── data │ └── dataset_info.json ├── docker-compose.yml ├── evaluation │ ├── ceval │ │ ├── ceval.py │ │ ├── ceval.zip │ │ └── mapping.json │ ├── cmmlu │ │ ├── cmmlu.py │ │ ├── cmmlu.zip │ │ └── mapping.json │ └── mmlu │ │ ├── mapping.json │ │ ├── mmlu.py │ │ └── mmlu.zip ├── examples │ ├── README.md │ ├── README_zh.md │ ├── accelerate │ │ ├── fsdp_config.yaml │ │ ├── master_config.yaml │ │ ├── single_config.yaml │ │ └── slave_config.yaml │ ├── deepspeed │ │ ├── ds_z2_config.json │ │ ├── ds_z2_offload_config.json │ │ ├── ds_z3_config.json │ │ └── ds_z3_offload_config.json │ ├── extras │ │ ├── badam │ │ │ └── sft.sh │ │ ├── fsdp_qlora │ │ │ └── sft.sh │ │ ├── galore │ │ │ └── sft.sh │ │ ├── llama_pro │ │ │ ├── expand.sh │ │ │ └── sft.sh │ │ ├── loraplus │ │ │ └── sft.sh │ │ └── mod │ │ │ └── sft.sh │ ├── full_multi_gpu │ │ ├── multi_node.sh │ │ ├── predict.sh │ │ └── single_node.sh │ ├── inference │ │ ├── api_demo.sh │ │ ├── cli_demo.sh │ │ ├── evaluate.sh │ │ └── web_demo.sh │ ├── lora_multi_gpu │ │ ├── ds_zero3.sh │ │ ├── multi_node.sh │ │ └── single_node.sh │ ├── lora_single_gpu │ │ ├── dpo.sh │ │ ├── orpo.sh │ │ ├── ppo.sh │ │ ├── predict.sh │ │ ├── prepare.sh │ │ ├── pretrain.sh │ │ ├── reward.sh │ │ ├── sft.sh │ │ └── sft_mllm.sh │ ├── merge_lora │ │ ├── merge.sh │ │ └── quantize.sh │ └── qlora_single_gpu │ │ ├── aqlm.sh │ │ ├── awq.sh │ │ ├── bitsandbytes.sh │ │ └── gptq.sh ├── pyproject.toml ├── requirements.txt ├── run_dpo_om.sh ├── scripts │ ├── cal_flops.py │ ├── cal_lr.py │ ├── length_cdf.py │ ├── llama_pro.py │ ├── llamafy_baichuan2.py │ ├── llamafy_qwen.py │ └── loftq_init.py ├── setup.py ├── src │ ├── api_demo.py │ ├── cli_demo.py │ ├── evaluate.py │ ├── export_model.py │ ├── llmtuner │ │ ├── __init__.py │ │ ├── api │ │ │ ├── __init__.py │ │ │ ├── app.py │ │ │ └── protocol.py │ │ ├── chat │ │ │ ├── __init__.py │ │ │ ├── base_engine.py │ │ │ ├── chat_model.py │ │ │ ├── hf_engine.py │ │ │ └── vllm_engine.py │ │ ├── data │ │ │ ├── __init__.py │ │ │ ├── aligner.py │ │ │ ├── collator.py │ │ │ ├── formatter.py │ │ │ ├── loader.py │ │ │ ├── parser.py │ │ │ ├── preprocess.py │ │ │ ├── template.py │ │ │ └── utils.py │ │ ├── eval │ │ │ ├── __init__.py │ │ │ ├── evaluator.py │ │ │ └── template.py │ │ ├── extras │ │ │ ├── __init__.py │ │ │ ├── callbacks.py │ │ │ ├── constants.py │ │ │ ├── logging.py │ │ │ ├── misc.py │ │ │ ├── packages.py │ │ │ └── ploting.py │ │ ├── hparams │ │ │ ├── __init__.py │ │ │ ├── data_args.py │ │ │ ├── evaluation_args.py │ │ │ ├── finetuning_args.py │ │ │ ├── generating_args.py │ │ │ ├── model_args.py │ │ │ └── parser.py │ │ ├── model │ │ │ ├── __init__.py │ │ │ ├── adapter.py │ │ │ ├── loader.py │ │ │ ├── patcher.py │ │ │ └── utils │ │ │ │ ├── __init__.py │ │ │ │ ├── attention.py │ │ │ │ ├── checkpointing.py │ │ │ │ ├── embedding.py │ │ │ │ ├── longlora.py │ │ │ │ ├── misc.py │ │ │ │ ├── mod.py │ │ │ │ ├── moe.py │ │ │ │ ├── quantization.py │ │ │ │ ├── rope.py │ │ │ │ ├── unsloth.py │ │ │ │ └── visual.py │ │ ├── train │ │ │ ├── __init__.py │ │ │ ├── dpo │ │ │ │ ├── __init__.py │ │ │ │ ├── trainer.py │ │ │ │ └── workflow.py │ │ │ ├── optimizers.py │ │ │ ├── orpo │ │ │ │ ├── __init__.py │ │ │ │ ├── trainer.py │ │ │ │ └── workflow.py │ │ │ ├── ppo │ │ │ │ ├── __init__.py │ │ │ │ ├── trainer.py │ │ │ │ ├── utils.py │ │ │ │ └── workflow.py │ │ │ ├── pt │ │ │ │ ├── __init__.py │ │ │ │ ├── trainer.py │ │ │ │ └── workflow.py │ │ │ ├── rm │ │ │ │ ├── __init__.py │ │ │ │ ├── metric.py │ │ │ │ ├── trainer.py │ │ │ │ └── workflow.py │ │ │ ├── sft │ │ │ │ ├── __init__.py │ │ │ │ ├── metric.py │ │ │ │ ├── trainer.py │ │ │ │ └── workflow.py │ │ │ ├── tuner.py │ │ │ └── utils.py │ │ └── webui │ │ │ ├── __init__.py │ │ │ ├── chatter.py │ │ │ ├── common.py │ │ │ ├── components │ │ │ ├── __init__.py │ │ │ ├── chatbot.py │ │ │ ├── data.py │ │ │ ├── eval.py │ │ │ ├── export.py │ │ │ ├── infer.py │ │ │ ├── top.py │ │ │ └── train.py │ │ │ ├── css.py │ │ │ ├── engine.py │ │ │ ├── interface.py │ │ │ ├── locales.py │ │ │ ├── manager.py │ │ │ ├── runner.py │ │ │ └── utils.py │ ├── train_bash.py │ ├── train_web.py │ └── web_demo.py ├── tests │ ├── test_throughput.py │ └── test_toolcall.py └── wandb │ ├── latest-run │ ├── files │ │ ├── conda-environment.yaml │ │ └── wandb-metadata.json │ └── run-a3tc9o7r.wandb │ ├── offline-run-20240428_174351-fyjche3m │ ├── files │ │ ├── conda-environment.yaml │ │ └── wandb-metadata.json │ └── run-fyjche3m.wandb │ ├── offline-run-20240428_174832-f9xe0v01 │ ├── files │ │ ├── conda-environment.yaml │ │ ├── wandb-metadata.json │ │ └── wandb-summary.json │ └── run-f9xe0v01.wandb │ └── offline-run-20240428_175713-a3tc9o7r │ ├── files │ ├── conda-environment.yaml │ └── wandb-metadata.json │ └── run-a3tc9o7r.wandb ├── README.md ├── assets ├── main.jpg └── online_merging_arxiv_review.pdf ├── online_merging ├── __init__.py └── optimizers.py ├── requirements.txt └── setup.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LICENSE -------------------------------------------------------------------------------- /LLaMA-Factory/.dockerignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/.dockerignore -------------------------------------------------------------------------------- /LLaMA-Factory/.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/.gitattributes -------------------------------------------------------------------------------- /LLaMA-Factory/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/.gitignore -------------------------------------------------------------------------------- /LLaMA-Factory/CITATION.cff: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/CITATION.cff -------------------------------------------------------------------------------- /LLaMA-Factory/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/Dockerfile -------------------------------------------------------------------------------- /LLaMA-Factory/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/LICENSE -------------------------------------------------------------------------------- /LLaMA-Factory/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/Makefile -------------------------------------------------------------------------------- /LLaMA-Factory/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/README.md -------------------------------------------------------------------------------- /LLaMA-Factory/README_zh.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/README_zh.md -------------------------------------------------------------------------------- /LLaMA-Factory/assets/benchmark.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/assets/benchmark.svg -------------------------------------------------------------------------------- /LLaMA-Factory/assets/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/assets/logo.png -------------------------------------------------------------------------------- /LLaMA-Factory/assets/wechat.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/assets/wechat.jpg -------------------------------------------------------------------------------- /LLaMA-Factory/data/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/data/dataset_info.json -------------------------------------------------------------------------------- /LLaMA-Factory/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/docker-compose.yml -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/ceval/ceval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/ceval/ceval.py -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/ceval/ceval.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/ceval/ceval.zip -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/ceval/mapping.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/ceval/mapping.json -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/cmmlu/cmmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/cmmlu/cmmlu.py -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/cmmlu/cmmlu.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/cmmlu/cmmlu.zip -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/cmmlu/mapping.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/cmmlu/mapping.json -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/mmlu/mapping.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/mmlu/mapping.json -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/mmlu/mmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/mmlu/mmlu.py -------------------------------------------------------------------------------- /LLaMA-Factory/evaluation/mmlu/mmlu.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/evaluation/mmlu/mmlu.zip -------------------------------------------------------------------------------- /LLaMA-Factory/examples/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/README.md -------------------------------------------------------------------------------- /LLaMA-Factory/examples/README_zh.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/README_zh.md -------------------------------------------------------------------------------- /LLaMA-Factory/examples/accelerate/fsdp_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/accelerate/fsdp_config.yaml -------------------------------------------------------------------------------- /LLaMA-Factory/examples/accelerate/master_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/accelerate/master_config.yaml -------------------------------------------------------------------------------- /LLaMA-Factory/examples/accelerate/single_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/accelerate/single_config.yaml -------------------------------------------------------------------------------- /LLaMA-Factory/examples/accelerate/slave_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/accelerate/slave_config.yaml -------------------------------------------------------------------------------- /LLaMA-Factory/examples/deepspeed/ds_z2_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/deepspeed/ds_z2_config.json -------------------------------------------------------------------------------- /LLaMA-Factory/examples/deepspeed/ds_z2_offload_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/deepspeed/ds_z2_offload_config.json -------------------------------------------------------------------------------- /LLaMA-Factory/examples/deepspeed/ds_z3_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/deepspeed/ds_z3_config.json -------------------------------------------------------------------------------- /LLaMA-Factory/examples/deepspeed/ds_z3_offload_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/deepspeed/ds_z3_offload_config.json -------------------------------------------------------------------------------- /LLaMA-Factory/examples/extras/badam/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/extras/badam/sft.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/extras/fsdp_qlora/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/extras/fsdp_qlora/sft.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/extras/galore/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/extras/galore/sft.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/extras/llama_pro/expand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/extras/llama_pro/expand.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/extras/llama_pro/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/extras/llama_pro/sft.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/extras/loraplus/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/extras/loraplus/sft.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/extras/mod/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/extras/mod/sft.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/full_multi_gpu/multi_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/full_multi_gpu/multi_node.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/full_multi_gpu/predict.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/full_multi_gpu/predict.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/full_multi_gpu/single_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/full_multi_gpu/single_node.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/inference/api_demo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/inference/api_demo.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/inference/cli_demo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/inference/cli_demo.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/inference/evaluate.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/inference/evaluate.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/inference/web_demo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/inference/web_demo.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_multi_gpu/ds_zero3.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_multi_gpu/ds_zero3.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_multi_gpu/multi_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_multi_gpu/multi_node.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_multi_gpu/single_node.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_multi_gpu/single_node.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/dpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/dpo.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/orpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/orpo.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/ppo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/ppo.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/predict.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/predict.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/prepare.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/prepare.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/pretrain.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/pretrain.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/reward.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/reward.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/sft.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/lora_single_gpu/sft_mllm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/lora_single_gpu/sft_mllm.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/merge_lora/merge.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/merge_lora/merge.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/merge_lora/quantize.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/merge_lora/quantize.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/qlora_single_gpu/aqlm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/qlora_single_gpu/aqlm.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/qlora_single_gpu/awq.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/qlora_single_gpu/awq.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/qlora_single_gpu/bitsandbytes.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/qlora_single_gpu/bitsandbytes.sh -------------------------------------------------------------------------------- /LLaMA-Factory/examples/qlora_single_gpu/gptq.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/examples/qlora_single_gpu/gptq.sh -------------------------------------------------------------------------------- /LLaMA-Factory/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/pyproject.toml -------------------------------------------------------------------------------- /LLaMA-Factory/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/requirements.txt -------------------------------------------------------------------------------- /LLaMA-Factory/run_dpo_om.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/run_dpo_om.sh -------------------------------------------------------------------------------- /LLaMA-Factory/scripts/cal_flops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/scripts/cal_flops.py -------------------------------------------------------------------------------- /LLaMA-Factory/scripts/cal_lr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/scripts/cal_lr.py -------------------------------------------------------------------------------- /LLaMA-Factory/scripts/length_cdf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/scripts/length_cdf.py -------------------------------------------------------------------------------- /LLaMA-Factory/scripts/llama_pro.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/scripts/llama_pro.py -------------------------------------------------------------------------------- /LLaMA-Factory/scripts/llamafy_baichuan2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/scripts/llamafy_baichuan2.py -------------------------------------------------------------------------------- /LLaMA-Factory/scripts/llamafy_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/scripts/llamafy_qwen.py -------------------------------------------------------------------------------- /LLaMA-Factory/scripts/loftq_init.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/scripts/loftq_init.py -------------------------------------------------------------------------------- /LLaMA-Factory/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/setup.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/api_demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/api_demo.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/cli_demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/cli_demo.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/evaluate.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/export_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/export_model.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/api/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/api/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/api/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/api/app.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/api/protocol.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/api/protocol.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/chat/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/chat/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/chat/base_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/chat/base_engine.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/chat/chat_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/chat/chat_model.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/chat/hf_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/chat/hf_engine.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/chat/vllm_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/chat/vllm_engine.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/aligner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/aligner.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/collator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/collator.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/formatter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/formatter.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/loader.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/parser.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/preprocess.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/template.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/data/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/data/utils.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/eval/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/eval/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/eval/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/eval/evaluator.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/eval/template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/eval/template.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/extras/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/extras/callbacks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/extras/callbacks.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/extras/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/extras/constants.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/extras/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/extras/logging.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/extras/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/extras/misc.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/extras/packages.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/extras/packages.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/extras/ploting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/extras/ploting.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/hparams/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/hparams/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/hparams/data_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/hparams/data_args.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/hparams/evaluation_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/hparams/evaluation_args.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/hparams/finetuning_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/hparams/finetuning_args.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/hparams/generating_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/hparams/generating_args.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/hparams/model_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/hparams/model_args.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/hparams/parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/hparams/parser.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/adapter.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/loader.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/patcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/patcher.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/attention.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/checkpointing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/checkpointing.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/embedding.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/longlora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/longlora.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/misc.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/mod.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/mod.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/moe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/moe.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/quantization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/quantization.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/rope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/rope.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/unsloth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/unsloth.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/model/utils/visual.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/model/utils/visual.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/dpo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/dpo/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/dpo/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/dpo/trainer.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/dpo/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/dpo/workflow.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/optimizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/optimizers.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/orpo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/orpo/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/orpo/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/orpo/trainer.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/orpo/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/orpo/workflow.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/ppo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/ppo/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/ppo/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/ppo/trainer.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/ppo/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/ppo/utils.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/ppo/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/ppo/workflow.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/pt/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/pt/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/pt/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/pt/trainer.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/pt/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/pt/workflow.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/rm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/rm/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/rm/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/rm/metric.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/rm/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/rm/trainer.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/rm/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/rm/workflow.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/sft/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/sft/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/sft/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/sft/metric.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/sft/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/sft/trainer.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/sft/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/sft/workflow.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/tuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/tuner.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/train/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/train/utils.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/chatter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/chatter.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/common.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/components/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/components/__init__.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/components/chatbot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/components/chatbot.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/components/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/components/data.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/components/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/components/eval.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/components/export.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/components/export.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/components/infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/components/infer.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/components/top.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/components/top.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/components/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/components/train.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/css.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/css.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/engine.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/interface.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/locales.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/locales.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/manager.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/runner.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/llmtuner/webui/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/llmtuner/webui/utils.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/train_bash.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/train_bash.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/train_web.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/train_web.py -------------------------------------------------------------------------------- /LLaMA-Factory/src/web_demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/src/web_demo.py -------------------------------------------------------------------------------- /LLaMA-Factory/tests/test_throughput.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/tests/test_throughput.py -------------------------------------------------------------------------------- /LLaMA-Factory/tests/test_toolcall.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/tests/test_toolcall.py -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/latest-run/files/conda-environment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/latest-run/files/conda-environment.yaml -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/latest-run/files/wandb-metadata.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/latest-run/files/wandb-metadata.json -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/latest-run/run-a3tc9o7r.wandb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/latest-run/run-a3tc9o7r.wandb -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_174351-fyjche3m/files/conda-environment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_174351-fyjche3m/files/conda-environment.yaml -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_174351-fyjche3m/files/wandb-metadata.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_174351-fyjche3m/files/wandb-metadata.json -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_174351-fyjche3m/run-fyjche3m.wandb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_174351-fyjche3m/run-fyjche3m.wandb -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_174832-f9xe0v01/files/conda-environment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_174832-f9xe0v01/files/conda-environment.yaml -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_174832-f9xe0v01/files/wandb-metadata.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_174832-f9xe0v01/files/wandb-metadata.json -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_174832-f9xe0v01/files/wandb-summary.json: -------------------------------------------------------------------------------- 1 | {"_wandb": {"runtime": 11}} -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_174832-f9xe0v01/run-f9xe0v01.wandb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_174832-f9xe0v01/run-f9xe0v01.wandb -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_175713-a3tc9o7r/files/conda-environment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_175713-a3tc9o7r/files/conda-environment.yaml -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_175713-a3tc9o7r/files/wandb-metadata.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_175713-a3tc9o7r/files/wandb-metadata.json -------------------------------------------------------------------------------- /LLaMA-Factory/wandb/offline-run-20240428_175713-a3tc9o7r/run-a3tc9o7r.wandb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/LLaMA-Factory/wandb/offline-run-20240428_175713-a3tc9o7r/run-a3tc9o7r.wandb -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/README.md -------------------------------------------------------------------------------- /assets/main.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/assets/main.jpg -------------------------------------------------------------------------------- /assets/online_merging_arxiv_review.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/assets/online_merging_arxiv_review.pdf -------------------------------------------------------------------------------- /online_merging/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/online_merging/__init__.py -------------------------------------------------------------------------------- /online_merging/optimizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/online_merging/optimizers.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | torch==2.2.0 2 | -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/QwenLM/online_merging_optimizers/HEAD/setup.py --------------------------------------------------------------------------------