├── .gitignore
├── LICENSE
├── README.md
├── requirements.txt
├── tools
    ├── download_data
    │   └── download_cft_data_hf.py
    ├── evaluate_gpqa
    │   ├── __init__.py
    │   ├── code_utils.py
    │   ├── compute_accuracy.py
    │   ├── data_loader.py
    │   ├── dataset
    │   │   ├── bbh
    │   │   │   ├── bbh.json
    │   │   │   └── template.json
    │   │   ├── gpqa
    │   │   │   ├── gpqa.jsonl
    │   │   │   ├── gpqa_diamond.jsonl
    │   │   │   ├── gpqa_experts.jsonl
    │   │   │   ├── gpqa_extended.jsonl
    │   │   │   └── gpqa_main.jsonl
    │   │   └── mmlu_pro
    │   │   │   ├── prompt.json
    │   │   │   └── test.json
    │   ├── eval_gpqa.sh
    │   ├── number_utils.py
    │   ├── prompt_utils.py
    │   ├── run_choice.py
    │   ├── run_open.py
    │   ├── run_open_sc.py
    │   ├── scripts
    │   │   └── evaluate_gpqa.sh
    │   └── utils.py
    ├── evaluate_math
    │   ├── LICENSE
    │   ├── data
    │   │   ├── aime24
    │   │   │   └── test.jsonl
    │   │   ├── amc23
    │   │   │   └── test.jsonl
    │   │   ├── gsm8k
    │   │   │   ├── test.jsonl
    │   │   │   └── train.jsonl
    │   │   ├── math-500
    │   │   │   └── test.jsonl
    │   │   ├── math
    │   │   │   ├── test.jsonl
    │   │   │   └── train.jsonl
    │   │   ├── minerva_math
    │   │   │   ├── README.md
    │   │   │   └── test.jsonl
    │   │   ├── olympiadbench
    │   │   │   ├── test.json
    │   │   │   └── test.jsonl
    │   │   └── theoremqa
    │   │   │   ├── test.json
    │   │   │   ├── test.jsonl
    │   │   │   └── trans_format.py
    │   ├── data_loader.py
    │   ├── evaluate.py
    │   ├── examples.py
    │   ├── grader.py
    │   ├── latex2sympy
    │   │   ├── .coveragerc
    │   │   ├── .gitignore
    │   │   ├── LICENSE.txt
    │   │   ├── PS.g4
    │   │   ├── README.md
    │   │   ├── __init__.py
    │   │   ├── antlr-4.11.1-complete.jar
    │   │   ├── asciimath_printer.py
    │   │   ├── description.txt
    │   │   ├── dev-requirements.in
    │   │   ├── dev-requirements.txt
    │   │   ├── gen
    │   │   │   ├── PS.interp
    │   │   │   ├── PS.tokens
    │   │   │   ├── PSLexer.interp
    │   │   │   ├── PSLexer.py
    │   │   │   ├── PSLexer.tokens
    │   │   │   ├── PSListener.py
    │   │   │   ├── PSParser.py
    │   │   │   └── __init__.py
    │   │   ├── icon.png
    │   │   ├── latex2sympy2.py
    │   │   ├── requirements.in
    │   │   ├── requirements.txt
    │   │   ├── sandbox
    │   │   │   ├── linalg_equations.py
    │   │   │   ├── linalg_span.py
    │   │   │   ├── matrix.py
    │   │   │   ├── matrix_placeholders.py
    │   │   │   ├── sandbox.py
    │   │   │   ├── sandbox_equality.py
    │   │   │   ├── sectan.py
    │   │   │   └── vector.py
    │   │   ├── scripts
    │   │   │   ├── compile.sh
    │   │   │   ├── coverage-ci.sh
    │   │   │   ├── coverage.sh
    │   │   │   ├── pre-commit
    │   │   │   ├── pre-push
    │   │   │   ├── publish.sh
    │   │   │   ├── setup-hooks.sh
    │   │   │   ├── setup.sh
    │   │   │   └── test.sh
    │   │   ├── setup.cfg
    │   │   ├── setup.py
    │   │   └── tests
    │   │   │   ├── __init__.py
    │   │   │   ├── abs_test.py
    │   │   │   ├── all_bad_test.py
    │   │   │   ├── all_good_test.py
    │   │   │   ├── atom_expr_test.py
    │   │   │   ├── binomial_test.py
    │   │   │   ├── ceil_test.py
    │   │   │   ├── complex_test.py
    │   │   │   ├── context.py
    │   │   │   ├── exp_test.py
    │   │   │   ├── floor_test.py
    │   │   │   ├── gcd_test.py
    │   │   │   ├── greek_test.py
    │   │   │   ├── grouping_test.py
    │   │   │   ├── lcm_test.py
    │   │   │   ├── left_right_cdot_test.py
    │   │   │   ├── linalg_test.py
    │   │   │   ├── max_test.py
    │   │   │   ├── min_test.py
    │   │   │   ├── mod_test.py
    │   │   │   ├── overline_test.py
    │   │   │   ├── pi_test.py
    │   │   │   ├── trig_test.py
    │   │   │   └── variable_test.py
    │   ├── math_eval.py
    │   ├── math_utils.py
    │   ├── model_utils.py
    │   ├── parser.py
    │   ├── python_executor.py
    │   ├── requirements.txt
    │   ├── rm_maj_eval.py
    │   ├── scripts
    │   │   ├── evaluate_deepseek.sh
    │   │   └── evaluate_qwen.sh
    │   ├── trajectory.py
    │   └── utils.py
    ├── evaluate_mmlu-pro
    │   ├── cot_prompt_lib
    │   │   ├── initial_prompt.txt
    │   │   ├── initial_prompt_1.txt
    │   │   └── initial_prompt_2.txt
    │   ├── evaluate_from_local.py
    │   └── mmlu-pro-eval.sh
    ├── scripts
    │   ├── download_data.sh
    │   └── evaluate.sh
    └── self_construct_critique_data
    │   ├── generate_critique_by_api.py
    │   └── run.sh
└── train
    ├── LLaMA-Factory
        ├── .env.local
        ├── .gitattributes
        ├── .pre-commit-config.yaml
        ├── CITATION.cff
        ├── LICENSE
        ├── MANIFEST.in
        ├── Makefile
        ├── README.md
        ├── README_zh.md
        ├── assets
        │   ├── benchmark.svg
        │   ├── logo.png
        │   ├── wechat.jpg
        │   └── wechat_npu.jpg
        ├── data
        │   ├── README.md
        │   ├── README_zh.md
        │   ├── alpaca_en_demo.json
        │   ├── alpaca_zh_demo.json
        │   ├── belle_multiturn
        │   │   └── belle_multiturn.py
        │   ├── c4_demo.json
        │   ├── dataset_info.json
        │   ├── dpo_en_demo.json
        │   ├── dpo_zh_demo.json
        │   ├── glaive_toolcall_en_demo.json
        │   ├── glaive_toolcall_zh_demo.json
        │   ├── hh_rlhf_en
        │   │   └── hh_rlhf_en.py
        │   ├── identity.json
        │   ├── kto_en_demo.json
        │   ├── mllm_demo.json
        │   ├── mllm_demo_data
        │   │   ├── 1.jpg
        │   │   ├── 1.mp4
        │   │   ├── 2.avi
        │   │   ├── 2.jpg
        │   │   ├── 3.jpg
        │   │   └── 3.mp4
        │   ├── mllm_video_demo.json
        │   ├── ultra_chat
        │   │   └── ultra_chat.py
        │   └── wiki_demo.txt
        ├── docker
        │   ├── docker-cuda
        │   │   ├── Dockerfile
        │   │   └── docker-compose.yml
        │   ├── docker-npu
        │   │   ├── Dockerfile
        │   │   └── docker-compose.yml
        │   └── docker-rocm
        │   │   ├── Dockerfile
        │   │   └── docker-compose.yml
        ├── evaluation
        │   ├── ceval
        │   │   ├── ceval.py
        │   │   ├── ceval.zip
        │   │   └── mapping.json
        │   ├── cmmlu
        │   │   ├── cmmlu.py
        │   │   ├── cmmlu.zip
        │   │   └── mapping.json
        │   └── mmlu
        │   │   ├── mapping.json
        │   │   ├── mmlu.py
        │   │   └── mmlu.zip
        ├── examples
        │   ├── README.md
        │   ├── README_zh.md
        │   ├── accelerate
        │   │   └── fsdp_config.yaml
        │   ├── deepspeed
        │   │   ├── ds_z0_config.json
        │   │   ├── ds_z2_config.json
        │   │   ├── ds_z2_offload_config.json
        │   │   ├── ds_z3_config.json
        │   │   └── ds_z3_offload_config.json
        │   ├── extras
        │   │   ├── adam_mini
        │   │   │   └── qwen2_full_sft.yaml
        │   │   ├── badam
        │   │   │   └── llama3_full_sft.yaml
        │   │   ├── fsdp_qlora
        │   │   │   ├── llama3_lora_sft.yaml
        │   │   │   └── train.sh
        │   │   ├── galore
        │   │   │   └── llama3_full_sft.yaml
        │   │   ├── llama_pro
        │   │   │   ├── expand.sh
        │   │   │   └── llama3_freeze_sft.yaml
        │   │   ├── loraplus
        │   │   │   └── llama3_lora_sft.yaml
        │   │   ├── mod
        │   │   │   └── llama3_full_sft.yaml
        │   │   ├── nlg_eval
        │   │   │   └── llama3_lora_predict.yaml
        │   │   └── pissa
        │   │   │   ├── init.sh
        │   │   │   └── llama3_lora_sft.yaml
        │   ├── inference
        │   │   ├── llama3.yaml
        │   │   ├── llama3_full_sft.yaml
        │   │   ├── llama3_lora_sft.yaml
        │   │   ├── llama3_vllm.yaml
        │   │   ├── llava1_5.yaml
        │   │   └── qwen2_vl.yaml
        │   ├── merge_lora
        │   │   ├── llama3_gptq.yaml
        │   │   ├── llama3_lora_sft.yaml
        │   │   └── qwen2vl_lora_sft.yaml
        │   ├── train_full
        │   │   ├── llama3_full_sft.yaml
        │   │   └── qwen2vl_full_sft.yaml
        │   ├── train_lora
        │   │   ├── llama3_lora_dpo.yaml
        │   │   ├── llama3_lora_eval.yaml
        │   │   ├── llama3_lora_kto.yaml
        │   │   ├── llama3_lora_ppo.yaml
        │   │   ├── llama3_lora_pretrain.yaml
        │   │   ├── llama3_lora_reward.yaml
        │   │   ├── llama3_lora_sft.yaml
        │   │   ├── llama3_lora_sft_ds3.yaml
        │   │   ├── llama3_preprocess.yaml
        │   │   ├── llava1_5_lora_sft.yaml
        │   │   ├── qwen2vl_lora_dpo.yaml
        │   │   └── qwen2vl_lora_sft.yaml
        │   └── train_qlora
        │   │   ├── llama3_lora_sft_aqlm.yaml
        │   │   ├── llama3_lora_sft_awq.yaml
        │   │   ├── llama3_lora_sft_gptq.yaml
        │   │   └── llama3_lora_sft_otfq.yaml
        ├── pyproject.toml
        ├── requirements.txt
        ├── scripts
        │   ├── api_example
        │   │   ├── test_image.py
        │   │   └── test_toolcall.py
        │   ├── convert_ckpt
        │   │   ├── llamafy_baichuan2.py
        │   │   └── llamafy_qwen.py
        │   ├── llama_pro.py
        │   ├── loftq_init.py
        │   ├── pissa_init.py
        │   ├── stat_utils
        │   │   ├── cal_flops.py
        │   │   ├── cal_lr.py
        │   │   ├── cal_mfu.py
        │   │   ├── cal_ppl.py
        │   │   └── length_cdf.py
        │   └── vllm_infer.py
        ├── setup.py
        ├── src
        │   ├── api.py
        │   ├── llamafactory.egg-info
        │   │   ├── PKG-INFO
        │   │   ├── SOURCES.txt
        │   │   ├── dependency_links.txt
        │   │   ├── entry_points.txt
        │   │   ├── requires.txt
        │   │   └── top_level.txt
        │   ├── llamafactory
        │   │   ├── __init__.py
        │   │   ├── __pycache__
        │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   ├── cli.cpython-311.pyc
        │   │   │   └── launcher.cpython-311.pyc
        │   │   ├── api
        │   │   │   ├── __init__.py
        │   │   │   ├── __pycache__
        │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   ├── app.cpython-311.pyc
        │   │   │   │   ├── chat.cpython-311.pyc
        │   │   │   │   ├── common.cpython-311.pyc
        │   │   │   │   └── protocol.cpython-311.pyc
        │   │   │   ├── app.py
        │   │   │   ├── chat.py
        │   │   │   ├── common.py
        │   │   │   └── protocol.py
        │   │   ├── chat
        │   │   │   ├── __init__.py
        │   │   │   ├── __pycache__
        │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   ├── base_engine.cpython-311.pyc
        │   │   │   │   ├── chat_model.cpython-311.pyc
        │   │   │   │   ├── hf_engine.cpython-311.pyc
        │   │   │   │   └── vllm_engine.cpython-311.pyc
        │   │   │   ├── base_engine.py
        │   │   │   ├── chat_model.py
        │   │   │   ├── hf_engine.py
        │   │   │   └── vllm_engine.py
        │   │   ├── cli.py
        │   │   ├── eval
        │   │   │   ├── __init__.py
        │   │   │   ├── __pycache__
        │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   ├── evaluator.cpython-311.pyc
        │   │   │   │   └── template.cpython-311.pyc
        │   │   │   ├── evaluator.py
        │   │   │   └── template.py
        │   │   ├── extras
        │   │   │   ├── __init__.py
        │   │   │   ├── __pycache__
        │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   ├── constants.cpython-311.pyc
        │   │   │   │   ├── env.cpython-311.pyc
        │   │   │   │   ├── logging.cpython-311.pyc
        │   │   │   │   ├── misc.cpython-311.pyc
        │   │   │   │   ├── packages.cpython-311.pyc
        │   │   │   │   └── ploting.cpython-311.pyc
        │   │   │   ├── constants.py
        │   │   │   ├── env.py
        │   │   │   ├── logging.py
        │   │   │   ├── misc.py
        │   │   │   ├── packages.py
        │   │   │   └── ploting.py
        │   │   ├── hparams
        │   │   │   ├── __init__.py
        │   │   │   ├── __pycache__
        │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   ├── data_args.cpython-311.pyc
        │   │   │   │   ├── evaluation_args.cpython-311.pyc
        │   │   │   │   ├── finetuning_args.cpython-311.pyc
        │   │   │   │   ├── generating_args.cpython-311.pyc
        │   │   │   │   ├── model_args.cpython-311.pyc
        │   │   │   │   └── parser.cpython-311.pyc
        │   │   │   ├── data_args.py
        │   │   │   ├── evaluation_args.py
        │   │   │   ├── finetuning_args.py
        │   │   │   ├── generating_args.py
        │   │   │   ├── model_args.py
        │   │   │   └── parser.py
        │   │   ├── launcher.py
        │   │   ├── model
        │   │   │   ├── __init__.py
        │   │   │   ├── __pycache__
        │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   ├── adapter.cpython-311.pyc
        │   │   │   │   ├── loader.cpython-311.pyc
        │   │   │   │   └── patcher.cpython-311.pyc
        │   │   │   ├── adapter.py
        │   │   │   ├── loader.py
        │   │   │   ├── model_utils
        │   │   │   │   ├── __init__.py
        │   │   │   │   ├── __pycache__
        │   │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   │   ├── attention.cpython-311.pyc
        │   │   │   │   │   ├── checkpointing.cpython-311.pyc
        │   │   │   │   │   ├── embedding.cpython-311.pyc
        │   │   │   │   │   ├── liger_kernel.cpython-311.pyc
        │   │   │   │   │   ├── longlora.cpython-311.pyc
        │   │   │   │   │   ├── misc.cpython-311.pyc
        │   │   │   │   │   ├── mod.cpython-311.pyc
        │   │   │   │   │   ├── moe.cpython-311.pyc
        │   │   │   │   │   ├── packing.cpython-311.pyc
        │   │   │   │   │   ├── quantization.cpython-311.pyc
        │   │   │   │   │   ├── rope.cpython-311.pyc
        │   │   │   │   │   ├── unsloth.cpython-311.pyc
        │   │   │   │   │   ├── valuehead.cpython-311.pyc
        │   │   │   │   │   └── visual.cpython-311.pyc
        │   │   │   │   ├── attention.py
        │   │   │   │   ├── checkpointing.py
        │   │   │   │   ├── embedding.py
        │   │   │   │   ├── liger_kernel.py
        │   │   │   │   ├── longlora.py
        │   │   │   │   ├── misc.py
        │   │   │   │   ├── mod.py
        │   │   │   │   ├── moe.py
        │   │   │   │   ├── packing.py
        │   │   │   │   ├── quantization.py
        │   │   │   │   ├── rope.py
        │   │   │   │   ├── unsloth.py
        │   │   │   │   ├── valuehead.py
        │   │   │   │   └── visual.py
        │   │   │   └── patcher.py
        │   │   ├── train
        │   │   │   ├── __init__.py
        │   │   │   ├── __pycache__
        │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   ├── callbacks.cpython-311.pyc
        │   │   │   │   ├── trainer_utils.cpython-311.pyc
        │   │   │   │   └── tuner.cpython-311.pyc
        │   │   │   ├── callbacks.py
        │   │   │   ├── dpo
        │   │   │   │   ├── __init__.py
        │   │   │   │   ├── __pycache__
        │   │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   │   ├── trainer.cpython-311.pyc
        │   │   │   │   │   └── workflow.cpython-311.pyc
        │   │   │   │   ├── trainer.py
        │   │   │   │   └── workflow.py
        │   │   │   ├── kto
        │   │   │   │   ├── __init__.py
        │   │   │   │   ├── __pycache__
        │   │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   │   ├── trainer.cpython-311.pyc
        │   │   │   │   │   └── workflow.cpython-311.pyc
        │   │   │   │   ├── trainer.py
        │   │   │   │   └── workflow.py
        │   │   │   ├── ppo
        │   │   │   │   ├── __init__.py
        │   │   │   │   ├── __pycache__
        │   │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   │   ├── ppo_utils.cpython-311.pyc
        │   │   │   │   │   ├── trainer.cpython-311.pyc
        │   │   │   │   │   └── workflow.cpython-311.pyc
        │   │   │   │   ├── ppo_utils.py
        │   │   │   │   ├── trainer.py
        │   │   │   │   └── workflow.py
        │   │   │   ├── pt
        │   │   │   │   ├── __init__.py
        │   │   │   │   ├── __pycache__
        │   │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   │   ├── trainer.cpython-311.pyc
        │   │   │   │   │   └── workflow.cpython-311.pyc
        │   │   │   │   ├── trainer.py
        │   │   │   │   └── workflow.py
        │   │   │   ├── rm
        │   │   │   │   ├── __init__.py
        │   │   │   │   ├── __pycache__
        │   │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   │   ├── metric.cpython-311.pyc
        │   │   │   │   │   ├── trainer.cpython-311.pyc
        │   │   │   │   │   └── workflow.cpython-311.pyc
        │   │   │   │   ├── metric.py
        │   │   │   │   ├── trainer.py
        │   │   │   │   └── workflow.py
        │   │   │   ├── sft
        │   │   │   │   ├── __init__.py
        │   │   │   │   ├── __pycache__
        │   │   │   │   │   ├── __init__.cpython-311.pyc
        │   │   │   │   │   ├── metric.cpython-311.pyc
        │   │   │   │   │   ├── trainer.cpython-311.pyc
        │   │   │   │   │   └── workflow.cpython-311.pyc
        │   │   │   │   ├── metric.py
        │   │   │   │   ├── trainer.py
        │   │   │   │   └── workflow.py
        │   │   │   ├── test_utils.py
        │   │   │   ├── trainer_utils.py
        │   │   │   └── tuner.py
        │   │   └── webui
        │   │   │   ├── __init__.py
        │   │   │   ├── __pycache__
        │   │   │       ├── __init__.cpython-311.pyc
        │   │   │       ├── chatter.cpython-311.pyc
        │   │   │       ├── common.cpython-311.pyc
        │   │   │       ├── css.cpython-311.pyc
        │   │   │       ├── engine.cpython-311.pyc
        │   │   │       ├── interface.cpython-311.pyc
        │   │   │       ├── manager.cpython-311.pyc
        │   │   │       ├── runner.cpython-311.pyc
        │   │   │       └── utils.cpython-311.pyc
        │   │   │   ├── chatter.py
        │   │   │   ├── common.py
        │   │   │   ├── components
        │   │   │       ├── __init__.py
        │   │   │       ├── __pycache__
        │   │   │       │   ├── __init__.cpython-311.pyc
        │   │   │       │   ├── chatbot.cpython-311.pyc
        │   │   │       │   ├── data.cpython-311.pyc
        │   │   │       │   ├── eval.cpython-311.pyc
        │   │   │       │   ├── export.cpython-311.pyc
        │   │   │       │   ├── infer.cpython-311.pyc
        │   │   │       │   ├── top.cpython-311.pyc
        │   │   │       │   └── train.cpython-311.pyc
        │   │   │       ├── chatbot.py
        │   │   │       ├── data.py
        │   │   │       ├── eval.py
        │   │   │       ├── export.py
        │   │   │       ├── infer.py
        │   │   │       ├── top.py
        │   │   │       └── train.py
        │   │   │   ├── css.py
        │   │   │   ├── engine.py
        │   │   │   ├── interface.py
        │   │   │   ├── manager.py
        │   │   │   ├── runner.py
        │   │   │   └── utils.py
        │   ├── train.py
        │   └── webui.py
        └── tests
        │   ├── e2e
        │       ├── test_chat.py
        │       └── test_train.py
        │   ├── eval
        │       └── test_eval_template.py
        │   ├── model
        │       ├── model_utils
        │       │   ├── test_attention.py
        │       │   ├── test_checkpointing.py
        │       │   └── test_packing.py
        │       ├── test_base.py
        │       ├── test_freeze.py
        │       ├── test_full.py
        │       ├── test_lora.py
        │       └── test_pissa.py
        │   └── train
        │       └── test_sft_trainer.py
    ├── Validation
        ├── start_validate.sh
        ├── validate_single.sh
        └── validation_on_math-500.py
    └── scripts
        ├── train_qwen2_5-32b-instruct-cft
            ├── qwen2.5-32b-cft-webinstruct-4k.yaml
            └── train.sh
        └── train_qwen2_5-math-7b-cft
            ├── qwen2.5-math-7b-cft-webinstruct-50k.yaml
            └── train.sh


/.gitignore:
--------------------------------------------------------------------------------
1 | .idea/
2 | .vscode/
3 | *.swp
4 | *.swo
5 | .DS_Store
6 | local*
7 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2025 TIGER Lab
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
 1 | vllm==0.6.6
 2 | tqdm
 3 | datasets
 4 | python_dateutil
 5 | flash_attn
 6 | 
 7 | # math_eval
 8 | sympy==1.12
 9 | antlr4-python3-runtime==4.11.1 # ! The version needs to be compatible with sympy.
10 | word2number
11 | Pebble
12 | timeout-decorator
13 | latex2sympy2
14 | 


--------------------------------------------------------------------------------
/tools/evaluate_gpqa/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/tools/evaluate_gpqa/__init__.py


--------------------------------------------------------------------------------
/tools/evaluate_gpqa/code_utils.py:
--------------------------------------------------------------------------------
 1 | import multiprocessing
 2 | import threading
 3 | from io import StringIO
 4 | from contextlib import redirect_stdout
 5 | 
 6 | 
 7 | def format_code(code_str: str):
 8 |     code = 'def run_it():\n'
 9 |     for line in code_str.split('\n'):
10 |         code += '  ' + line + '\n'
11 |     code += 'run_it()'
12 |     return code
13 | 
14 | 
class CodeExecutor:
    """Execute a Python snippet with a time limit and capture its stdout.

    The snippet is wrapped by ``format_code`` at construction time. ``run``
    executes it either in a child process (``use_process=True``) or in a
    thread of the current process (``use_process=False``) and returns what
    the snippet printed, with leading/trailing newlines stripped.

    Attributes:
        code: Wrapped source that is handed to ``exec``.
        timeout: Seconds ``run`` waits before treating the run as timed out.
        error: Empty string until something goes wrong; afterwards either
            ``'Execution timed out'`` or the ``repr`` of the exception raised
            by the snippet.
        use_process: Whether ``run`` uses a child process instead of a thread.
    """

    def __init__(self, code: str, timeout: int, use_process: bool):
        self.code = format_code(code)
        self.timeout = timeout
        self.error = ''
        self.use_process = use_process

    def execute_code(self, return_val):
        """Run ``self.code`` and report the outcome through ``return_val``.

        Args:
            return_val: Mutable mapping shared with the caller. On success
                ``return_val['result']`` receives the captured stdout. If the
                snippet raises, ``'result'`` is left unset and
                ``return_val['error']`` receives ``repr`` of the exception.
        """
        try:
            f = StringIO()
            with redirect_stdout(f):
                # SECURITY: exec runs the snippet with full interpreter
                # privileges; only feed it code you are prepared to execute.
                exec(self.code, globals(), locals())
            return_val['result'] = f.getvalue().strip('\n')
        except Exception as exc:
            # Keep the historical "no result on failure" contract, but record
            # the reason instead of discarding it silently.
            return_val['error'] = repr(exc)

    @staticmethod
    def execute_code_with_string(code, index, return_val):
        """Wrap and run ``code``, storing captured stdout at ``return_val[index]``.

        Best-effort: if the snippet raises, ``return_val[index]`` is simply
        left unset so that the caller's mapping only ever contains outputs.
        """
        code = format_code(code)
        try:
            f = StringIO()
            with redirect_stdout(f):
                # SECURITY: see execute_code - this executes arbitrary code.
                exec(code, globals(), locals())
            return_val[index] = f.getvalue().strip('\n')
        except Exception:
            pass

    def run(self):
        """Execute the snippet and return its captured stdout.

        Returns:
            The captured output, or ``''`` when the snippet produced no
            result (it raised, or was killed after timing out). The reason
            for a failure is available in ``self.error``.
        """
        if self.use_process:
            # The context manager shuts the manager's server process down;
            # without it every call leaks one helper process.
            with multiprocessing.Manager() as manager:
                return_dict = manager.dict()
                process = multiprocessing.Process(
                    target=self.execute_code, args=(return_dict,))
                process.start()
                process.join(timeout=self.timeout)
                if process.is_alive():
                    self.error = 'Execution timed out'
                    process.terminate()
                    # Reap the child; escalate if it ignores SIGTERM.
                    process.join(timeout=1)
                    if process.is_alive():
                        process.kill()
                        process.join()
                # Copy out of the proxy before the manager goes away.
                outcome = dict(return_dict)
        else:
            outcome = {}
            thread = threading.Thread(
                target=self.execute_code, args=(outcome,))
            thread.start()
            thread.join(timeout=self.timeout)
            if thread.is_alive():
                # Python threads cannot be killed, so this blocks until the
                # snippet finishes on its own; the timeout is only reported.
                thread.join()
                print('time out!')
                self.error = 'Execution timed out'

        if not self.error and 'error' in outcome:
            self.error = outcome['error']
        return outcome.get('result', '')
70 | 


--------------------------------------------------------------------------------
/tools/evaluate_gpqa/compute_accuracy.py:
--------------------------------------------------------------------------------
 1 | import json
 2 | import sys
 3 | from utils import compare_answer_with_groundtruth
 4 | # from multiprocessing import Pool
 5 | 
# Checked when the module is loaded: at least one file argument must follow the script name.
assert len(sys.argv) >= 2, 'you need to feed in a file'
 7 | 
 8 | 
 9 | def func(filename: str):
10 |     results = {}
11 |     with open(filename) as f:
12 |         for line in f:
13 |             entry = json.loads(line)
14 | 
15 |             groundtruth = entry['correct']
16 |             if isinstance(groundtruth, str):
17 |                 groundtruth = [groundtruth]
18 | 
19 |             if entry['task'] not in results:
20 |                 results[entry['task']] = [0, 0, 0]
21 | 
22 |             if entry['pred'] == '':
23 |                 results[entry['task']][-1] += 1
24 | 
25 |             if compare_answer_with_groundtruth(entry['pred'], *groundtruth):
26 |                 results[entry['task']][0] += 1
27 |             else:
28 |                 results[entry['task']][1] += 1
29 | 
30 |     if results:
31 |         overall_correct, overall_wrong = 0, 0
32 |         tasks = sorted(results.keys())
33 |         for task in tasks:
34 |             correct, wrong, fail = results[task][0], results[task][1], results[task][2]
35 |             overall_correct += correct
36 |             overall_wrong += wrong
37 |             print(filename, '###', task, '###', f'accuracy={correct / (correct + wrong)}', f'fail={fail}')
38 |         print(filename,
39 |               '###',
40 |               'overall accuracy=',
41 |               overall_correct / (overall_correct + overall_wrong),
42 |               '###',
43 |               f'length={overall_correct + overall_wrong}')
44 |     else:
45 |         print(filename, ' is Empty!')
46 | 
47 | 
if __name__ == '__main__':
    # Score each file named on the command line, in the order given.
    for result_path in sys.argv[1:]:
        func(result_path)
51 | 


--------------------------------------------------------------------------------
/tools/evaluate_gpqa/eval_gpqa.sh:
--------------------------------------------------------------------------------
 1 | set -ex
 2 | 
 3 | model_path=$1
 4 | output_dir=$2
 5 | summary_path=$3
 6 | n_shot=$4
 7 | 
 8 | datasets=("gpqa_diamond")
 9 | 
10 | for dataset in "${datasets[@]}"; do
11 |     echo "Processing dataset: $dataset"
12 |     python run_open.py \
13 |         --model $model_path \
14 |         --shots $n_shot \
15 |         --dataset $dataset \
16 |         --form "gpqa" \
17 |         --output_dir $output_dir \
18 |         --summary_path $summary_path
19 | done
20 | 
21 | 


--------------------------------------------------------------------------------
/tools/evaluate_gpqa/scripts/evaluate_gpqa.sh:
--------------------------------------------------------------------------------
 1 | set -ex
 2 | 
 3 | model_path=$1
 4 | output_dir=$2
 5 | summary_path=$3
 6 | 
 7 | datasets=("gpqa")
 8 | cd ..
 9 | for dataset in "${datasets[@]}"; do
10 |     echo "Processing dataset: $dataset"
11 |     python run_open.py \
12 |         --model $model_path \
13 |         --dataset $dataset \
14 |         --form qwen \
15 |         --output_dir $output_dir \
16 |         --summary_path $summary_path
17 | done
18 | 
19 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/LICENSE:
--------------------------------------------------------------------------------
 1 | MIT License
 2 | 
 3 | Copyright (c) 2024 Zhibin Gou
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/data/minerva_math/README.md:
--------------------------------------------------------------------------------
1 | MIT OpenCourseWare:
2 |     - Solving Quantitative Reasoning Problems with Language Models. https://openreview.net/forum?id=IFXTZERXdM7
3 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/data/theoremqa/trans_format.py:
--------------------------------------------------------------------------------
 1 | import json
 2 | import os
 3 | 
 4 | 
 5 | def main():
 6 |     with open("test.json", "r") as fi:
 7 |         data = json.load(fi)
 8 |     output_data = []
 9 |     for each in data:
10 |         question = each["Question"]
11 |         answer = str(each["Answer"])
12 |         if answer == "True" or answer == "False":
13 |             question += " Answer with \\boxed{True} or \\boxed{False}."
14 |         output_data.append({"problem": question, "answer": answer})
15 |     with open("test.jsonl", "w") as fo:
16 |         for each in output_data:
17 |             fo.write(json.dumps(each) + "\n")
18 | 
19 | 
20 | main()
21 | 
22 | 
23 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/.coveragerc:
--------------------------------------------------------------------------------
 1 | # .coveragerc to control coverage.py
 2 | [run]
 3 | branch = True
 4 | include =
 5 |     latex2sympy.py
 6 | omit = 
 7 |     sandbox/*
 8 |     gen/*
 9 |     asciimath_printer.py
10 |     setup.py
11 |     __init__.py
12 | 
13 | [report]
14 | # Regexes for lines to exclude from consideration
15 | exclude_lines =
16 |     # Have to re-enable the standard pragma
17 |     pragma: no cover
18 | 
19 |     # Don't complain about missing debug-only code:
20 |     def __repr__
21 |     if self\.debug
22 | 
23 |     # Don't complain if tests don't hit defensive assertion code:
24 |     raise AssertionError
25 |     raise NotImplementedError
26 | 
27 |     # Don't complain if non-runnable code isn't run:
28 |     if 0:
29 |     if __name__ == .__main__.:
30 | 
31 | ignore_errors = True
32 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/.gitignore:
--------------------------------------------------------------------------------
  1 | # Byte-compiled / optimized / DLL files
  2 | __pycache__/
  3 | *.py[cod]
  4 | *$py.class
  5 | .antlr
  6 | 
  7 | # C extensions
  8 | *.so
  9 | 
 10 | # Distribution / packaging
 11 | .Python
 12 | build/
 13 | develop-eggs/
 14 | dist/
 15 | downloads/
 16 | eggs/
 17 | .eggs/
 18 | lib/
 19 | lib64/
 20 | parts/
 21 | sdist/
 22 | var/
 23 | wheels/
 24 | pip-wheel-metadata/
 25 | share/python-wheels/
 26 | *.egg-info/
 27 | .installed.cfg
 28 | *.egg
 29 | MANIFEST
 30 | 
 31 | # PyInstaller
 32 | #  Usually these files are written by a python script from a template
 33 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 34 | *.manifest
 35 | *.spec
 36 | 
 37 | # Installer logs
 38 | pip-log.txt
 39 | pip-delete-this-directory.txt
 40 | 
 41 | # Unit test / coverage reports
 42 | htmlcov/
 43 | .tox/
 44 | .nox/
 45 | .coverage
 46 | .coverage.*
 47 | .cache
 48 | nosetests.xml
 49 | coverage.xml
 50 | *.cover
 51 | .hypothesis/
 52 | .pytest_cache/
 53 | 
 54 | # Translations
 55 | *.mo
 56 | *.pot
 57 | 
 58 | # Django stuff:
 59 | *.log
 60 | local_settings.py
 61 | db.sqlite3
 62 | 
 63 | # Flask stuff:
 64 | instance/
 65 | .webassets-cache
 66 | 
 67 | # Scrapy stuff:
 68 | .scrapy
 69 | 
 70 | # Sphinx documentation
 71 | docs/_build/
 72 | 
 73 | # PyBuilder
 74 | target/
 75 | 
 76 | # Jupyter Notebook
 77 | .ipynb_checkpoints
 78 | 
 79 | # IPython
 80 | profile_default/
 81 | ipython_config.py
 82 | 
 83 | # pyenv
 84 | .python-version
 85 | 
 86 | # pipenv
 87 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
 88 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
 89 | #   having no cross-platform support, pipenv may install dependencies that don’t work, or not
 90 | #   install all needed dependencies.
 91 | #Pipfile.lock
 92 | 
 93 | # celery beat schedule file
 94 | celerybeat-schedule
 95 | 
 96 | # SageMath parsed files
 97 | *.sage.py
 98 | 
 99 | # Environments
100 | .env
101 | .venv
102 | env/
103 | venv/
104 | ENV/
105 | env.bak/
106 | venv.bak/
107 | 
108 | # Spyder project settings
109 | .spyderproject
110 | .spyproject
111 | 
112 | # Rope project settings
113 | .ropeproject
114 | 
115 | # mkdocs documentation
116 | /site
117 | 
118 | # mypy
119 | .mypy_cache/
120 | .dmypy.json
121 | dmypy.json
122 | 
123 | # Pyre type checker
124 | .pyre/
125 | 
126 | # Azure Functions artifacts
127 | bin
128 | obj
129 | appsettings.json
130 | local.settings.json
131 | .python_packages
132 | stemgen-solution-engine.zip


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/LICENSE.txt:
--------------------------------------------------------------------------------
 1 | The MIT License (MIT)
 2 | 
 3 | Copyright 2016, latex2sympy
 4 | 
 5 | Permission is hereby granted, free of charge, to any person obtaining a copy
 6 | of this software and associated documentation files (the "Software"), to deal
 7 | in the Software without restriction, including without limitation the rights
 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 | 
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 | 
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/__init__.py:
--------------------------------------------------------------------------------
1 | import latex2sympy


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/antlr-4.11.1-complete.jar:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/tools/evaluate_math/latex2sympy/antlr-4.11.1-complete.jar


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/asciimath_printer.py:
--------------------------------------------------------------------------------
 1 | from sympy.printing.str import StrPrinter
 2 | from sympy.core import S
 3 | 
 4 | class AsciiMathPrinter(StrPrinter):
 5 | 
 6 |     def _print_Limit(self, expr):
 7 |         e, z = expr.args
 8 | 
 9 |         return "lim_(%s -> %s) %s" % (self._print(z), self._print(z), self._print(e))
10 | 
11 |     def _print_Integral(self, expr):
12 |         e, lims = expr.args
13 |         if len(lims) > 1:
14 |             return "int_(%s)^(%s) %s d%s" % (self._print(lims[1]), self._print(lims[2]), self._print(e), self._print(lims[0]))
15 |         else:
16 |             return "int %s d%s" % (self._print(e), self._print(lims))
17 |     
18 |     def _print_Sum(self, expr):
19 |         e, lims = expr.args
20 |         return "sum_(%s = %s)^(%s) %s" % (self._print(lims[0]), self._print(lims[1]), self._print(lims[2]), self._print(e))
21 | 
22 |     def _print_Product(self, expr):
23 |         e, lims = expr.args
24 |         return "prod_(%s = %s)^(%s) %s" % (self._print(lims[0]), self._print(lims[1]), self._print(lims[2]), self._print(e))
25 | 
26 |     def _print_factorial(self, expr):
27 |         return "%s!" % self._print(expr.args[0])
28 | 
29 |     def _print_Derivative(self, expr):
30 |         e = expr.args[0]
31 |         wrt = expr.args[1]
32 |         return "d/d%s %s" % (self._print(wrt), self._print(e))
33 | 
34 |     def _print_Abs(self, expr):
35 |         return "|%s|" % self._print(expr.args[0])
36 | 
37 |     def _print_Equality(self, expr):
38 |         return "%s = %s" % (self._print(expr.args[0]), self._print(expr.args[1]))
39 | 
40 |     def _print_Pow(self, expr):
41 |         b = self._print(expr.base)
42 |         if expr.exp is S.Half:
43 |             return "sqrt(%s)" % b
44 | 
45 |         if -expr.exp is S.Half:
46 |             return "1/sqrt(%s)" % b
47 |         if expr.exp is -S.One:
48 |             return "1/%s" % b
49 | 
50 |         return "%s^(%s)" % (b, self._print(expr.exp)) 
51 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/dev-requirements.in:
--------------------------------------------------------------------------------
1 | -r requirements.txt
2 | # Development
3 | pip-tools
4 | pytest
5 | pytest-cov
6 | pycodestyle
7 | autopep8
8 | -e .
9 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/dev-requirements.txt:
--------------------------------------------------------------------------------
 1 | #
 2 | # This file is autogenerated by pip-compile with Python 3.10
 3 | # by the following command:
 4 | #
 5 | #    pip-compile dev-requirements.in
 6 | #
 7 |     # via -r dev-requirements.in
 8 | antlr4-python3-runtime==4.11.1
 9 |     # via
10 |     #   -r requirements.txt
11 |     #   latex2sympy2
12 | atomicwrites==1.3.0
13 |     # via pytest
14 | attrs==19.3.0
15 |     # via pytest
16 | autopep8==1.4.4
17 |     # via -r dev-requirements.in
18 | click==7.0
19 |     # via pip-tools
20 | coverage==4.5.4
21 |     # via pytest-cov
22 | more-itertools==7.2.0
23 |     # via pytest
24 | mpmath==1.3.0
25 |     # via
26 |     #   -r requirements.txt
27 |     #   sympy
28 | packaging==19.2
29 |     # via pytest
30 | pip-tools==4.2.0
31 |     # via -r dev-requirements.in
32 | pluggy==0.13.0
33 |     # via pytest
34 | py==1.8.0
35 |     # via pytest
36 | pycodestyle==2.5.0
37 |     # via
38 |     #   -r dev-requirements.in
39 |     #   autopep8
40 | pyparsing==2.4.4
41 |     # via packaging
42 | pytest==5.2.2
43 |     # via
44 |     #   -r dev-requirements.in
45 |     #   pytest-cov
46 | pytest-cov==2.8.1
47 |     # via -r dev-requirements.in
48 | six==1.13.0
49 |     # via
50 |     #   packaging
51 |     #   pip-tools
52 | sympy==1.12
53 |     # via
54 |     #   -r requirements.txt
55 |     #   latex2sympy2
56 | wcwidth==0.1.7
57 |     # via pytest
58 | 
59 | # THIS MUST BE MAINTAINED AS-IS
60 | -e .


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/gen/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/tools/evaluate_math/latex2sympy/gen/__init__.py


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/icon.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/tools/evaluate_math/latex2sympy/icon.png


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/requirements.in:
--------------------------------------------------------------------------------
1 | sympy
2 | antlr4-python3-runtime
3 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/requirements.txt:
--------------------------------------------------------------------------------
 1 | #
 2 | # This file is autogenerated by pip-compile with Python 3.10
 3 | # by the following command:
 4 | #
 5 | #    pip-compile requirements.in
 6 | #
 7 | antlr4-python3-runtime==4.11.1
 8 |     # via -r requirements.in
 9 | mpmath==1.3.0
10 |     # via sympy
11 | sympy==1.12
12 |     # via -r requirements.in
13 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/sandbox/linalg_equations.py:
--------------------------------------------------------------------------------
 1 | from latex2sympy import process_sympy
 2 | import sys
 3 | sys.path.append("..")
 4 | 
 5 | # latex = "2\\begin{pmatrix}1&1&1\\\\0&1&1\\\\0&0&1\\end{pmatrix}\\begin{pmatrix}1&1&1\\\\0&1&1\\\\0&0&1\\end{pmatrix}"
 6 | latex = "\\frac{a^{2} \\left(3 \\pi - 4 \\sin{\\left(\\pi \\right)} + \\frac{\\sin{\\left(2 \\pi \\right)}}{2}\\right)}{2}"
 7 | math = process_sympy(latex)
 8 | 
 9 | print(type(math))
10 | print("latex: %s to math: %s" % (latex, math))
11 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/sandbox/linalg_span.py:
--------------------------------------------------------------------------------
 1 | from latex2sympy import process_sympy
 2 | import sys
 3 | sys.path.append("..")
 4 | 
 5 | latex = "\\begin{pmatrix}1\\\\2\\\\3\\end{pmatrix}"
 6 | math = process_sympy(latex)
 7 | print("latex: %s to math: %s" % (latex, math))
 8 | 
 9 | latex = "\\begin{pmatrix}1\\\\2\\\\3\\end{pmatrix},\\begin{pmatrix}4\\\\3\\\\1\\end{pmatrix}"
10 | math = process_sympy(latex)
11 | print("latex: %s to math: %s" % (latex, math))
12 | 
13 | latex = "[\\begin{pmatrix}1\\\\2\\\\3\\end{pmatrix},\\begin{pmatrix}4\\\\3\\\\1\\end{pmatrix}]"
14 | math = process_sympy(latex)
15 | print("latex: %s to math: %s" % (latex, math))
16 | 
17 | latex = "\\left\\{\\begin{pmatrix}1\\\\2\\\\3\\end{pmatrix},\\begin{pmatrix}4\\\\3\\\\1\\end{pmatrix}\\right\\}"
18 | math = process_sympy(latex)
19 | print("latex: %s to math: %s" % (latex, math))
20 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/sandbox/matrix.py:
--------------------------------------------------------------------------------
 1 | from latex2sympy import process_sympy
 2 | from sympy import *
 3 | import sys
 4 | sys.path.append("..")
 5 | 
 6 | theta = Symbol('theta', real=True)
 7 | 
 8 | latex = "\\begin{matrix}1&2\\\\3&4\\end{matrix}"
 9 | math = process_sympy(latex)
10 | print("latex: %s to math: %s" % (latex, math))
11 | 
12 | latex = "\\begin{matrix}1&2\\\\3&4\\\\5&6\\end{matrix}"
13 | math = process_sympy(latex)
14 | print("latex: %s to math: %s" % (latex, math))
15 | 
16 | latex = "\\begin{matrix}1&2&3\\\\4&5&6\\\\7&8&9\\end{matrix}"
17 | math = process_sympy(latex)
18 | print("latex: %s to math: %s" % (latex, math))
19 | 
20 | latex = "\\begin{matrix}x^1&x^2&x^3\\\\y^1&y^2&y^3\\\\z^1&z^2&z^3\\end{matrix}"
21 | math = process_sympy(latex)
22 | print("latex: %s to math: %s" % (latex, math))
23 | 
24 | latex = "\\begin{matrix}x\\\\y\\end{matrix}"
25 | math = process_sympy(latex)
26 | print("latex: %s to math: %s" % (latex, math))
27 | 
28 | latex = "2\\cdot\\begin{matrix}x\\\\y\\end{matrix}"
29 | math = process_sympy(latex)
30 | print("latex: %s to math: %s" % (latex, math))
31 | 
32 | latex = "2\\cdot\\begin{matrix}x\\\\y\\end{matrix} + \\begin{matrix}2\\\\3\\end{matrix}"
33 | math = process_sympy(latex)
34 | print("latex: %s to math: %s" % (latex, math))
35 | 
36 | latex = "-2\\begin{matrix}1&2\\\\3&4\\end{matrix}"
37 | math = process_sympy(latex)
38 | print("latex: %s to math: %s" % (latex, math))
39 | 
40 | latex = "2\\cdot\\theta\\begin{matrix}x\\\\y\\end{matrix} + \\begin{matrix}2\\\\3\\end{matrix}"
41 | math = process_sympy(latex)
42 | print("latex: %s to math: %s" % (latex, math))
43 | 
44 | latex = "\\theta\\begin{matrix}1\\\\3\\end{matrix} - \\begin{matrix}-1\\\\2\\end{matrix}"
45 | math = process_sympy(latex)
46 | print("latex: %s to math: %s" % (latex, math))
47 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/sandbox/matrix_placeholders.py:
--------------------------------------------------------------------------------
 1 | from latex2sympy import process_sympy
 2 | from sympy import *
 3 | import sys
 4 | import hashlib
 5 | import time
 6 | 
 7 | sys.path.append("..")
 8 | 
 9 | 
10 | M = Matrix([[1, 2], [3, 4]])
11 | v = Matrix([1, 2])
12 | 
13 | # sub settings
14 | sub_settings_symbols = {}
15 | sub_settings_symbols[Symbol('M' + hashlib.md5('M'.encode()).hexdigest(), real=True)] = M
16 | sub_settings_symbols[Symbol('v' + hashlib.md5('v'.encode()).hexdigest(), real=True)] = v
17 | 
18 | 
19 | # one parameters
20 | latex = "\\begin{matrix}1&2\\\\3&4\\end{matrix}\\cdot[!v!]"
21 | equation_sympy_check = MatMul(M, Symbol('v' + hashlib.md5('v'.encode()).hexdigest(), real=True))
22 | equation_sympy_subs_check = MatMul(M, v)
23 | # placeholders
24 | equation_sympy = process_sympy(latex)
25 | print('latex = %s' % latex)
26 | print('equation_sympy = %s' % equation_sympy)
27 | print('equation_sympy_check = %s' % equation_sympy_check)
28 | print('equation_sympy = %s' % (srepr(equation_sympy)))
29 | 
30 | equation_sympy_subs = equation_sympy.subs(sub_settings_symbols, evaluate=False)
31 | print('equation_sympy_subs = %s' % equation_sympy_subs)
32 | print('equation_sympy_subs_check = %s' % equation_sympy_subs_check)
33 | 
34 | 
35 | # two parameters
36 | 
37 | # sub settings
38 | print('')
39 | print('============== Two Parameters -> M*v = Matrix*Vector =============')
40 | sub_settings_symbols = {}
41 | sub_settings_symbols[Symbol('M' + hashlib.md5('M'.encode()).hexdigest(), commutative=False)] = M
42 | sub_settings_symbols[Symbol('v' + hashlib.md5('v'.encode()).hexdigest(), commutative=False)] = v
43 | 
44 | latex = "[!M!]\\cdot[!v!]"
45 | math_check = Mul(Symbol('M' + hashlib.md5('M'.encode()).hexdigest(), commutative=False), Symbol('v' + hashlib.md5('v'.encode()).hexdigest(), commutative=False))
46 | # placeholders
47 | equation_sympy = process_sympy(latex)
48 | print(latex)
49 | print(math_check)
50 | print(equation_sympy)
51 | print(srepr(equation_sympy))
52 | 
53 | # performance
54 | t0 = time.time()
55 | 
56 | # process_sympy and substitute at the same time
57 | # Only needed for linalg input
58 | placeholder_values = {'M': M, 'v': v}
59 | equation_sympy_subs = process_sympy(latex, variable_values=placeholder_values)
60 | 
61 | t1 = time.time()
62 | print('equation with substituted placeholders = %s' % (str(equation_sympy_subs)))
63 | print('time to process to sympy with placeholders = %s s' % (t1 - t0))
64 | print('')
65 | print('============== Two Parameters -> M*v = Matrix*Vector =============')
66 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/sandbox/sandbox.py:
--------------------------------------------------------------------------------
 1 | from sympy import *
 2 | from latex2sympy import process_sympy
 3 | 
 4 | 
 5 | # latex = '\\variable{a}^{\\variable{b}}'
 6 | # variables = {'a': process_sympy('658.95998'), 'b': process_sympy('185083.8060')}
 7 | # c_ans_expr = process_sympy(latex, variables)
 8 | # print(c_ans_expr)
 9 | # print(srepr(c_ans_expr))
10 | # c_ans = c_ans_expr.doit(deep=False).evalf(chop=True)
11 | # print(c_ans)
12 | # print(srepr(c_ans))
13 | 
14 | 
15 | # numeric_responses = ['1', '1.0', '-1', '-1.0', '.5', '-.5', '3x10^3', '3E3', '3,000x10^{-3}', '0.5E-1', '\\frac{1}{3}', '(5\\times 3)^3', '\\sin(1)']
16 | # for latex in numeric_responses:
17 | #     parsed = process_sympy(latex)
18 | #     print('latex: ', latex)
19 | #     print('sympy: ', parsed)
20 | #     print('is_number: ', parsed.is_number)
21 | #     print('is_Number: ', parsed.is_Number)
22 | #     print('srepr: ', srepr(parsed))
23 | #     print('-----------------------------------------------------')
24 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/sandbox/sandbox_equality.py:
--------------------------------------------------------------------------------
 1 | from sympy import *
 2 | from latex2sympy import process_sympy
 3 | 
 4 | 
 5 | #
 6 | # Equality Testing
 7 | #
 8 | 
 9 | answer_sets = [
10 |     {
11 |         'correct_answer': '(x-y)(x+2y)',
12 |         'student_answers': [
13 |             'x^2+xy-2y^2',
14 |             '(x-y)(x+2y)',
15 |             '(x+2y)(x-y)',
16 |             '(2\\times y+x)(-y+x)',
17 |             '(y\\cdot 2+x)(-y+x)'
18 |         ]
19 |     },
20 |     {
21 |         'correct_answer': '2\\pi \\variable{r}^2',
22 |         'student_answers': [
23 |             '2\\pi \\variable{r}^2',
24 |             '\\pi 2\\variable{r}^2',
25 |             '2\\times \\pi \\times \\variable{r}^2',
26 |             '2\\pi \\variable{r} \\times \\variable{r}'
27 |         ]
28 |     },
29 |     {
30 |         'correct_answer': '2x - 3y',
31 |         'student_answers': [
32 |             '-3y + 2x'
33 |         ]
34 |     },
35 |     {
36 |         'correct_answer': 'x\\times x',
37 |         'student_answers': [
38 |             'x\\times x',
39 |             'x\\cdot x',
40 |             'x^2',
41 |             '(\\sqrt{x})^{4}'
42 |         ]
43 |     },
44 |     {
45 |         'correct_answer': '23e^{-1\\times \\sqrt{t^2}}',
46 |         'student_answers': [
47 |             '23e^{-t}'
48 |         ]
49 |     },
50 |     {
51 |         'correct_answer': 'a=x^2+1',
52 |         'student_answers': [
53 |             'x^2+1=a'
54 |         ]
55 |     }
56 | ]
57 | 
# For every (reference, candidate) pair, report three notions of equality:
# identical expression trees, a difference that simplifies to zero, and
# SymPy's own .equals() check.
RULE = '-----------------------------------------------------'

for answer_set in answer_sets:
    correct_answer = answer_set['correct_answer']
    correct_answer_parsed = process_sympy(correct_answer)
    reference_tree = srepr(correct_answer_parsed)

    for student_answer in answer_set['student_answers']:
        student_answer_parsed = process_sympy(student_answer)
        candidate_tree = srepr(student_answer_parsed)

        print('correct_answer (c): ', correct_answer, correct_answer_parsed)
        print('student_answer (a): ', student_answer, student_answer_parsed)
        print('')

        print('Expression Tree (srepr(c) == srepr(a)) =>', reference_tree == candidate_tree)
        print('srepr(c) =>', reference_tree)
        print('srepr(a) =>', candidate_tree)
        print('')

        # print('Structural (c == a) =>', correct_answer_parsed == student_answer_parsed)
        difference = simplify(correct_answer_parsed - student_answer_parsed)
        print('Symbolic (simplify(c - s) == 0) =>', difference == 0)
        print('simplified =>', difference)
        print('')

        print('Numeric Substitution (c.equals(s)) =>', correct_answer_parsed.equals(student_answer_parsed))
        print(RULE)
76 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/sandbox/sectan.py:
--------------------------------------------------------------------------------
 1 | from sympy import *
 2 | import sys
 3 | sys.path.append("..")
 4 | 
 5 | # # x^2\cdot \left(3\cdot \tan \left([!a!]\cdot x+[!c!]\right)+[!a!]\cdot x\left(\sec \left([!a!]\cdot x+[!c!]\right)\right)^2\right)
 6 | # latex1 = "x^2\\cdot \\left(3\\cdot \\tan \\left(2\\cdot x+5\\right)+2\\cdot x\\left(\\sec \\left(2\\cdot x+5\\right)\\right)^2\\right)"
 7 | # math1 = process_sympy(latex1)
 8 | # print("latex: %s to math: %s" %(latex1,math1))
 9 | #
10 | # latex2 = "x^2\\cdot \\left(3\\cdot \\tan \\left(2\\cdot x+5\\right)+2\\cdot x\\left(\\sec \\left(2\\cdot x+5\\right)^2\\right)\\right)"
11 | # math2 = process_sympy(latex2)
12 | # print("latex: %s to math: %s" %(latex2,math2))
13 | #
14 | # latex3 = "x^2\\cdot \\left(3\\cdot \\tan \\left(2\\cdot x+5\\right)+2\\cdot x\\left(1+\\tan \\left(2\\cdot x+5\\right)^2\\right)\\right)"
15 | # math3 = process_sympy(latex3)
16 | # print("latex: %s to math: %s" %(latex3,math3))
17 | #
18 | # print(simplify(math1 - math2))
19 | # print(simplify(math1 - math3))
20 | 
21 | #
22 | # latex1 = "\\sec^2(2\\cdot x+5)"
23 | # math1 = process_sympy(latex1)
24 | # print("latex: %s to math: %s" %(latex1,math1))
25 | #
26 | # latex2 = "1+\\tan^2(2\\cdot x+5)"
27 | # math2 = process_sympy(latex2)
28 | # print("latex: %s to math: %s" %(latex2,math2))
29 | # print(simplify(math1 - math2))
30 | 
31 | 
x, y = (Symbol(name, real=True) for name in ('x', 'y'))

# BUG: 1 + tan^2(u) should be == sec^2(u) but the simplified forms do not
# compare equal.  Checked first for u = x + 1, then for u = x.
for angle in (x + 1, x):
    lhs = 1 + tan(angle)**2
    rhs = sec(angle)**2
    eq = lhs - rhs
    for expression in (lhs, rhs, eq):
        print(simplify(expression))
    print(simplify(lhs) == simplify(rhs))
52 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/sandbox/vector.py:
--------------------------------------------------------------------------------
 1 | import numpy as np
 2 | from sympy import *
 3 | import sys
 4 | sys.path.append("..")
 5 | 
 6 | # row column matrix = vector
 7 | v = [1, 2, 3]
 8 | 
 9 | # single column matrix = vector
10 | m = Matrix([1, 2, 3])
11 | print(m[:, 0])
12 | 
13 | # a three row and 2 column matrix
14 | m = Matrix([[1, 2], [3, 4], [5, 6]])
15 | print(m[:, 0])
16 | 
17 | # determinant of lin indp system != 0
18 | m = Matrix([[1, 1], [1, 2]])
19 | print(m.det())
20 | 
21 | # determinant of lin dep system = 0
22 | m = Matrix([[1, 1], [2, 2]])
23 | print(m.det())
24 | 
25 | # determinant of lin dep system = 0
26 | x = Symbol('x')
27 | y = Symbol('y')
28 | m = Matrix([[x, y], [x, y]])
29 | print(m.det())
30 | # Reduced Row-Echelon Form
31 | _, ind = m.rref()
32 | print(len(ind))
33 | 
34 | # determinant of lin dep system != 0
35 | m = Matrix([[x, y], [y, x]])
36 | print(m.det())
37 | # Reduced Row-Echelon Form
38 | _, ind = m.rref()
39 | print(len(ind))
40 | 
41 | # determinant of lin dep system != 0
42 | # Reduced Row-Echelon Form
43 | m = Matrix([[x, x, y], [y, y, y]])
44 | _, ind = m.rref()
45 | # Reduced Row-Echelon Form
46 | print(len(ind))
47 | 
48 | #==================#
49 | #===== Numpy ======#
50 | #==================#
51 | # http://kitchingroup.cheme.cmu.edu/blog/2013/03/01/Determining-linear-independence-of-a-set-of-vectors/
52 | # Lin Indp of set of numerical vectors
53 | TOLERANCE = 1e-14
54 | v1 = [6, 0, 3, 1, 4, 2]
55 | v2 = [0, -1, 2, 7, 0, 5]
56 | v3 = [12, 3, 0, -19, 8, -11]
57 | 
58 | A = np.row_stack([v1, v2, v3])
59 | 
60 | U, s, V = np.linalg.svd(A)
61 | print(s)
62 | print(np.sum(s > TOLERANCE))
63 | 
64 | v1 = [1, 1]
65 | v2 = [4, 4]
66 | 
67 | A = np.row_stack([v1, v2])
68 | U, s, V = np.linalg.svd(A)
69 | print(s)
70 | print(np.sum(s > TOLERANCE))
71 | 
72 | 
73 | latex = "\\begin{matrix}1&2\\\\3&4\\end{matrix}"
74 | # math = process_sympy(latex)
75 | print("latex: %s to math: %s" % (latex, 1))
76 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/compile.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | # Get relative path of the root directory of the project
 4 | rdir=`git rev-parse --git-dir`
 5 | rel_path="$(dirname "$rdir")"
 6 | # Change to that path and run the file
 7 | cd $rel_path
 8 | 
 9 | java -jar antlr-4.11.1-complete.jar PS.g4 -o gen
10 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/coverage-ci.sh:
--------------------------------------------------------------------------------
1 | #!/bin/sh
2 | 
3 | pytest --doctest-modules --junitxml=junit/test-results.xml --cov-report=xml --cov-config=.coveragerc --cov=latex2sympy tests


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/coverage.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | # Get relative path of the root directory of the project
 4 | rdir=`git rev-parse --git-dir`
 5 | rel_path="$(dirname "$rdir")"
 6 | # Change to that path and run the file
 7 | cd $rel_path
 8 | 
 9 | # Activate virtual environment
10 | echo "activating venv..."
11 | if test -f .env/bin/activate
12 | then source .env/bin/activate && echo "venv activate (bin)"
13 | elif test -f .env/Scripts/activate
14 | then source .env/Scripts/activate && echo "venv activated (Scripts)"
15 | else exit 1
16 | fi
17 | 
18 | # Run unit test coverage
19 | echo "starting coverage..."
20 | if pytest --doctest-modules --cov-report=html --cov-config=.coveragerc --cov=latex2sympy tests
21 | then echo "coverage finished"
22 | else exit 1
23 | fi
24 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/pre-commit:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | # Get relative path of the root directory of the project
 4 | rdir=`git rev-parse --git-dir`
 5 | rel_path="$(dirname "$rdir")"
 6 | 
 7 | # Change to that path and run the file
 8 | cd $rel_path
 9 | 
10 | echo "pre-commit hook started..."
11 | 
12 | # Activate virtual environment
13 | echo "activating venv..."
14 | if test -f .env/bin/activate
15 | then source .env/bin/activate && echo "venv activated."
16 | elif test -f .env/Scripts/activate
17 | then source .env/Scripts/activate && echo "venv activated."
18 | else exit 1
19 | fi
20 | 
21 | # Run auto formatting on all staged python files, then add those changes
22 | echo "auto-formatting code..."
23 | if autopep8 --in-place `git diff --name-status --cached | grep '.py' | awk 'match($1, "A|M"){print $2}'` && git add `git diff --name-status --cached | grep '.py' | awk 'match($1, "A|M"){print $2}'`
24 | then echo "code was auto-formatted."
25 | else echo "no code was auto-formatted."
26 | fi
27 | 
28 | exit 0
29 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/pre-push:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | # Get relative path of the root directory of the project
 4 | rdir=`git rev-parse --git-dir`
 5 | rel_path="$(dirname "$rdir")"
 6 | 
 7 | # Change to that path and run the file
 8 | cd $rel_path
 9 | 
10 | echo "pre-push hook started..."
11 | 
12 | # Activate virtual environment
13 | echo "activating venv..."
14 | if test -f .env/bin/activate
15 | then source .env/bin/activate && echo "venv activated."
16 | elif test -f .env/Scripts/activate
17 | then source .env/Scripts/activate && echo "venv activated."
18 | else exit 1
19 | fi
20 | 
21 | # Run unit tests
22 | echo "starting tests..."
23 | # if pytest tests
24 | # then echo "tests finished."
25 | # else exit 1
26 | # fi
27 | 
28 | exit 0
29 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/publish.sh:
--------------------------------------------------------------------------------
#!/bin/sh

# Build a wheel and upload it with twine.
# Stop at the first failing step so a failed build never leads to an upload
# of whatever happens to be in dist/.
set -e

# -f: an empty or missing dist/ is not an error.
rm -f ./dist/*
python3 setup.py bdist_wheel
twine upload dist/*
4 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/setup-hooks.sh:
--------------------------------------------------------------------------------
#!/bin/sh

# Install the project's git hooks.  Paths are relative, so run this from the
# directory that contains both scripts/ and .git/.
# Git only runs hooks that are executable, so set the bit explicitly instead
# of relying on the mode of the source files.
cp scripts/pre-push .git/hooks/ &&
cp scripts/pre-commit .git/hooks/ &&
chmod +x .git/hooks/pre-push .git/hooks/pre-commit


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/setup.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | # Get relative path of the root directory of the project
 4 | rdir=`git rev-parse --git-dir`
 5 | rel_path="$(dirname "$rdir")"
 6 | # Change to that path and run the file
 7 | cd $rel_path
 8 | 
 9 | echo "creating venv..."
10 | if test -d .env
11 | then echo "venv exists"
12 | else python3 -m venv .env && echo "venv created"
13 | fi
14 | 
15 | echo ''
16 | # Activate virtual environment
17 | echo "activating venv..."
18 | if test -f .env/bin/activate
19 | then source .env/bin/activate && echo "venv activate (bin)"
20 | elif test -f .env/Scripts/activate
21 | then source .env/Scripts/activate && echo "venv activated (Scripts)"
22 | else exit 1
23 | fi
24 | 
25 | echo ''
26 | echo "installing requirements..."
27 | if pip install -r dev-requirements.txt
28 | then echo "requirements installed"
29 | else exit 1
30 | fi
31 | 
32 | echo ''
33 | echo "compiling parser..."
34 | sh scripts/compile.sh
35 | echo "parser compiled"
36 | 
37 | echo ''
38 | echo "setup git hooks..."
39 | sh scripts/setup-hooks.sh
40 | echo "git hooks setup"
41 | 
42 | exit 0
43 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/scripts/test.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | # Activate the .env virtualenv, recompile the parser and run the pytest suite.
 3 | 
 4 | # Get relative path of the root directory of the project
 5 | rdir=$(git rev-parse --git-dir)
 6 | rel_path="$(dirname "$rdir")"
 7 | # Change to that path and run the file. The path is quoted so directories with
 8 | # spaces work, and we stop if the cd fails rather than run in the wrong place.
 9 | cd "$rel_path" || exit 1
10 | 
11 | # Activate virtual environment. Use the POSIX "." builtin: "source" is a bash
12 | # extension that plain /bin/sh implementations such as dash do not provide.
13 | echo "activating venv..."
14 | if test -f .env/bin/activate
15 | then . .env/bin/activate && echo "venv activate (bin)"
16 | elif test -f .env/Scripts/activate
17 | then . .env/Scripts/activate && echo "venv activated (Scripts)"
18 | else exit 1
19 | fi
20 | 
21 | echo ''
22 | echo "compiling parser..."
23 | sh scripts/compile.sh
24 | echo "parser compiled"
25 | 
26 | echo ''
27 | # Run unit tests
28 | echo "starting tests..."
29 | if pytest tests
30 | then echo "tests finished"
31 | else exit 1
32 | fi
33 | 
34 | exit 0
35 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/setup.cfg:
--------------------------------------------------------------------------------
1 | [pycodestyle]
2 | max-line-length = 120
3 | ignore = E501
4 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/setup.py:
--------------------------------------------------------------------------------
 1 | from setuptools import setup, find_packages
 2 | from codecs import open
 3 | from os import path
 4 | here = path.abspath(path.dirname(__file__))
 5 | 
 6 | 
 7 | setup(
 8 |     name="latex2sympy2",
 9 |     version="1.9.0",
10 |     description='Convert latex to sympy with ANTLR and support Matrix, Linear Algebra and CAS functions.',
11 |     long_description_content_type='text/markdown',
12 |     long_description=open(path.join(here, "README.md"), encoding='utf-8').read(),
13 |     # The project's main homepage.
14 |     url='https://github.com/ZubinGou/latex2sympy',
15 |     # Author details
16 |     author='ZubinGou',
17 |     author_email='zebgou@gmail.com',
18 |     # Choose your license
19 |     license='MIT',
20 |     classifiers=[
21 |         'Development Status :: 4 - Beta',
22 |         'Intended Audience :: Developers',
23 |         'Intended Audience :: Education',
24 |         'Intended Audience :: Science/Research',
25 |         'License :: OSI Approved :: MIT License',
26 |         'Topic :: Education',
27 |         'Topic :: Scientific/Engineering :: Mathematics',
28 |         'Topic :: Software Development :: Compilers',
29 |         'Topic :: Text Processing :: Markup :: LaTeX',
30 |         'Topic :: Text Processing :: Markup :: Markdown',
31 |         'Programming Language :: Python :: 3',
32 |         'Programming Language :: Python :: 3.3',
33 |         'Programming Language :: Python :: 3.4',
34 |         'Programming Language :: Python :: 3.5',
35 |         'Programming Language :: Python :: 3.6',
36 |         'Programming Language :: Python :: 3.7',
37 |         'Programming Language :: Python :: 3.8',
38 |     ],
39 |     packages=find_packages(exclude=('tests')),
40 |     py_modules=['asciimath_printer', 'latex2sympy2'],
41 |     install_requires=[
42 |         'sympy>=1.4',
43 |         'antlr4-python3-runtime==4.11.1'
44 |     ],
45 | )
46 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/tools/evaluate_math/latex2sympy/tests/__init__.py


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/abs_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal, get_simple_examples
 2 | import pytest
 3 | from sympy import Abs
 4 | 
 5 | examples = get_simple_examples(Abs)
 6 | 
 7 | delimiter_pairs = {
 8 |     '|': '|',
 9 |     '\\vert': '\\vert',
10 |     '\\lvert': '\\rvert'
11 | }
12 | 
13 | 
14 | @pytest.mark.parametrize('input, output, symbolically', examples)
15 | def test_abs(input, output, symbolically):
16 |     for left, right in delimiter_pairs.items():
17 |         assert_equal("{left}{input}{right}".format(left=left, right=right, input=input), output, symbolically=symbolically)
18 |         assert_equal("\\left{left}{input}\\right{right}".format(left=left, right=right, input=input), output, symbolically=symbolically)
19 |         assert_equal("\\mleft{left}{input}\\mright{right}".format(left=left, right=right, input=input), output, symbolically=symbolically)
20 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/all_bad_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal, process_sympy
 2 | import pytest
 3 | 
 4 | 
 5 | def pytest_generate_tests(metafunc):  # parametrizes argument 's' over the BAD_STRINGS list of the test's class
 6 |     metafunc.parametrize('s', metafunc.cls.BAD_STRINGS)
 7 | 
 8 | 
 9 | class TestAllBad(object):
10 |     # These bad latex strings should raise an exception when parsed
11 |     BAD_STRINGS = [
12 |         "(",
13 |         ")",
14 |         # "a / b /",
15 |         "\\frac{d}{dx}",
16 |         "(\\frac{d}{dx})"
17 |         "\\sqrt{}",
18 |         "\\sqrt",
19 |         "{",
20 |         "}",
21 |         # "1.1.1",
22 |         "\\mathit{TEST}"
23 |         "\\frac{2}{}",
24 |         "\\frac{}{2}",
25 |         "\\int",
26 |         # "1 +",
27 |         # "a +",
28 |         "!",
29 |         "!0",
30 |         "_",
31 |         "^",
32 |         # "a // b",
33 |         # "a \\cdot \\cdot b",
34 |         # "a \\div \\div b",
35 |         "a\\mod \\begin{matrix}b\\end{matrix}"
36 |         "|",
37 |         "||x|",
38 |         "\\lfloor x",
39 |         "\\lfloor a \\rceil",
40 |         "\\operatorname{floor}(12.3, 123.4)",
41 |         "()",
42 |         "((((((((((((((((()))))))))))))))))",
43 |         "-",
44 |         "\\frac{d}{dx} + \\frac{d}{dt}",
45 |         # "f()",
46 |         # "f(,",
47 |         # "f(x,,y)",
48 |         # "f(x,y,",
49 |         "\\sin^x",
50 |         "\\cos^2",
51 |         # "\\cos 1 \\cos",
52 |         # "\\gcd(3)",
53 |         # "\\lcm(2)",
54 |         "@", "#", "$", "%", "&", "*",
55 |         "\\",
56 |         "~",
57 |         "\\frac{(2 + x}{1 - x)}",
58 |         "\\lim_{\\pi \\to 3} a",
59 |         # because mix of COMMA and SEMICOLON
60 |         "\\left\\{\\begin{pmatrix}1\\\\2\\\\3\\end{pmatrix},\\begin{pmatrix}4\\\\3\\\\1\\end{pmatrix};\\begin{pmatrix}1\\\\1\\\\1\\end{pmatrix}\\right\\}",
61 |         # percentages without numbers before-hand
62 |         "a\\%",
63 |         "\\%100",
64 |         # dollar signs without numbers after
65 |         "\\$"
66 |     ]
67 | 
68 |     def test_bad_string(self, s):
69 |         with pytest.raises(Exception):
70 |             process_sympy(s)
71 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/atom_expr_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal
 2 | import pytest
 3 | from sympy import Symbol, Integer, Pow
 4 | 
 5 | # label, text, symbol_text
 6 | symbols = [
 7 |     ('letter', 'x', 'x'),
 8 |     ('greek letter', '\\lambda', 'lambda'),
 9 |     ('greek letter w/ space', '\\alpha ', 'alpha'),
10 |     ('accented letter', '\\overline{x}', 'xbar')
11 | ]
12 | 
13 | subscripts = [
14 |     ('2'),
15 |     ('{23}'),
16 |     ('i'),
17 |     ('{ij}'),
18 |     ('{i,j}'),
19 |     ('{good}'),
20 |     ('{x^2}')
21 | ]
22 | 
23 | examples = []
24 | for symbol in symbols:
25 |     for subscript in subscripts:
26 |         examples.append(tuple(list(symbol) + [subscript]))
27 | 
28 | 
29 | @pytest.mark.parametrize('label, text, symbol_text, subscript', examples)
30 | def test_with_supexpr(label, text, symbol_text, subscript):
31 |     assert_equal(text + '^2', Pow(Symbol(symbol_text, real=True), Integer(2)))
32 | 
33 | 
34 | @pytest.mark.parametrize('label, text, symbol_text, subscript', examples)
35 | def test_with_subexpr(label, text, symbol_text, subscript):
36 |     assert_equal(text + '_' + subscript, Symbol(symbol_text + '_' + subscript, real=True))
37 | 
38 | 
39 | @pytest.mark.parametrize('label, text, symbol_text, subscript', examples)
40 | def test_with_subexpr_before_supexpr(label, text, symbol_text, subscript):
41 |     assert_equal(text + '_' + subscript + '^2', Pow(Symbol(symbol_text + '_' + subscript, real=True), Integer(2)))
42 | 
43 | 
44 | @pytest.mark.parametrize('label, text, symbol_text, subscript', examples)
45 | def test_with_subexpr_before_supexpr_with_braces(label, text, symbol_text, subscript):
46 |     wrapped_subscript = subscript if '{' in subscript else '{' + subscript + '}'
47 |     assert_equal(text + '_' + wrapped_subscript + '^{2}', Pow(Symbol(symbol_text + '_' + subscript, real=True), Integer(2)))
48 | 
49 | 
50 | @pytest.mark.parametrize('label, text, symbol_text, subscript', examples)
51 | def test_with_supexpr_before_subexpr(label, text, symbol_text, subscript):
52 |     assert_equal(text + '^2_' + subscript, Pow(Symbol(symbol_text + '_' + subscript, real=True), Integer(2)))
53 | 
54 | 
55 | @pytest.mark.parametrize('label, text, symbol_text, subscript', examples)
56 | def test_with_supexpr_before_subexpr_with_braces(label, text, symbol_text, subscript):
57 |     wrapped_subscript = subscript if '{' in subscript else '{' + subscript + '}'
58 |     assert_equal(text + '^{2}_' + wrapped_subscript, Pow(Symbol(symbol_text + '_' + subscript, real=True), Integer(2)))
59 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/binomial_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal, _Add, _Mul, _Pow
 2 | import pytest
 3 | from sympy import binomial, Symbol
 4 | 
 5 | x = Symbol('x', real=True)
 6 | y = Symbol('y', real=True)
 7 | theta = Symbol('theta', real=True)
 8 | gamma = Symbol('gamma', real=True)
 9 | 
10 | # \binom with integer arguments is compared against sympy's binomial(16, 2).
11 | def test_binomial_numeric():
12 |     assert_equal("\\binom{16}{2}", binomial(16, 2))
13 | 
14 | # \binom with the real symbols x and y defined at module level.
15 | def test_binomial_symbols():
16 |     assert_equal("\\binom{x}{y}", binomial(x, y))
17 | 
18 | # \binom with greek-letter commands as arguments.
19 | def test_binomial_greek_symbols():
20 |     assert_equal("\\binom{\\theta}{\\gamma}", binomial(theta, gamma))
21 | 
22 | # \binom with expression arguments; the expected value is built with evaluate=False.
23 | def test_binomial_expr():
24 |     assert_equal("\\binom{16+2}{\\frac{4}{2}}", binomial(_Add(16, 2), _Mul(4, _Pow(2, -1)), evaluate=False))
25 | 
26 | # \choose{..}{..} with integer arguments is compared against the same binomial value.
27 | def test_choose_numeric():
28 |     assert_equal("\\choose{16}{2}", binomial(16, 2))
29 | 
30 | # \choose with the real symbols x and y.
31 | def test_choose_symbols():
32 |     assert_equal("\\choose{x}{y}", binomial(x, y))
33 | 
34 | # \choose with greek-letter commands as arguments.
35 | def test_choose_greek_symbols():
36 |     assert_equal("\\choose{\\theta}{\\gamma}", binomial(theta, gamma))
37 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/ceil_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal, get_simple_examples
 2 | import pytest
 3 | from sympy import ceiling
 4 | 
 5 | examples = get_simple_examples(ceiling)
 6 | 
 7 | 
 8 | @pytest.mark.parametrize('input, output, symbolically', examples)
 9 | def test_ceil_func(input, output, symbolically):
10 |     assert_equal("\\ceil({input})".format(input=input), output, symbolically=symbolically)
11 | 
12 | 
13 | @pytest.mark.parametrize('input, output, symbolically', examples)
14 | def test_ceil_operatorname(input, output, symbolically):
15 |     assert_equal("\\operatorname{{ceil}}({input})".format(input=input), output, symbolically=symbolically)
16 | 
17 | 
18 | @pytest.mark.parametrize('input, output, symbolically', examples)
19 | def test_ceil_cmd(input, output, symbolically):
20 |     assert_equal("\\lceil {input}\\rceil".format(input=input), output, symbolically=symbolically)
21 |     assert_equal("\\left\\lceil {input}\\right\\rceil".format(input=input), output, symbolically=symbolically)
22 |     assert_equal("\\mleft\\lceil {input}\\mright\\rceil".format(input=input), output, symbolically=symbolically)
23 | 
24 | 
25 | @pytest.mark.parametrize('input, output, symbolically', examples)
26 | def test_ceil_corners(input, output, symbolically):
27 |     assert_equal("\\ulcorner {input}\\urcorner".format(input=input), output, symbolically=symbolically)
28 |     assert_equal("\\left\\ulcorner {input}\\right\\urcorner".format(input=input), output, symbolically=symbolically)
29 |     assert_equal("\\mleft\\ulcorner {input}\\mright\\urcorner".format(input=input), output, symbolically=symbolically)
30 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/complex_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal
 2 | import pytest
 3 | from sympy import Sum, I, Symbol, Integer
 4 | 
 5 | a = Symbol('a', real=True)
 6 | b = Symbol('b', real=True)
 7 | i = Symbol('i', real=True)
 8 | n = Symbol('n', real=True)
 9 | x = Symbol('x', real=True)
10 | 
11 | # Capital I is expected to parse as the imaginary unit, giving a + I*b.
12 | def test_complex():
13 |     assert_equal("a+Ib", a + I * b)
14 | 
15 | # e raised to I*pi is expected to compare equal to the integer -1.
16 | def test_complex_e():
17 |     assert_equal("e^{I\\pi}", Integer(-1))
18 | 
19 | # Lowercase i is the ordinary real symbol defined above, used here as the summation index.
20 | def test_complex_sum():
21 |     assert_equal("\\sum_{i=0}^{n} i \\cdot x", Sum(i * x, (i, 0, n)))
22 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/exp_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal
 2 | import pytest
 3 | from sympy import exp, sin, Symbol, E
 4 | 
 5 | x = Symbol('x', real=True)
 6 | y = Symbol('y', real=True)
 7 | 
 8 | # A bare "e" is compared against both E and exp(1).
 9 | def test_exp_letter():
10 |     assert_equal("e", E)
11 |     assert_equal("e", exp(1))
12 | 
13 | # \exp with a parenthesised argument.
14 | def test_exp_func():
15 |     assert_equal("\\exp(3)", exp(3))
16 | 
17 | # \exp immediately followed by its argument, with no delimiters.
18 | def test_exp_func_no_delim():
19 |     assert_equal("\\exp3", exp(3))
20 | 
21 | # The \exponentialE command on its own is compared against both E and exp(1).
22 | def test_exp_command_symbol():
23 |     assert_equal("\\exponentialE", E)
24 |     assert_equal("\\exponentialE", exp(1))
25 | 
26 | # \exponentialE with a braced superscript is compared against exp(3).
27 | def test_exp_command_symbol_expression():
28 |     assert_equal("\\exponentialE^{3}", exp(3))
29 | 
30 | # Parentheses, \left( \right) and \times after \exponentialE are all expected to mean E * 3.
31 | def test_exp_command_symbol_multiplied():
32 |     '''
33 |     \\exponentialE is NOT a function, so using the following notation equates to multiplication
34 |     '''
35 |     assert_equal("\\exponentialE (3)", E * 3)
36 |     assert_equal("\\exponentialE \\left( 3\\right)", E * 3)
37 |     assert_equal("\\exponentialE \\times 3", E * 3)
38 | 
39 | # e with an unbraced numeric exponent.
40 | def test_exp_numeric():
41 |     assert_equal("e^3", exp(3))
42 | 
43 | # e with an unbraced symbol exponent.
44 | def test_exp_symbol():
45 |     assert_equal("e^x", exp(x))
46 | 
47 | # e with a braced sum as exponent.
48 | def test_exp_symbol_expr():
49 |     assert_equal("e^{x+y}", exp(x + y))
50 | 
51 | # Same exponent as above, additionally wrapped in parentheses inside the braces.
52 | def test_exp_symbol_expr_group():
53 |     assert_equal("e^{(x+y)}", exp(x + y))
54 | 
55 | # e^x used as a factor in a product written with an explicit "*".
56 | def test_exp_expr():
57 |     assert_equal("\\sin(x)*e^x", sin(x) * exp(x))
58 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/floor_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal, get_simple_examples
 2 | import pytest
 3 | from sympy import floor
 4 | 
 5 | examples = get_simple_examples(floor)
 6 | 
 7 | 
 8 | @pytest.mark.parametrize('input, output, symbolically', examples)
 9 | def test_floor_func(input, output, symbolically):
10 |     assert_equal("\\floor({input})".format(input=input), output, symbolically=symbolically)
11 | 
12 | 
13 | @pytest.mark.parametrize('input, output, symbolically', examples)
14 | def test_floor_operatorname(input, output, symbolically):
15 |     assert_equal("\\operatorname{{floor}}({input})".format(input=input), output, symbolically=symbolically)
16 | 
17 | 
18 | @pytest.mark.parametrize('input, output, symbolically', examples)
19 | def test_floor_cmd(input, output, symbolically):
20 |     assert_equal("\\lfloor {input}\\rfloor".format(input=input), output, symbolically=symbolically)
21 |     assert_equal("\\left\\lfloor {input}\\right\\rfloor".format(input=input), output, symbolically=symbolically)
22 |     assert_equal("\\mleft\\lfloor {input}\\mright\\rfloor".format(input=input), output, symbolically=symbolically)
23 | 
24 | 
25 | @pytest.mark.parametrize('input, output, symbolically', examples)
26 | def test_floor_corners(input, output, symbolically):
27 |     assert_equal("\\llcorner {input}\\lrcorner".format(input=input), output, symbolically=symbolically)
28 |     assert_equal("\\left\\llcorner {input}\\right\\lrcorner".format(input=input), output, symbolically=symbolically)
29 |     assert_equal("\\mleft\\llcorner {input}\\mright\\lrcorner".format(input=input), output, symbolically=symbolically)
30 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/greek_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal
 2 | import pytest
 3 | from sympy import Symbol
 4 | 
 5 | epsilon_upper = Symbol('char"000190', real=True)
 6 | epsilon_lower = Symbol('epsilon', real=True)
 7 | varepsilon = Symbol('varepsilon', real=True)
 8 | 
 9 | # \epsilon is compared against the real symbol named 'epsilon'.
10 | def test_greek_epsilon():
11 |     assert_equal("\\epsilon", epsilon_lower)
12 | 
13 | # The \char"000190 form is compared against a real symbol whose name is the literal text char"000190.
14 | def test_greek_epsilon_upper():
15 |     assert_equal('\\char"000190', epsilon_upper)
16 | 
17 | # \varepsilon is compared against its own symbol 'varepsilon', distinct from 'epsilon'.
18 | def test_greek_varepsilon():
19 |     assert_equal('\\varepsilon', varepsilon)
20 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/grouping_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal, _Pow, _Add, _Mul
 2 | import pytest
 3 | from sympy import Integral, sin, Symbol, Mul, Integer, Pow
 4 | from latex2sympy.latex2sympy2 import latex2sympy as process_sympy
 5 | 
 6 | a = Symbol('a', real=True)
 7 | b = Symbol('b', real=True)
 8 | x = Symbol('x', real=True)
 9 | theta = Symbol('theta', real=True)
10 | 
11 | 
12 | func_arg_examples = [
13 |     ('\\int ', 'x dx', Integral(x, x)),
14 |     ('\\sin', '\\theta ', sin(theta))
15 | ]
16 | 
17 | example_groups = [
18 |     ('1+2', '3-4', _Mul(_Add(1, 2), _Add(3, _Mul(-1, 4))))
19 | ]
20 | 
21 | modifiable_delimiter_pairs = {
22 |     '(': ')',
23 |     '\\lgroup': '\\rgroup',
24 |     '\\{': '\\}',
25 |     '\\lbrace': '\\rbrace',
26 |     '[': ']',
27 |     '\\lbrack': '\\rbrack',
28 | }
29 | 
30 | 
31 | @pytest.mark.parametrize('func, args, output', func_arg_examples)
32 | def test_func_arg_groupings(func, args, output):
33 |     # none
34 |     assert_equal("{func} {args}".format(func=func, args=args), output)
35 |     # normal brace (not modifiable)
36 |     assert_equal("{func}{{{args}}}".format(func=func, args=args), output)
37 |     # rest of delimiters, with modifications
38 |     for left, right in modifiable_delimiter_pairs.items():
39 |         assert_equal("{func}{left}{args}{right}".format(left=left, right=right, func=func, args=args), output)
40 |         assert_equal("{func}\\left{left}{args}\\right{right}".format(left=left, right=right, func=func, args=args), output)
41 |         assert_equal("{func}\\mleft{left}{args}\\mright{right}".format(left=left, right=right, func=func, args=args), output)
42 | 
43 | 
44 | @pytest.mark.parametrize('group1, group2, output', example_groups)
45 | def test_delimiter_groupings(group1, group2, output):
46 |     # normal brace (not modifiable)
47 |     assert_equal("{{{group1}}}{{{group2}}}".format(group1=group1, group2=group2), output)
48 |     # rest of delimiters, with modifications
49 |     for left, right in modifiable_delimiter_pairs.items():
50 |         assert_equal("{left}{group1}{right}{left}{group2}{right}".format(left=left, right=right, group1=group1, group2=group2), output)
51 |         assert_equal("\\left{left}{group1}\\right{right}\\left{left}{group2}\\right{right}".format(left=left, right=right, group1=group1, group2=group2), output)
52 |         assert_equal("\\mleft{left}{group1}\\mright{right}\\mleft{left}{group2}\\mright{right}".format(left=left, right=right, group1=group1, group2=group2), output)
53 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/left_right_cdot_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal
 2 | import pytest
 3 | from sympy import sin, Symbol
 4 | 
 5 | x = Symbol('x', real=True)
 6 | 
 7 | # \sin with a \left( \right) argument followed by \cdot is compared against sin(x) * x.
 8 | def test_left_right_cdot():
 9 |     assert_equal("\\sin\\left(x\\right)\\cdot x", sin(x) * x)
10 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/linalg_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal
 2 | import pytest
 3 | from sympy import MatMul, Matrix
 4 | 
 5 | # Literal matrix times \variable{v}; the dict is passed as assert_equal's third argument (presumably placeholder values - confirm in context.py).
 6 | def test_linalg_placeholder():
 7 |     assert_equal("\\begin{pmatrix}1&2\\\\3&4\\end{pmatrix}\\cdot\\variable{v}", MatMul(Matrix([[1, 2], [3, 4]]), Matrix([1, 2])), {'v': Matrix([1, 2])})
 8 | 
 9 | # Both factors are \variable placeholders, with entries for 'M' and 'v' in the dict.
10 | def test_linalg_placeholder_multiple():
11 |     assert_equal("\\variable{M}\\cdot\\variable{v}", MatMul(Matrix([[1, 2], [3, 4]]), Matrix([1, 2])), {'M': Matrix([[1, 2], [3, 4]]), 'v': Matrix([1, 2])})
12 | 
13 | # A literal row matrix followed by two placeholders; expected value is a three-factor MatMul.
14 | def test_linalg_placeholder_multiple_mul():
15 |     assert_equal("\\begin{pmatrix}3&-1\\end{pmatrix}\\cdot\\variable{M}\\cdot\\variable{v}", MatMul(Matrix([[3, -1]]), Matrix([[1, 2], [3, 4]]), Matrix([1, 2])), {'M': Matrix([[1, 2], [3, 4]]), 'v': Matrix([1, 2])})
16 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/overline_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal
 2 | import pytest
 3 | from sympy import sin, Symbol
 4 | 
 5 | x = Symbol('x', real=True)
 6 | 
 7 | # \overline{x}_n in a denominator is compared against the real symbol named 'xbar_n'.
 8 | def test_overline():
 9 |     assert_equal("\\frac{\\sin(x)}{\\overline{x}_n}", sin(x) / Symbol('xbar_n', real=True))
10 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/pi_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal, _Mul, _Pow
 2 | import pytest
 3 | from sympy import pi, Symbol, acos, cos
 4 | 
 5 | # \frac{\pi}{3} is compared against pi * 3**-1 built with the _Mul/_Pow helpers from context.
 6 | def test_pi_frac():
 7 |     assert_equal("\\frac{\\pi}{3}", _Mul(pi, _Pow(3, -1)))
 8 | 
 9 | # Nested \arccos{\cos{...}}; the expected value is built with evaluate=False at both levels.
10 | def test_pi_nested():
11 |     assert_equal("\\arccos{\\cos{\\frac{\\pi}{3}}}", acos(cos(_Mul(pi, _Pow(3, -1)), evaluate=False), evaluate=False))
12 | 
13 | # \arccos{-1} against pi with symbolically=True (presumably a simplified comparison - confirm in context.py).
14 | def test_pi_arccos():
15 |     assert_equal("\\arccos{-1}", pi, symbolically=True)
16 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/latex2sympy/tests/trig_test.py:
--------------------------------------------------------------------------------
 1 | from .context import assert_equal
 2 | import pytest
 3 | from sympy import asinh, Symbol
 4 | 
 5 | # x = Symbol('x', real=True);
 6 | 
 7 | # latex = "\\sinh(x)"
 8 | # math = process_sympy(latex)
 9 | # print("latex: %s to math: %s" %(latex,math))
10 | #
11 | # latex = "\\arcsinh(x)"
12 | # math = process_sympy(latex)
13 | # print("latex: %s to math: %s" %(latex,math))
14 | #
15 | # latex = "\\arsinh(x)"
16 | # math = process_sympy(latex)
17 | # print("latex: %s to math: %s" %(latex,math))
18 | 
19 | # \operatorname{arcsinh} with a \left( \right) argument is compared against asinh(1, evaluate=False).
20 | def test_arcsinh():
21 |     assert_equal("\\operatorname{arcsinh}\\left(1\\right)", asinh(1, evaluate=False))
22 | 


--------------------------------------------------------------------------------
/tools/evaluate_math/requirements.txt:
--------------------------------------------------------------------------------
 1 | # common
 2 | vllm
 3 | tqdm
 4 | datasets
 5 | torch
 6 | transformers
 7 | python_dateutil
 8 | flash_attn
 9 | 
10 | # math_eval
11 | sympy==1.12
12 | antlr4-python3-runtime==4.11.1 # ! The version needs to be compatible with sympy.
13 | word2number
14 | Pebble
15 | timeout-decorator


--------------------------------------------------------------------------------
/tools/evaluate_math/scripts/evaluate_deepseek.sh:
--------------------------------------------------------------------------------
 1 | # Run math_eval.py over the math benchmark list with the deepseek-math prompt.
 2 | # Usage: bash evaluate_deepseek.sh MODEL_NAME_OR_PATH OUTPUT_DIR SUMMARY_PATH
 3 | # The script changes to the parent of the current working directory before
 4 | # launching math_eval.py, so relative paths are resolved from there.
 5 | set -ex
 6 | 
 7 | PROMPT_TYPE="deepseek-math"
 8 | MODEL_NAME_OR_PATH=$1
 9 | OUTPUT_DIR=$2
10 | SUMMARY_PATH=$3
11 | SPLIT="test"
12 | NUM_TEST_SAMPLE=-1
13 | 
14 | cd ..
15 | # Create the output directory only after the cd, so that a relative OUTPUT_DIR
16 | # names the same directory here and in the math_eval.py call below.
17 | mkdir -p "$OUTPUT_DIR"
18 | 
19 | DATA_NAME="math,minerva_math,gsm8k,olympiadbench,aime24,amc23,theoremqa"
20 | # Path-like arguments are quoted so values containing spaces stay one argument.
21 | TOKENIZERS_PARALLELISM=false \
22 | python3 -u math_eval.py \
23 |     --model_name_or_path "${MODEL_NAME_OR_PATH}" \
24 |     --data_name "${DATA_NAME}" \
25 |     --output_dir "${OUTPUT_DIR}" \
26 |     --summary_path "${SUMMARY_PATH}" \
27 |     --split "${SPLIT}" \
28 |     --prompt_type "${PROMPT_TYPE}" \
29 |     --num_test_sample "${NUM_TEST_SAMPLE}" \
30 |     --seed 0 \
31 |     --temperature 0 \
32 |     --n_sampling 1 \
33 |     --top_p 1 \
34 |     --start 0 \
35 |     --end -1 \
36 |     --use_vllm \
37 |     --save_outputs
38 | # Optional flag, currently disabled: --overwrite


--------------------------------------------------------------------------------
/tools/evaluate_math/scripts/evaluate_qwen.sh:
--------------------------------------------------------------------------------
 1 | # Run math_eval.py over the math benchmark list with the qwen25-math-cot prompt.
 2 | # Usage: bash evaluate_qwen.sh MODEL_NAME_OR_PATH OUTPUT_DIR SUMMARY_PATH
 3 | # The script changes to the parent of the current working directory before
 4 | # launching math_eval.py, so relative paths are resolved from there.
 5 | set -ex
 6 | 
 7 | PROMPT_TYPE="qwen25-math-cot"
 8 | MODEL_NAME_OR_PATH=$1
 9 | OUTPUT_DIR=$2
10 | SUMMARY_PATH=$3
11 | SPLIT="test"
12 | NUM_TEST_SAMPLE=-1
13 | 
14 | cd ..
15 | # Create the output directory only after the cd, so that a relative OUTPUT_DIR
16 | # names the same directory here and in the math_eval.py call below.
17 | mkdir -p "$OUTPUT_DIR"
18 | 
19 | DATA_NAME="math,minerva_math,gsm8k,olympiadbench,amc23,aime24,theoremqa"
20 | # DATA_NAME="minerva_math"
21 | # Path-like arguments are quoted so values containing spaces stay one argument.
22 | TOKENIZERS_PARALLELISM=false \
23 | python3 -u math_eval.py \
24 |     --model_name_or_path "${MODEL_NAME_OR_PATH}" \
25 |     --data_name "${DATA_NAME}" \
26 |     --output_dir "${OUTPUT_DIR}" \
27 |     --summary_path "${SUMMARY_PATH}" \
28 |     --split "${SPLIT}" \
29 |     --prompt_type "${PROMPT_TYPE}" \
30 |     --num_test_sample "${NUM_TEST_SAMPLE}" \
31 |     --seed 0 \
32 |     --temperature 0 \
33 |     --n_sampling 1 \
34 |     --top_p 1 \
35 |     --start 0 \
36 |     --end -1 \
37 |     --use_vllm \
38 |     --save_outputs
39 | # Optional flag, currently disabled: --overwrite
40 | 
41 | 
42 | #DATA_NAME="aime24"
43 | #TOKENIZERS_PARALLELISM=false \
44 | #python3 -u math_eval.py \
45 | #    --model_name_or_path ${MODEL_NAME_OR_PATH} \
46 | #    --data_name ${DATA_NAME} \
47 | #    --output_dir ${OUTPUT_DIR} \
48 | #    --summary_path ${SUMMARY_PATH} \
49 | #    --split ${SPLIT} \
50 | #    --prompt_type ${PROMPT_TYPE} \
51 | #    --num_test_sample ${NUM_TEST_SAMPLE} \
52 | #    --seed 0 \
53 | #    --temperature 0.8 \
54 | #    --n_sampling 1 \
55 | #    --top_p 1 \
56 | #    --start 0 \
57 | #    --end -1 \
58 | #    --use_vllm \
59 | #    --save_outputs \
60 | #    # --overwrite \
61 | 


--------------------------------------------------------------------------------
/tools/evaluate_mmlu-pro/cot_prompt_lib/initial_prompt.txt:
--------------------------------------------------------------------------------
1 | The following are multiple choice questions (with answers) about {$}. Think step by step and then finish your answer with "the answer is (X)" where X is the correct letter choice.
2 | 
3 | 
4 | 


--------------------------------------------------------------------------------
/tools/evaluate_mmlu-pro/cot_prompt_lib/initial_prompt_1.txt:
--------------------------------------------------------------------------------
1 | <|im_start|>system
2 | Please reason step by step, and put your answer with "the answer is (X)" where X is the correct letter choice.<|im_end|>
3 | 


--------------------------------------------------------------------------------
/tools/evaluate_mmlu-pro/cot_prompt_lib/initial_prompt_2.txt:
--------------------------------------------------------------------------------
1 | <|im_start|>system
2 | The following are multiple choice questions (with answers) about {$}. Think step by step and then finish your answer with "the answer is (X)" where X is the correct letter choice.<|im_end|>
3 | 


--------------------------------------------------------------------------------
/tools/evaluate_mmlu-pro/mmlu-pro-eval.sh:
--------------------------------------------------------------------------------
 1 | # Run evaluate_from_local.py from the current working directory.
 2 | # Usage: bash mmlu-pro-eval.sh MODEL_PATH OUTPUT_DIR SUMMARY_PATH N_SHOT
 3 | set -ex
 4 | 
 5 | model_path=$1
 6 | output_dir=$2
 7 | summary_path=$3
 8 | n_shot=$4
 9 | 
10 | # Arguments are quoted so paths containing spaces are passed as one argument.
11 | python evaluate_from_local.py \
12 |     --ntrain "$n_shot" \
13 |     --model "$model_path" \
14 |     --save_dir "$output_dir" \
15 |     --global_record_file "$summary_path"
16 | 


--------------------------------------------------------------------------------
/tools/scripts/download_data.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | set -ex
3 | # The cd is relative to the current working directory, not to this script's location.
4 | cd ../download_data
5 | python download_cft_data_hf.py --config 4k 50k  # passes the two values 4k and 50k to --config
6 | 


--------------------------------------------------------------------------------
/tools/scripts/evaluate.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | # Run the math, GPQA and MMLU-Pro evaluation scripts in sequence for one model.
 3 | # Every cd below is relative to the current working directory.
 4 | set -ex
 5 | 
 6 | model_path="/path/to/model"
 7 | output_dir="../evaluation_output"
 8 | summary_path="../evaluation_summary.txt"
 9 | 
10 | export CUDA_VISIBLE_DEVICES=0,1,2,3
11 | 
12 | # Arguments are quoted so a model or output path containing spaces is passed
13 | # to each script as a single argument.
14 | cd ../evaluate_math/scripts
15 | bash evaluate_qwen.sh "${model_path}" "${output_dir}" "${summary_path}"
16 | 
17 | cd ../../evaluate_gpqa/scripts
18 | bash evaluate_gpqa.sh "${model_path}" "${output_dir}" "${summary_path}"
19 | 
20 | cd ../../evaluate_mmlu-pro
21 | # The trailing 0 is the fourth positional argument of mmlu-pro-eval.sh (n_shot).
22 | bash mmlu-pro-eval.sh "${model_path}" "${output_dir}" "${summary_path}" 0
23 | 


--------------------------------------------------------------------------------
/tools/self_construct_critique_data/run.sh:
--------------------------------------------------------------------------------
1 | # YOUR_API_KEY below is a placeholder value; presumably it must be replaced with a real key before running.
2 | export OPENAI_API_KEY=YOUR_API_KEY
3 | # Runs generate_critique_by_api.py from the current directory with the model name and process count given below.
4 | python generate_critique_by_api.py --model_name "gpt-4o-2024-11-20" --num_processes 20
5 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/.env.local:
--------------------------------------------------------------------------------
 1 | # Note: actually we do not support .env, just for reference
 2 | # api
 3 | API_HOST=
 4 | API_PORT=
 5 | API_KEY=
 6 | API_MODEL_NAME=
 7 | FASTAPI_ROOT_PATH=
 8 | MAX_CONCURRENT=
 9 | # general
10 | DISABLE_VERSION_CHECK=
11 | FORCE_CHECK_IMPORTS=
12 | LLAMAFACTORY_VERBOSITY=
13 | USE_MODELSCOPE_HUB=
14 | USE_OPENMIND_HUB=
15 | RECORD_VRAM=
16 | # torchrun
17 | FORCE_TORCHRUN=
18 | MASTER_ADDR=
19 | MASTER_PORT=
20 | NNODES=
21 | NODE_RANK=
22 | NPROC_PER_NODE=
23 | # wandb
24 | WANDB_DISABLED=
25 | WANDB_PROJECT=
26 | WANDB_API_KEY=
27 | # gradio ui
28 | GRADIO_SHARE=
29 | GRADIO_SERVER_NAME=
30 | GRADIO_SERVER_PORT=
31 | GRADIO_ROOT_PATH=
32 | GRADIO_IPV6=
33 | # setup
34 | ENABLE_SHORT_CONSOLE=1
35 | # reserved (do not use)
36 | LLAMABOARD_ENABLED=
37 | LLAMABOARD_WORKDIR=
38 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/.gitattributes:
--------------------------------------------------------------------------------
1 | # Auto detect text files and perform LF normalization
2 | * text=auto
3 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/.pre-commit-config.yaml:
--------------------------------------------------------------------------------
 1 | repos:
 2 | -   repo: https://github.com/pre-commit/pre-commit-hooks
 3 |     rev: v5.0.0
 4 |     hooks:
 5 |     -   id: check-ast
 6 |     -   id: check-added-large-files
 7 |         args: ['--maxkb=25000']
 8 |     -   id: check-merge-conflict
 9 |     -   id: check-yaml
10 |     -   id: debug-statements
11 |     -   id: end-of-file-fixer
12 |     -   id: trailing-whitespace
13 |         args: [--markdown-linebreak-ext=md]
14 |     -   id: no-commit-to-branch
15 |         args: ['--branch', 'main']
16 | 
17 | -   repo: https://github.com/asottile/pyupgrade
18 |     rev: v3.17.0
19 |     hooks:
20 |     -   id: pyupgrade
21 |         args: [--py38-plus]
22 | 
23 | -   repo: https://github.com/astral-sh/ruff-pre-commit
24 |     rev: v0.6.9
25 |     hooks:
26 |     -   id: ruff
27 |         args: [--fix]
28 |     -   id: ruff-format
29 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/CITATION.cff:
--------------------------------------------------------------------------------
 1 | cff-version: 1.2.0
 2 | date-released: 2024-03
 3 | message: "If you use this software, please cite it as below."
 4 | authors:
 5 | - family-names: "Zheng"
 6 |   given-names: "Yaowei"
 7 | - family-names: "Zhang"
 8 |   given-names: "Richong"
 9 | - family-names: "Zhang"
10 |   given-names: "Junhao"
11 | - family-names: "Ye"
12 |   given-names: "Yanhan"
13 | - family-names: "Luo"
14 |   given-names: "Zheyan"
15 | - family-names: "Feng"
16 |   given-names: "Zhangchi"
17 | - family-names: "Ma"
18 |   given-names: "Yongqiang"
19 | title: "LlamaFactory: Unified Efficient Fine-Tuning of 100+ Language Models"
20 | url: "https://arxiv.org/abs/2403.13372"
21 | preferred-citation:
22 |   type: conference-paper
23 |   conference:
24 |     name: "Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 3: System Demonstrations)"
25 |   authors:
26 |     - family-names: "Zheng"
27 |       given-names: "Yaowei"
28 |     - family-names: "Zhang"
29 |       given-names: "Richong"
30 |     - family-names: "Zhang"
31 |       given-names: "Junhao"
32 |     - family-names: "Ye"
33 |       given-names: "Yanhan"
34 |     - family-names: "Luo"
35 |       given-names: "Zheyan"
36 |     - family-names: "Feng"
37 |       given-names: "Zhangchi"
38 |     - family-names: "Ma"
39 |       given-names: "Yongqiang"
40 |   title: "LlamaFactory: Unified Efficient Fine-Tuning of 100+ Language Models"
41 |   url: "https://arxiv.org/abs/2403.13372"
42 |   year: 2024
43 |   publisher: "Association for Computational Linguistics"
44 |   address: "Bangkok, Thailand"
45 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/MANIFEST.in:
--------------------------------------------------------------------------------
1 | include LICENSE requirements.txt
2 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/Makefile:
--------------------------------------------------------------------------------
 1 | .PHONY: build commit quality style test
 2 | 
 3 | check_dirs := scripts src tests setup.py
 4 | 
 5 | build:
 6 | 	pip install build && python -m build
 7 | 
 8 | commit:
 9 | 	pre-commit install
10 | 	pre-commit run --all-files
11 | 
12 | quality:
13 | 	ruff check $(check_dirs)
14 | 	ruff format --check $(check_dirs)
15 | 
16 | style:
17 | 	ruff check $(check_dirs) --fix
18 | 	ruff format $(check_dirs)
19 | 
20 | test:
21 | 	CUDA_VISIBLE_DEVICES= WANDB_DISABLED=true pytest -vv tests/
22 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/assets/logo.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/assets/logo.png


--------------------------------------------------------------------------------
/train/LLaMA-Factory/assets/wechat.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/assets/wechat.jpg


--------------------------------------------------------------------------------
/train/LLaMA-Factory/assets/wechat_npu.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/assets/wechat_npu.jpg


--------------------------------------------------------------------------------
/train/LLaMA-Factory/data/mllm_demo_data/1.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/data/mllm_demo_data/1.jpg


--------------------------------------------------------------------------------
/train/LLaMA-Factory/data/mllm_demo_data/1.mp4:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/data/mllm_demo_data/1.mp4


--------------------------------------------------------------------------------
/train/LLaMA-Factory/data/mllm_demo_data/2.avi:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/data/mllm_demo_data/2.avi


--------------------------------------------------------------------------------
/train/LLaMA-Factory/data/mllm_demo_data/2.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/data/mllm_demo_data/2.jpg


--------------------------------------------------------------------------------
/train/LLaMA-Factory/data/mllm_demo_data/3.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/data/mllm_demo_data/3.jpg


--------------------------------------------------------------------------------
/train/LLaMA-Factory/data/mllm_demo_data/3.mp4:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/data/mllm_demo_data/3.mp4


--------------------------------------------------------------------------------
/train/LLaMA-Factory/data/mllm_video_demo.json:
--------------------------------------------------------------------------------
 1 | [
 2 |   {
 3 |     "messages": [
 4 |       {
 5 |         "content": "<video>Why is this video funny?",
 6 |         "role": "user"
 7 |       },
 8 |       {
 9 |         "content": "Because a baby is reading, and he is so cute!",
10 |         "role": "assistant"
11 |       }
12 |     ],
13 |     "videos": [
14 |       "mllm_demo_data/1.mp4"
15 |     ]
16 |   },
17 |   {
18 |     "messages": [
19 |       {
20 |         "content": "<video>What is she doing?",
21 |         "role": "user"
22 |       },
23 |       {
24 |         "content": "She is cooking.",
25 |         "role": "assistant"
26 |       }
27 |     ],
28 |     "videos": [
29 |       "mllm_demo_data/2.avi"
30 |     ]
31 |   },
32 |   {
33 |     "messages": [
34 |       {
35 |         "content": "<video>What's in the video?",
36 |         "role": "user"
37 |       },
38 |       {
39 |         "content": "A baby is playing in the living room.",
40 |         "role": "assistant"
41 |       }
42 |     ],
43 |     "videos": [
44 |       "mllm_demo_data/3.mp4"
45 |     ]
46 |   }
47 | ]
48 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/data/ultra_chat/ultra_chat.py:
--------------------------------------------------------------------------------
 1 | import json
 2 | import os
 3 | from typing import List
 4 | 
 5 | import datasets
 6 | 
 7 | 
 8 | _HF_ENDPOINT = os.getenv("HF_ENDPOINT", "https://huggingface.co")
 9 | 
10 | _DESCRIPTION = "UltraChat: Large-scale, Informative, and Diverse Multi-round Dialogue Data."
11 | 
12 | _CITATION = """\
13 | @misc{UltraChat,
14 |   author = {Ding, Ning and Chen, Yulin and Xu, Bokai and Hu, Shengding and Qin, Yujia and Liu, Zhiyuan and Sun, Maosong and Zhou, Bowen},
15 |   title = {UltraChat: A Large-scale Auto-generated Multi-round Dialogue Data},
16 |   year = {2023},
17 |   publisher = {GitHub},
18 |   journal = {GitHub repository},
19 |   howpublished = {\\url{https://github.com/thunlp/ultrachat}},
20 | }
21 | """
22 | 
23 | _HOMEPAGE = f"{_HF_ENDPOINT}/datasets/stingning/ultrachat"
24 | _LICENSE = "cc-by-nc-4.0"
25 | _BASE_DATA_URL = f"{_HF_ENDPOINT}/datasets/stingning/ultrachat/resolve/main/train_{{idx}}.jsonl"
26 | 
27 | 
class UltraChat(datasets.GeneratorBasedBuilder):
    """Dataset builder that exposes the UltraChat JSONL shards as alternating human/gpt conversations."""

    VERSION = datasets.Version("0.0.0")

    def _info(self):
        """Return the dataset metadata; each example holds a ``conversations`` list of from/value strings."""
        turn_schema = {"from": datasets.Value("string"), "value": datasets.Value("string")}
        return datasets.DatasetInfo(
            description=_DESCRIPTION,
            features=datasets.Features({"conversations": [turn_schema]}),
            homepage=_HOMEPAGE,
            license=_LICENSE,
            citation=_CITATION,
        )

    def _split_generators(self, dl_manager: datasets.DownloadManager):
        """Download shards 0-9 built from ``_BASE_DATA_URL`` and expose them as the TRAIN split."""
        shard_paths = []
        for shard_idx in range(10):  # multiple shards
            shard_paths.append(dl_manager.download(_BASE_DATA_URL.format(idx=shard_idx)))

        train_split = datasets.SplitGenerator(name=datasets.Split.TRAIN, gen_kwargs={"filepaths": shard_paths})
        return [train_split]

    def _generate_examples(self, filepaths: List[str]):
        """Yield ``(id, {"conversations": [...]})`` for each usable row of each shard file.

        Rows that cannot be parsed as JSON are skipped. A trailing unpaired turn
        is dropped, and rows left with fewer than two turns are skipped. Turns
        are labelled alternately, starting with "human".
        """
        speakers = ("human", "gpt")
        for shard_path in filepaths:
            with open(shard_path, encoding="utf-8") as shard:
                for line in shard:
                    try:
                        record = json.loads(line)
                    except Exception:
                        continue

                    example_id: int = record["id"]
                    turns: List[str] = record["data"]
                    if len(turns) % 2 != 0:
                        turns.pop()  # drop the unpaired trailing turn
                    if len(turns) >= 2:
                        dialogue = [{"from": speakers[pos % 2], "value": turn} for pos, turn in enumerate(turns)]
                        yield example_id, {"conversations": dialogue}
61 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/docker/docker-cuda/Dockerfile:
--------------------------------------------------------------------------------
 1 | # Default use the NVIDIA official image with PyTorch 2.3.0
 2 | # https://docs.nvidia.com/deeplearning/frameworks/pytorch-release-notes/index.html
 3 | ARG BASE_IMAGE=nvcr.io/nvidia/pytorch:24.02-py3
 4 | FROM ${BASE_IMAGE}
 5 | 
 6 | # Define environments
 7 | ENV MAX_JOBS=4
 8 | ENV FLASH_ATTENTION_FORCE_BUILD=TRUE
 9 | ENV VLLM_WORKER_MULTIPROC_METHOD=spawn
10 | 
11 | # Define installation arguments
12 | ARG INSTALL_BNB=false
13 | ARG INSTALL_VLLM=false
14 | ARG INSTALL_DEEPSPEED=false
15 | ARG INSTALL_FLASHATTN=false
16 | ARG INSTALL_LIGER_KERNEL=false
17 | ARG INSTALL_HQQ=false
18 | ARG INSTALL_EETQ=false
19 | ARG PIP_INDEX=https://pypi.org/simple
20 | 
21 | # Set the working directory
22 | WORKDIR /app
23 | 
24 | # Install the requirements
25 | COPY requirements.txt /app
26 | RUN pip config set global.index-url "$PIP_INDEX" && \
27 |     pip config set global.extra-index-url "$PIP_INDEX" && \
28 |     python -m pip install --upgrade pip && \
29 |     python -m pip install -r requirements.txt
30 | 
31 | # Copy the rest of the application into the image
32 | COPY . /app
33 | 
34 | # Install the LLaMA Factory
35 | RUN EXTRA_PACKAGES="metrics"; \
36 |     if [ "$INSTALL_BNB" == "true" ]; then \
37 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},bitsandbytes"; \
38 |     fi; \
39 |     if [ "$INSTALL_VLLM" == "true" ]; then \
40 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},vllm"; \
41 |     fi; \
42 |     if [ "$INSTALL_DEEPSPEED" == "true" ]; then \
43 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},deepspeed"; \
44 |     fi; \
45 |     if [ "$INSTALL_LIGER_KERNEL" == "true" ]; then \
46 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},liger-kernel"; \
47 |     fi; \
48 |     if [ "$INSTALL_HQQ" == "true" ]; then \
49 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},hqq"; \
50 |     fi; \
51 |     if [ "$INSTALL_EETQ" == "true" ]; then \
52 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},eetq"; \
53 |     fi; \
54 |     pip install -e ".[$EXTRA_PACKAGES]"
55 | 
56 | # Rebuild flash attention
57 | RUN pip uninstall -y transformer-engine flash-attn && \
58 |     if [ "$INSTALL_FLASHATTN" == "true" ]; then \
59 |         pip uninstall -y ninja && pip install ninja && \
60 |         pip install --no-cache-dir flash-attn --no-build-isolation; \
61 |     fi
62 | 
63 | # Set up volumes
64 | VOLUME [ "/root/.cache/huggingface", "/root/.cache/modelscope", "/app/data", "/app/output" ]
65 | 
66 | # Expose port 7860 for the LLaMA Board
67 | ENV GRADIO_SERVER_PORT 7860
68 | EXPOSE 7860
69 | 
70 | # Expose port 8000 for the API service
71 | ENV API_PORT 8000
72 | EXPOSE 8000
73 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/docker/docker-cuda/docker-compose.yml:
--------------------------------------------------------------------------------
 1 | services:
 2 |   llamafactory:
 3 |     build:
 4 |       dockerfile: ./docker/docker-cuda/Dockerfile
 5 |       context: ../..
 6 |       args:
 7 |         INSTALL_BNB: false
 8 |         INSTALL_VLLM: false
 9 |         INSTALL_DEEPSPEED: false
10 |         INSTALL_FLASHATTN: false
11 |         INSTALL_LIGER_KERNEL: false
12 |         INSTALL_HQQ: false
13 |         INSTALL_EETQ: false
14 |         PIP_INDEX: https://pypi.org/simple
15 |     container_name: llamafactory
16 |     volumes:
17 |       - ../../hf_cache:/root/.cache/huggingface
18 |       - ../../ms_cache:/root/.cache/modelscope
19 |       - ../../om_cache:/root/.cache/openmind
20 |       - ../../data:/app/data
21 |       - ../../output:/app/output
22 |     ports:
23 |       - "7860:7860"
24 |       - "8000:8000"
25 |     ipc: host
26 |     tty: true
27 |     shm_size: '16gb'
28 |     stdin_open: true
29 |     command: bash
30 |     deploy:
31 |       resources:
32 |         reservations:
33 |           devices:
34 |           - driver: nvidia
35 |             count: "all"
36 |             capabilities: [gpu]
37 |     restart: unless-stopped
38 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/docker/docker-npu/Dockerfile:
--------------------------------------------------------------------------------
 1 | # Use the Ubuntu 22.04 image with CANN 8.0.rc1
 2 | # More versions can be found at https://hub.docker.com/r/ascendai/cann/tags
 3 | # FROM ascendai/cann:8.0.rc1-910-ubuntu22.04-py3.8
 4 | FROM ascendai/cann:8.0.rc1-910b-ubuntu22.04-py3.8
 5 | # FROM ascendai/cann:8.0.rc1-910-openeuler22.03-py3.8
 6 | # FROM ascendai/cann:8.0.rc1-910b-openeuler22.03-py3.8
 7 | 
 8 | # Define environments
 9 | ENV DEBIAN_FRONTEND=noninteractive
10 | 
11 | # Define installation arguments
12 | ARG INSTALL_DEEPSPEED=false
13 | ARG PIP_INDEX=https://pypi.org/simple
14 | ARG TORCH_INDEX=https://download.pytorch.org/whl/cpu
15 | 
16 | # Set the working directory
17 | WORKDIR /app
18 | 
19 | # Install the requirements
20 | COPY requirements.txt /app
21 | RUN pip config set global.index-url "$PIP_INDEX" && \
22 |     pip config set global.extra-index-url "$TORCH_INDEX" && \
23 |     python -m pip install --upgrade pip && \
24 |     python -m pip install -r requirements.txt
25 | 
26 | # Copy the rest of the application into the image
27 | COPY . /app
28 | 
29 | # Install the LLaMA Factory
30 | RUN EXTRA_PACKAGES="torch-npu,metrics"; \
31 |     if [ "$INSTALL_DEEPSPEED" == "true" ]; then \
32 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},deepspeed"; \
33 |     fi; \
34 |     pip install -e ".[$EXTRA_PACKAGES]"
35 | 
36 | # Set up volumes
37 | VOLUME [ "/root/.cache/huggingface", "/root/.cache/modelscope", "/app/data", "/app/output" ]
38 | 
39 | # Expose port 7860 for the LLaMA Board
40 | ENV GRADIO_SERVER_PORT 7860
41 | EXPOSE 7860
42 | 
43 | # Expose port 8000 for the API service
44 | ENV API_PORT 8000
45 | EXPOSE 8000
46 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/docker/docker-npu/docker-compose.yml:
--------------------------------------------------------------------------------
 1 | services:
 2 |   llamafactory:
 3 |     build:
 4 |       dockerfile: ./docker/docker-npu/Dockerfile
 5 |       context: ../..
 6 |       args:
 7 |         INSTALL_DEEPSPEED: false
 8 |         PIP_INDEX: https://pypi.org/simple
 9 |     container_name: llamafactory
10 |     volumes:
11 |       - ../../hf_cache:/root/.cache/huggingface
12 |       - ../../ms_cache:/root/.cache/modelscope
13 |       - ../../om_cache:/root/.cache/openmind
14 |       - ../../data:/app/data
15 |       - ../../output:/app/output
16 |       - /usr/local/dcmi:/usr/local/dcmi
17 |       - /usr/local/bin/npu-smi:/usr/local/bin/npu-smi
18 |       - /usr/local/Ascend/driver:/usr/local/Ascend/driver
19 |       - /etc/ascend_install.info:/etc/ascend_install.info
20 |     ports:
21 |       - "7860:7860"
22 |       - "8000:8000"
23 |     ipc: host
24 |     tty: true
25 |     shm_size: '16gb'
26 |     stdin_open: true
27 |     command: bash
28 |     devices:
29 |       - /dev/davinci0
30 |       - /dev/davinci_manager
31 |       - /dev/devmm_svm
32 |       - /dev/hisi_hdc
33 |     restart: unless-stopped
34 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/docker/docker-rocm/Dockerfile:
--------------------------------------------------------------------------------
 1 | FROM hardandheavy/transformers-rocm:2.2.0
 2 | 
 3 | # Define environments
 4 | ENV MAX_JOBS=4
 5 | ENV FLASH_ATTENTION_FORCE_BUILD=TRUE
 6 | ENV VLLM_WORKER_MULTIPROC_METHOD=spawn
 7 | 
 8 | # Define installation arguments
 9 | ARG INSTALL_BNB=false
10 | ARG INSTALL_VLLM=false
11 | ARG INSTALL_DEEPSPEED=false
12 | ARG INSTALL_FLASHATTN=false
13 | ARG INSTALL_LIGER_KERNEL=false
14 | ARG INSTALL_HQQ=false
15 | ARG PIP_INDEX=https://pypi.org/simple
16 | 
17 | # Set the working directory
18 | WORKDIR /app
19 | 
20 | # Install the requirements
21 | COPY requirements.txt /app
22 | RUN pip config set global.index-url "$PIP_INDEX" && \
23 |     pip config set global.extra-index-url "$PIP_INDEX" && \
24 |     python -m pip install --upgrade pip && \
25 |     python -m pip install -r requirements.txt
26 | 
27 | # Copy the rest of the application into the image
28 | COPY . /app
29 | 
30 | # Install the LLaMA Factory
31 | RUN EXTRA_PACKAGES="metrics"; \
32 |     if [ "$INSTALL_BNB" == "true" ]; then \
33 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},bitsandbytes"; \
34 |     fi; \
35 |     if [ "$INSTALL_VLLM" == "true" ]; then \
36 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},vllm"; \
37 |     fi; \
38 |     if [ "$INSTALL_DEEPSPEED" == "true" ]; then \
39 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},deepspeed"; \
40 |     fi; \
41 |     if [ "$INSTALL_LIGER_KERNEL" == "true" ]; then \
42 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},liger-kernel"; \
43 |     fi; \
44 |     if [ "$INSTALL_HQQ" == "true" ]; then \
45 |         EXTRA_PACKAGES="${EXTRA_PACKAGES},hqq"; \
46 |     fi; \
47 |     pip install -e ".[$EXTRA_PACKAGES]"
48 | 
49 | # Rebuild flash attention
50 | RUN pip uninstall -y transformer-engine flash-attn && \
51 |     if [ "$INSTALL_FLASHATTN" == "true" ]; then \
52 |         pip uninstall -y ninja && pip install ninja && \
53 |         pip install --no-cache-dir flash-attn --no-build-isolation; \
54 |     fi
55 | 
56 | # Set up volumes
57 | VOLUME [ "/root/.cache/huggingface", "/root/.cache/modelscope", "/app/data", "/app/output" ]
58 | 
59 | # Expose port 7860 for the LLaMA Board
60 | ENV GRADIO_SERVER_PORT 7860
61 | EXPOSE 7860
62 | 
63 | # Expose port 8000 for the API service
64 | ENV API_PORT 8000
65 | EXPOSE 8000
66 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/docker/docker-rocm/docker-compose.yml:
--------------------------------------------------------------------------------
 1 | services:
 2 |   llamafactory:
 3 |     build:
 4 |       dockerfile: ./docker/docker-rocm/Dockerfile
 5 |       context: ../..
 6 |       args:
 7 |         INSTALL_BNB: false
 8 |         INSTALL_VLLM: false
 9 |         INSTALL_DEEPSPEED: false
10 |         INSTALL_FLASHATTN: false
11 |         INSTALL_LIGER_KERNEL: false
12 |         INSTALL_HQQ: false
13 |         PIP_INDEX: https://pypi.org/simple
14 |     container_name: llamafactory
15 |     volumes:
16 |       - ../../hf_cache:/root/.cache/huggingface
17 |       - ../../ms_cache:/root/.cache/modelscope
18 |       - ../../om_cache:/root/.cache/openmind
19 |       - ../../data:/app/data
20 |       - ../../output:/app/output
21 |       - ../../saves:/app/saves
22 |     ports:
23 |       - "7860:7860"
24 |       - "8000:8000"
25 |     ipc: host
26 |     tty: true
27 |     shm_size: '16gb'
28 |     stdin_open: true
29 |     command: bash
30 |     devices:
31 |       - /dev/kfd:/dev/kfd
32 |       - /dev/dri:/dev/dri
33 |     restart: unless-stopped
34 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/evaluation/ceval/ceval.zip:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/evaluation/ceval/ceval.zip


--------------------------------------------------------------------------------
/train/LLaMA-Factory/evaluation/cmmlu/cmmlu.zip:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/evaluation/cmmlu/cmmlu.zip


--------------------------------------------------------------------------------
/train/LLaMA-Factory/evaluation/mmlu/mmlu.zip:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/evaluation/mmlu/mmlu.zip


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/accelerate/fsdp_config.yaml:
--------------------------------------------------------------------------------
 1 | compute_environment: LOCAL_MACHINE
 2 | debug: false
 3 | distributed_type: FSDP
 4 | downcast_bf16: 'no'
 5 | fsdp_config:
 6 |   fsdp_auto_wrap_policy: TRANSFORMER_BASED_WRAP
 7 |   fsdp_backward_prefetch: BACKWARD_PRE
 8 |   fsdp_forward_prefetch: false
 9 |   fsdp_cpu_ram_efficient_loading: true
10 |   fsdp_offload_params: true # offload may affect training speed
11 |   fsdp_sharding_strategy: FULL_SHARD
12 |   fsdp_state_dict_type: FULL_STATE_DICT
13 |   fsdp_sync_module_states: true
14 |   fsdp_use_orig_params: true
15 | machine_rank: 0
16 | main_training_function: main
17 | mixed_precision: fp16 # or bf16
18 | num_machines: 1 # the number of nodes
19 | num_processes: 2 # the number of GPUs in all nodes
20 | rdzv_backend: static
21 | same_network: true
22 | tpu_env: []
23 | tpu_use_cluster: false
24 | tpu_use_sudo: false
25 | use_cpu: false
26 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/deepspeed/ds_z0_config.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "train_batch_size": "auto",
 3 |   "train_micro_batch_size_per_gpu": "auto",
 4 |   "gradient_accumulation_steps": "auto",
 5 |   "gradient_clipping": "auto",
 6 |   "zero_allow_untested_optimizer": true,
 7 |   "fp16": {
 8 |     "enabled": "auto",
 9 |     "loss_scale": 0,
10 |     "loss_scale_window": 1000,
11 |     "initial_scale_power": 16,
12 |     "hysteresis": 2,
13 |     "min_loss_scale": 1
14 |   },
15 |   "bf16": {
16 |     "enabled": "auto"
17 |   },
18 |   "zero_optimization": {
19 |     "stage": 0,
20 |     "allgather_partitions": true,
21 |     "allgather_bucket_size": 5e8,
22 |     "overlap_comm": true,
23 |     "reduce_scatter": true,
24 |     "reduce_bucket_size": 5e8,
25 |     "contiguous_gradients": true,
26 |     "round_robin_gradients": true
27 |   }
28 | }
29 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/deepspeed/ds_z2_config.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "train_batch_size": "auto",
 3 |   "train_micro_batch_size_per_gpu": "auto",
 4 |   "gradient_accumulation_steps": "auto",
 5 |   "gradient_clipping": "auto",
 6 |   "zero_allow_untested_optimizer": true,
 7 |   "fp16": {
 8 |     "enabled": "auto",
 9 |     "loss_scale": 0,
10 |     "loss_scale_window": 1000,
11 |     "initial_scale_power": 16,
12 |     "hysteresis": 2,
13 |     "min_loss_scale": 1
14 |   },
15 |   "bf16": {
16 |     "enabled": "auto"
17 |   },
18 |   "zero_optimization": {
19 |     "stage": 2,
20 |     "allgather_partitions": true,
21 |     "allgather_bucket_size": 5e8,
22 |     "overlap_comm": true,
23 |     "reduce_scatter": true,
24 |     "reduce_bucket_size": 5e8,
25 |     "contiguous_gradients": true,
26 |     "round_robin_gradients": true
27 |   }
28 | }
29 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/deepspeed/ds_z2_offload_config.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "train_batch_size": "auto",
 3 |   "train_micro_batch_size_per_gpu": "auto",
 4 |   "gradient_accumulation_steps": "auto",
 5 |   "gradient_clipping": "auto",
 6 |   "zero_allow_untested_optimizer": true,
 7 |   "fp16": {
 8 |     "enabled": "auto",
 9 |     "loss_scale": 0,
10 |     "loss_scale_window": 1000,
11 |     "initial_scale_power": 16,
12 |     "hysteresis": 2,
13 |     "min_loss_scale": 1
14 |   },
15 |   "bf16": {
16 |     "enabled": "auto"
17 |   },
18 |   "zero_optimization": {
19 |     "stage": 2,
20 |     "offload_optimizer": {
21 |       "device": "cpu",
22 |       "pin_memory": true
23 |     },
24 |     "allgather_partitions": true,
25 |     "allgather_bucket_size": 5e8,
26 |     "overlap_comm": true,
27 |     "reduce_scatter": true,
28 |     "reduce_bucket_size": 5e8,
29 |     "contiguous_gradients": true,
30 |     "round_robin_gradients": true
31 |   }
32 | }
33 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/deepspeed/ds_z3_config.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "train_batch_size": "auto",
 3 |   "train_micro_batch_size_per_gpu": "auto",
 4 |   "gradient_accumulation_steps": "auto",
 5 |   "gradient_clipping": "auto",
 6 |   "zero_allow_untested_optimizer": true,
 7 |   "fp16": {
 8 |     "enabled": "auto",
 9 |     "loss_scale": 0,
10 |     "loss_scale_window": 1000,
11 |     "initial_scale_power": 16,
12 |     "hysteresis": 2,
13 |     "min_loss_scale": 1
14 |   },
15 |   "bf16": {
16 |     "enabled": "auto"
17 |   },
18 |   "zero_optimization": {
19 |     "stage": 3,
20 |     "overlap_comm": true,
21 |     "contiguous_gradients": true,
22 |     "sub_group_size": 1e9,
23 |     "reduce_bucket_size": "auto",
24 |     "stage3_prefetch_bucket_size": "auto",
25 |     "stage3_param_persistence_threshold": "auto",
26 |     "stage3_max_live_parameters": 1e9,
27 |     "stage3_max_reuse_distance": 1e9,
28 |     "stage3_gather_16bit_weights_on_model_save": true
29 |   }
30 | }
31 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/deepspeed/ds_z3_offload_config.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "train_batch_size": "auto",
 3 |   "train_micro_batch_size_per_gpu": "auto",
 4 |   "gradient_accumulation_steps": "auto",
 5 |   "gradient_clipping": "auto",
 6 |   "zero_allow_untested_optimizer": true,
 7 |   "fp16": {
 8 |     "enabled": "auto",
 9 |     "loss_scale": 0,
10 |     "loss_scale_window": 1000,
11 |     "initial_scale_power": 16,
12 |     "hysteresis": 2,
13 |     "min_loss_scale": 1
14 |   },
15 |   "bf16": {
16 |     "enabled": "auto"
17 |   },
18 |   "zero_optimization": {
19 |     "stage": 3,
20 |     "offload_optimizer": {
21 |       "device": "cpu",
22 |       "pin_memory": true
23 |     },
24 |     "offload_param": {
25 |       "device": "cpu",
26 |       "pin_memory": true
27 |     },
28 |     "overlap_comm": true,
29 |     "contiguous_gradients": true,
30 |     "sub_group_size": 1e9,
31 |     "reduce_bucket_size": "auto",
32 |     "stage3_prefetch_bucket_size": "auto",
33 |     "stage3_param_persistence_threshold": "auto",
34 |     "stage3_max_live_parameters": 1e9,
35 |     "stage3_max_reuse_distance": 1e9,
36 |     "stage3_gather_16bit_weights_on_model_save": true
37 |   }
38 | }
39 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/adam_mini/qwen2_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2-1.5B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | use_adam_mini: true
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: qwen
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/qwen2-1_5b/full/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | learning_rate: 1.0e-5
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/badam/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | use_badam: true
10 | badam_mode: layer
11 | badam_switch_mode: ascending
12 | badam_switch_interval: 50
13 | badam_verbose: 2
14 | # deepspeed: examples/deepspeed/ds_z3_config.json
15 | 
16 | ### dataset
17 | dataset: identity,alpaca_en_demo
18 | template: llama3
19 | cutoff_len: 2048
20 | max_samples: 1000
21 | overwrite_cache: true
22 | preprocessing_num_workers: 16
23 | 
24 | ### output
25 | output_dir: saves/llama3-8b/full/sft
26 | logging_steps: 10
27 | save_steps: 500
28 | plot_loss: true
29 | overwrite_output_dir: true
30 | 
31 | ### train
32 | per_device_train_batch_size: 1
33 | gradient_accumulation_steps: 8
34 | learning_rate: 1.0e-5
35 | num_train_epochs: 3.0
36 | lr_scheduler_type: cosine
37 | warmup_ratio: 0.1
38 | 
39 | ### eval
40 | val_size: 0.1
41 | per_device_eval_batch_size: 1
42 | eval_strategy: steps
43 | eval_steps: 500
44 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/fsdp_qlora/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | quantization_bit: 4
 4 | trust_remote_code: true
 5 | 
 6 | ### method
 7 | stage: sft
 8 | do_train: true
 9 | finetuning_type: lora
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b/lora/sft
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | 
27 | ### train
28 | per_device_train_batch_size: 1
29 | gradient_accumulation_steps: 8
30 | learning_rate: 1.0e-4
31 | num_train_epochs: 3.0
32 | lr_scheduler_type: cosine
33 | warmup_ratio: 0.1
34 | bf16: true
35 | ddp_timeout: 180000000
36 | 
37 | ### eval
38 | val_size: 0.1
39 | per_device_eval_batch_size: 1
40 | eval_strategy: steps
41 | eval_steps: 500
42 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/fsdp_qlora/train.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | # DO NOT use GPTQ/AWQ-quantized models with FSDP+QLoRA
3 | 
4 | CUDA_VISIBLE_DEVICES=0,1 accelerate launch \
5 |     --config_file examples/accelerate/fsdp_config.yaml \
6 |     src/train.py examples/extras/fsdp_qlora/llama3_lora_sft.yaml
7 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/galore/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | use_galore: true
10 | galore_layerwise: true
11 | galore_target: mlp,self_attn
12 | galore_rank: 128
13 | galore_scale: 2.0
14 | 
15 | ### dataset
16 | dataset: identity,alpaca_en_demo
17 | template: llama3
18 | cutoff_len: 2048
19 | max_samples: 1000
20 | overwrite_cache: true
21 | preprocessing_num_workers: 16
22 | 
23 | ### output
24 | output_dir: saves/llama3-8b/full/sft
25 | logging_steps: 10
26 | save_steps: 500
27 | plot_loss: true
28 | overwrite_output_dir: true
29 | 
30 | ### train
31 | per_device_train_batch_size: 1
32 | gradient_accumulation_steps: 1
33 | learning_rate: 1.0e-5
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | pure_bf16: true
38 | ddp_timeout: 180000000
39 | 
40 | ### eval
41 | val_size: 0.1
42 | per_device_eval_batch_size: 1
43 | eval_strategy: steps
44 | eval_steps: 500
45 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/llama_pro/expand.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | 
3 | python scripts/llama_pro.py \
4 |     --model_name_or_path meta-llama/Meta-Llama-3-8B-Instruct \
5 |     --output_dir models/llama3-8b-pro \
6 |     --num_expand 8
7 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/llama_pro/llama3_freeze_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: models/llama3-8b-pro
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: freeze
 9 | freeze_trainable_layers: 8
10 | freeze_trainable_modules: all
11 | use_llama_pro: true
12 | 
13 | ### dataset
14 | dataset: identity,alpaca_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b-pro/freeze/sft
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | 
28 | ### train
29 | per_device_train_batch_size: 1
30 | gradient_accumulation_steps: 8
31 | learning_rate: 1.0e-4
32 | num_train_epochs: 3.0
33 | lr_scheduler_type: cosine
34 | warmup_ratio: 0.1
35 | bf16: true
36 | ddp_timeout: 180000000
37 | 
38 | ### eval
39 | val_size: 0.1
40 | per_device_eval_batch_size: 1
41 | eval_strategy: steps
42 | eval_steps: 500
43 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/loraplus/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | loraplus_lr_ratio: 16.0
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b/lora/sft
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | 
27 | ### train
28 | per_device_train_batch_size: 1
29 | gradient_accumulation_steps: 8
30 | learning_rate: 1.0e-4
31 | num_train_epochs: 3.0
32 | lr_scheduler_type: cosine
33 | warmup_ratio: 0.1
34 | bf16: true
35 | ddp_timeout: 180000000
36 | 
37 | ### eval
38 | val_size: 0.1
39 | per_device_eval_batch_size: 1
40 | eval_strategy: steps
41 | eval_steps: 500
42 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/mod/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | mixture_of_depths: convert
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/llama3-8b-mod/full/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | optim: paged_adamw_8bit
30 | learning_rate: 1.0e-5
31 | num_train_epochs: 3.0
32 | lr_scheduler_type: cosine
33 | warmup_ratio: 0.1
34 | pure_bf16: true
35 | ddp_timeout: 180000000
36 | 
37 | ### eval
38 | val_size: 0.1
39 | per_device_eval_batch_size: 1
40 | eval_strategy: steps
41 | eval_steps: 500
42 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/nlg_eval/llama3_lora_predict.yaml:
--------------------------------------------------------------------------------
 1 | # Batch generation can be SLOW with this config.
 2 | # For faster inference, we recommend using `scripts/vllm_infer.py`.
 3 | 
 4 | ### model
 5 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 6 | adapter_name_or_path: saves/llama3-8b/lora/sft
 7 | trust_remote_code: true
 8 | 
 9 | ### method
10 | stage: sft
11 | do_predict: true
12 | finetuning_type: lora
13 | 
14 | ### dataset
15 | eval_dataset: identity,alpaca_en_demo
16 | template: llama3
17 | cutoff_len: 2048
18 | max_samples: 50
19 | overwrite_cache: true
20 | preprocessing_num_workers: 16
21 | 
22 | ### output
23 | output_dir: saves/llama3-8b/lora/predict
24 | overwrite_output_dir: true
25 | 
26 | ### eval
27 | per_device_eval_batch_size: 1
28 | predict_with_generate: true
29 | ddp_timeout: 180000000
30 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/pissa/init.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | 
3 | python scripts/pissa_init.py \
4 |     --model_name_or_path meta-llama/Meta-Llama-3-8B-Instruct \
5 |     --output_dir models/llama3-8b-pissa
6 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/extras/pissa/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | pissa_init: true
11 | pissa_iter: 16
12 | pissa_convert: true
13 | 
14 | ### dataset
15 | dataset: identity,alpaca_en_demo
16 | template: llama3
17 | cutoff_len: 2048
18 | max_samples: 1000
19 | overwrite_cache: true
20 | preprocessing_num_workers: 16
21 | 
22 | ### output
23 | output_dir: saves/llama3-8b/lora/sft
24 | logging_steps: 10
25 | save_steps: 500
26 | plot_loss: true
27 | overwrite_output_dir: true
28 | 
29 | ### train
30 | per_device_train_batch_size: 1
31 | gradient_accumulation_steps: 8
32 | learning_rate: 1.0e-4
33 | num_train_epochs: 3.0
34 | lr_scheduler_type: cosine
35 | warmup_ratio: 0.1
36 | bf16: true
37 | ddp_timeout: 180000000
38 | 
39 | ### eval
40 | val_size: 0.1
41 | per_device_eval_batch_size: 1
42 | eval_strategy: steps
43 | eval_steps: 500
44 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/inference/llama3.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
2 | template: llama3
3 | infer_backend: huggingface  # choices: [huggingface, vllm]
4 | trust_remote_code: true
5 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/inference/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: saves/llama3-8b/full/sft
2 | template: llama3
3 | infer_backend: huggingface  # choices: [huggingface, vllm]
4 | trust_remote_code: true
5 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/inference/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
2 | adapter_name_or_path: saves/llama3-8b/lora/sft
3 | template: llama3
4 | infer_backend: huggingface  # choices: [huggingface, vllm]
5 | trust_remote_code: true
6 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/inference/llama3_vllm.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
2 | template: llama3
3 | infer_backend: vllm
4 | vllm_enforce_eager: true
5 | trust_remote_code: true
6 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/inference/llava1_5.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: llava-hf/llava-1.5-7b-hf
2 | template: llava
3 | infer_backend: huggingface  # choices: [huggingface, vllm]
4 | trust_remote_code: true
5 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/inference/qwen2_vl.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
2 | template: qwen2_vl
3 | infer_backend: huggingface  # choices: [huggingface, vllm]
4 | trust_remote_code: true
5 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/merge_lora/llama3_gptq.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | template: llama3
 4 | trust_remote_code: true
 5 | 
 6 | ### export
 7 | export_dir: models/llama3_gptq
 8 | export_quantization_bit: 4
 9 | export_quantization_dataset: data/c4_demo.json
10 | export_size: 2
11 | export_device: cpu
12 | export_legacy_format: false
13 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/merge_lora/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### Note: DO NOT use a quantized model or set quantization_bit when merging LoRA adapters
 2 | 
 3 | ### model
 4 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 5 | adapter_name_or_path: saves/llama3-8b/lora/sft
 6 | template: llama3
 7 | finetuning_type: lora
 8 | trust_remote_code: true
 9 | 
10 | ### export
11 | export_dir: models/llama3_lora_sft
12 | export_size: 2
13 | export_device: cpu
14 | export_legacy_format: false
15 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/merge_lora/qwen2vl_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### Note: DO NOT use a quantized model or set quantization_bit when merging LoRA adapters
 2 | 
 3 | ### model
 4 | model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
 5 | adapter_name_or_path: saves/qwen2_vl-7b/lora/sft
 6 | template: qwen2_vl
 7 | finetuning_type: lora
 8 | trust_remote_code: true
 9 | 
10 | ### export
11 | export_dir: models/qwen2_vl_lora_sft
12 | export_size: 2
13 | export_device: cpu
14 | export_legacy_format: false
15 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_full/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/llama3-8b/full/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 2
29 | learning_rate: 1.0e-5
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_full/qwen2vl_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | freeze_vision_tower: true  # choices: [true, false]
10 | train_mm_proj_only: false  # choices: [true, false]
11 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
12 | 
13 | ### dataset
14 | dataset: mllm_demo,identity,alpaca_en_demo
15 | template: qwen2_vl
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | 
21 | ### output
22 | output_dir: saves/qwen2_vl-7b/full/sft
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | 
28 | ### train
29 | per_device_train_batch_size: 1
30 | gradient_accumulation_steps: 2
31 | learning_rate: 1.0e-5
32 | num_train_epochs: 30.0
33 | lr_scheduler_type: cosine
34 | warmup_ratio: 0.1
35 | bf16: true
36 | ddp_timeout: 180000000
37 | 
38 | ### eval
39 | val_size: 0.1
40 | per_device_eval_batch_size: 1
41 | eval_strategy: steps
42 | eval_steps: 500
43 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_lora_dpo.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: dpo
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | pref_beta: 0.1
11 | pref_loss: sigmoid  # choices: [sigmoid (dpo), orpo, simpo]
12 | 
13 | ### dataset
14 | dataset: dpo_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b/lora/dpo
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | 
28 | ### train
29 | per_device_train_batch_size: 1
30 | gradient_accumulation_steps: 8
31 | learning_rate: 5.0e-6
32 | num_train_epochs: 3.0
33 | lr_scheduler_type: cosine
34 | warmup_ratio: 0.1
35 | bf16: true
36 | ddp_timeout: 180000000
37 | 
38 | ### eval
39 | val_size: 0.1
40 | per_device_eval_batch_size: 1
41 | eval_strategy: steps
42 | eval_steps: 500
43 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_lora_eval.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | adapter_name_or_path: saves/llama3-8b/lora/sft
 4 | trust_remote_code: true
 5 | 
 6 | ### method
 7 | finetuning_type: lora
 8 | 
 9 | ### dataset
10 | task: mmlu_test  # choices: [mmlu_test, ceval_validation, cmmlu_test]
11 | template: fewshot
12 | lang: en
13 | n_shot: 5
14 | 
15 | ### output
16 | save_dir: saves/llama3-8b/lora/eval
17 | 
18 | ### eval
19 | batch_size: 4
20 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_lora_kto.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: kto
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | pref_beta: 0.1
11 | 
12 | ### dataset
13 | dataset: kto_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b/lora/kto
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | 
27 | ### train
28 | per_device_train_batch_size: 1
29 | gradient_accumulation_steps: 8
30 | learning_rate: 5.0e-6
31 | num_train_epochs: 3.0
32 | lr_scheduler_type: cosine
33 | warmup_ratio: 0.1
34 | bf16: true
35 | ddp_timeout: 180000000
36 | 
37 | ### eval
38 | val_size: 0.1
39 | per_device_eval_batch_size: 1
40 | eval_strategy: steps
41 | eval_steps: 500
42 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_lora_ppo.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | reward_model: saves/llama3-8b/lora/reward
 4 | trust_remote_code: true
 5 | 
 6 | ### method
 7 | stage: ppo
 8 | do_train: true
 9 | finetuning_type: lora
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b/lora/ppo
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | 
27 | ### train
28 | per_device_train_batch_size: 1
29 | gradient_accumulation_steps: 8
30 | learning_rate: 1.0e-5
31 | num_train_epochs: 3.0
32 | lr_scheduler_type: cosine
33 | warmup_ratio: 0.1
34 | bf16: true
35 | ddp_timeout: 180000000
36 | 
37 | ### generate
38 | max_new_tokens: 512
39 | top_k: 0
40 | top_p: 0.9
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_lora_pretrain.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: pt
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: c4_demo
13 | cutoff_len: 2048
14 | max_samples: 1000
15 | overwrite_cache: true
16 | preprocessing_num_workers: 16
17 | 
18 | ### output
19 | output_dir: saves/llama3-8b/lora/pretrain
20 | logging_steps: 10
21 | save_steps: 500
22 | plot_loss: true
23 | overwrite_output_dir: true
24 | 
25 | ### train
26 | per_device_train_batch_size: 1
27 | gradient_accumulation_steps: 8
28 | learning_rate: 1.0e-4
29 | num_train_epochs: 3.0
30 | lr_scheduler_type: cosine
31 | warmup_ratio: 0.1
32 | bf16: true
33 | ddp_timeout: 180000000
34 | 
35 | ### eval
36 | val_size: 0.1
37 | per_device_eval_batch_size: 1
38 | eval_strategy: steps
39 | eval_steps: 500
40 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_lora_reward.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: rm
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: dpo_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/llama3-8b/lora/reward
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | learning_rate: 1.0e-4
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/llama3-8b/lora/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | learning_rate: 1.0e-4
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_lora_sft_ds3.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b/lora/sft
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | 
27 | ### train
28 | per_device_train_batch_size: 1
29 | gradient_accumulation_steps: 2
30 | learning_rate: 1.0e-4
31 | num_train_epochs: 3.0
32 | lr_scheduler_type: cosine
33 | warmup_ratio: 0.1
34 | bf16: true
35 | ddp_timeout: 180000000
36 | 
37 | ### eval
38 | val_size: 0.1
39 | per_device_eval_batch_size: 1
40 | eval_strategy: steps
41 | eval_steps: 500
42 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llama3_preprocess.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | tokenized_path: saves/llama3-8b/dataset/sft
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b/lora/sft
22 | overwrite_output_dir: true
23 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/llava1_5_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: llava-hf/llava-1.5-7b-hf
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: mllm_demo
13 | template: llava
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/llava1_5-7b/lora/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | learning_rate: 1.0e-4
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/qwen2vl_lora_dpo.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: dpo
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | pref_beta: 0.1
11 | pref_loss: sigmoid  # choices: [sigmoid (dpo), orpo, simpo]
12 | 
13 | ### dataset
14 | dataset: rlhf_v
15 | template: qwen2_vl
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | 
21 | ### output
22 | output_dir: saves/qwen2_vl-7b/lora/dpo
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | 
28 | ### train
29 | per_device_train_batch_size: 1
30 | gradient_accumulation_steps: 8
31 | learning_rate: 5.0e-6
32 | num_train_epochs: 3.0
33 | lr_scheduler_type: cosine
34 | warmup_ratio: 0.1
35 | bf16: true
36 | ddp_timeout: 180000000
37 | 
38 | ### eval
39 | val_size: 0.1
40 | per_device_eval_batch_size: 1
41 | eval_strategy: steps
42 | eval_steps: 500
43 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_lora/qwen2vl_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: mllm_demo,identity,alpaca_en_demo  # video: mllm_video_demo
13 | template: qwen2_vl
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/qwen2_vl-7b/lora/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | learning_rate: 1.0e-4
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_aqlm.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: ISTA-DASLab/Meta-Llama-3-8B-Instruct-AQLM-2Bit-1x16
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/llama3-8b/lora/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | learning_rate: 1.0e-4
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_awq.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: TechxGenus/Meta-Llama-3-8B-Instruct-AWQ
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/llama3-8b/lora/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | learning_rate: 1.0e-4
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_gptq.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: TechxGenus/Meta-Llama-3-8B-Instruct-GPTQ
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_target: all
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | 
19 | ### output
20 | output_dir: saves/llama3-8b/lora/sft
21 | logging_steps: 10
22 | save_steps: 500
23 | plot_loss: true
24 | overwrite_output_dir: true
25 | 
26 | ### train
27 | per_device_train_batch_size: 1
28 | gradient_accumulation_steps: 8
29 | learning_rate: 1.0e-4
30 | num_train_epochs: 3.0
31 | lr_scheduler_type: cosine
32 | warmup_ratio: 0.1
33 | bf16: true
34 | ddp_timeout: 180000000
35 | 
36 | ### eval
37 | val_size: 0.1
38 | per_device_eval_batch_size: 1
39 | eval_strategy: steps
40 | eval_steps: 500
41 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_otfq.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | quantization_bit: 4
 4 | quantization_method: bitsandbytes  # choices: [bitsandbytes (4/8), hqq (2/3/4/5/6/8), eetq (8)]
 5 | trust_remote_code: true
 6 | 
 7 | ### method
 8 | stage: sft
 9 | do_train: true
10 | finetuning_type: lora
11 | lora_target: all
12 | 
13 | ### dataset
14 | dataset: identity,alpaca_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b/lora/sft
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | 
28 | ### train
29 | per_device_train_batch_size: 1
30 | gradient_accumulation_steps: 8
31 | learning_rate: 1.0e-4
32 | num_train_epochs: 3.0
33 | lr_scheduler_type: cosine
34 | warmup_ratio: 0.1
35 | bf16: true
36 | ddp_timeout: 180000000
37 | 
38 | ### eval
39 | val_size: 0.1
40 | per_device_eval_batch_size: 1
41 | eval_strategy: steps
42 | eval_steps: 500
43 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/pyproject.toml:
--------------------------------------------------------------------------------
 1 | [build-system]
 2 | requires = ["setuptools>=61.0"]
 3 | build-backend = "setuptools.build_meta"
 4 | 
 5 | [tool.ruff]
 6 | target-version = "py38"
 7 | line-length = 119
 8 | indent-width = 4
 9 | 
10 | [tool.ruff.lint]
11 | ignore = ["C408", "C901", "E501", "E731", "E741", "W605"]
12 | select = ["C", "E", "F", "I", "W"]
13 | 
14 | [tool.ruff.lint.isort]
15 | lines-after-imports = 2
16 | known-first-party = ["llamafactory"]
17 | known-third-party = [
18 |     "accelerate",
19 |     "datasets",
20 |     "gradio",
21 |     "numpy",
22 |     "peft",
23 |     "torch",
24 |     "transformers",
25 |     "trl"
26 | ]
27 | 
28 | [tool.ruff.format]
29 | quote-style = "double"
30 | indent-style = "space"
31 | docstring-code-format = true
32 | skip-magic-trailing-comma = false
33 | line-ending = "auto"
34 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/requirements.txt:
--------------------------------------------------------------------------------
 1 | transformers>=4.41.2,<=4.46.1
 2 | datasets>=2.16.0,<=3.1.0
 3 | accelerate>=0.34.0,<=1.0.1
 4 | peft>=0.11.1,<=0.12.0
 5 | trl>=0.8.6,<=0.9.6
 6 | tokenizers>=0.19.0,<0.20.4
 7 | gradio>=4.0.0,<5.0.0
 8 | pandas>=2.0.0
 9 | scipy
10 | einops
11 | sentencepiece
12 | tiktoken
13 | protobuf
14 | uvicorn
15 | pydantic
16 | fastapi
17 | sse-starlette
18 | matplotlib>=3.7.0
19 | fire
20 | packaging
21 | pyyaml
22 | numpy<2.0.0
23 | av
24 | tyro<0.9.0
25 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/scripts/api_example/test_image.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | from openai import OpenAI
18 | from transformers.utils.versions import require_version
19 | 
20 | 
21 | require_version("openai>=1.5.0", "To fix: pip install openai>=1.5.0")
22 | 
23 | 
24 | def main():
25 |     client = OpenAI(
26 |         api_key="{}".format(os.environ.get("API_KEY", "0")),
27 |         base_url="http://localhost:{}/v1".format(os.environ.get("API_PORT", 8000)),
28 |     )
29 |     messages = []
30 |     messages.append(
31 |         {
32 |             "role": "user",
33 |             "content": [
34 |                 {"type": "text", "text": "Output the color and number of each box."},
35 |                 {
36 |                     "type": "image_url",
37 |                     "image_url": {"url": "https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen2-VL/boxes.png"},
38 |                 },
39 |             ],
40 |         }
41 |     )
42 |     result = client.chat.completions.create(messages=messages, model="test")
43 |     messages.append(result.choices[0].message)
44 |     print("Round 1:", result.choices[0].message.content)
45 |     # The image shows a pyramid of colored blocks with numbers on them. Here are the colors and numbers of ...
46 |     messages.append(
47 |         {
48 |             "role": "user",
49 |             "content": [
50 |                 {"type": "text", "text": "What kind of flower is this?"},
51 |                 {
52 |                     "type": "image_url",
53 |                     "image_url": {"url": "https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen2-VL/flowers.jpg"},
54 |                 },
55 |             ],
56 |         }
57 |     )
58 |     result = client.chat.completions.create(messages=messages, model="test")
59 |     messages.append(result.choices[0].message)
60 |     print("Round 2:", result.choices[0].message.content)
61 |     # The image shows a cluster of forget-me-not flowers. Forget-me-nots are small ...
62 | 
63 | 
64 | if __name__ == "__main__":
65 |     main()
66 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/scripts/stat_utils/cal_flops.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Microsoft Corporation and the LlamaFactory team.
 2 | #
 3 | # This code is inspired by the Microsoft's DeepSpeed library.
 4 | # https://www.deepspeed.ai/tutorials/flops-profiler/
 5 | #
 6 | # Licensed under the Apache License, Version 2.0 (the "License");
 7 | # you may not use this file except in compliance with the License.
 8 | # You may obtain a copy of the License at
 9 | #
10 | #     http://www.apache.org/licenses/LICENSE-2.0
11 | #
12 | # Unless required by applicable law or agreed to in writing, software
13 | # distributed under the License is distributed on an "AS IS" BASIS,
14 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 | # See the License for the specific language governing permissions and
16 | # limitations under the License.
17 | 
18 | import fire
19 | import torch
20 | from deepspeed.accelerator import get_accelerator  # type: ignore
21 | from deepspeed.profiling.flops_profiler import get_model_profile  # type: ignore
22 | 
23 | from llamafactory.chat import ChatModel
24 | 
25 | 
26 | def calculate_flops(
27 |     model_name_or_path: str,
28 |     batch_size: int = 1,
29 |     seq_length: int = 512,
30 |     flash_attn: str = "auto",
31 | ):
32 |     r"""
33 |     Calculates the flops of pre-trained models.
34 |     Usage: python cal_flops.py --model_name_or_path path_to_model --batch_size 1 --seq_length 512
35 |     """
36 |     with get_accelerator().device(0):
37 |         chat_model = ChatModel(dict(model_name_or_path=model_name_or_path, template="empty", flash_attn=flash_attn))
38 |         fake_input = torch.ones((batch_size, seq_length), dtype=torch.long, device=chat_model.engine.model.device)
39 |         input_dict = {"input_ids": fake_input, "labels": fake_input.clone()}
40 |         flops, macs, params = get_model_profile(
41 |             chat_model.engine.model, kwargs=input_dict, print_profile=True, detailed=True
42 |         )
43 |         print("FLOPs:", flops)
44 |         print("MACs:", macs)
45 |         print("Params:", params)
46 | 
47 | 
48 | if __name__ == "__main__":
49 |     fire.Fire(calculate_flops)
50 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/api.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import uvicorn
18 | 
19 | from llamafactory.api.app import create_app
20 | from llamafactory.chat import ChatModel
21 | 
22 | 
23 | def main():
24 |     chat_model = ChatModel()
25 |     app = create_app(chat_model)
26 |     api_host = os.getenv("API_HOST", "0.0.0.0")
27 |     api_port = int(os.getenv("API_PORT", "8000"))
28 |     print(f"Visit http://localhost:{api_port}/docs for API document.")
29 |     uvicorn.run(app, host=api_host, port=api_port)
30 | 
31 | 
32 | if __name__ == "__main__":
33 |     main()
34 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory.egg-info/dependency_links.txt:
--------------------------------------------------------------------------------
1 | 
2 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory.egg-info/entry_points.txt:
--------------------------------------------------------------------------------
1 | [console_scripts]
2 | llamafactory-cli = llamafactory.cli:main
3 | lmf = llamafactory.cli:main
4 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory.egg-info/requires.txt:
--------------------------------------------------------------------------------
 1 | transformers<=4.46.1,>=4.41.2
 2 | datasets<=3.1.0,>=2.16.0
 3 | accelerate<=1.0.1,>=0.34.0
 4 | peft<=0.12.0,>=0.11.1
 5 | trl<=0.9.6,>=0.8.6
 6 | tokenizers<0.20.4,>=0.19.0
 7 | gradio<5.0.0,>=4.0.0
 8 | pandas>=2.0.0
 9 | scipy
10 | einops
11 | sentencepiece
12 | tiktoken
13 | protobuf
14 | uvicorn
15 | pydantic
16 | fastapi
17 | sse-starlette
18 | matplotlib>=3.7.0
19 | fire
20 | packaging
21 | pyyaml
22 | numpy<2.0.0
23 | av
24 | tyro<0.9.0
25 | 
26 | [adam-mini]
27 | adam-mini
28 | 
29 | [aqlm]
30 | aqlm[gpu]>=1.1.0
31 | 
32 | [awq]
33 | autoawq
34 | 
35 | [badam]
36 | badam>=1.2.1
37 | 
38 | [bitsandbytes]
39 | bitsandbytes>=0.39.0
40 | 
41 | [deepspeed]
42 | deepspeed<=0.14.4,>=0.10.0
43 | 
44 | [dev]
45 | pre-commit
46 | ruff
47 | pytest
48 | 
49 | [eetq]
50 | eetq
51 | 
52 | [galore]
53 | galore-torch
54 | 
55 | [gptq]
56 | optimum>=1.17.0
57 | auto-gptq>=0.5.0
58 | 
59 | [hqq]
60 | hqq
61 | 
62 | [liger-kernel]
63 | liger-kernel
64 | 
65 | [metrics]
66 | nltk
67 | jieba
68 | rouge-chinese
69 | 
70 | [modelscope]
71 | modelscope
72 | 
73 | [openmind]
74 | openmind
75 | 
76 | [qwen]
77 | transformers_stream_generator
78 | 
79 | [swanlab]
80 | swanlab
81 | 
82 | [torch]
83 | torch>=1.13.1
84 | 
85 | [torch-npu]
86 | torch==2.1.0
87 | torch-npu==2.1.0.post3
88 | decorator
89 | 
90 | [vllm]
91 | vllm<0.6.5,>=0.4.3
92 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory.egg-info/top_level.txt:
--------------------------------------------------------------------------------
1 | llamafactory
2 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | r"""
16 | Efficient fine-tuning of large language models.
17 | 
18 | Level:
19 |   api, webui > chat, eval, train > data, model > hparams > extras
20 | 
21 | Dependency graph:
22 |   main:
23 |     transformers>=4.41.2,<=4.46.1
24 |     datasets>=2.16.0,<=3.1.0
25 |     accelerate>=0.34.0,<=1.0.1
26 |     peft>=0.11.1,<=0.12.0
27 |     trl>=0.8.6,<=0.9.6
28 |   attention:
29 |     transformers>=4.42.4 (gemma+fa2)
30 |   longlora:
31 |     transformers>=4.41.2,<=4.46.1
32 |   packing:
33 |     transformers>=4.43.0,<=4.46.1
34 | 
35 | Disable version checking: DISABLE_VERSION_CHECK=1
36 | Enable VRAM recording: RECORD_VRAM=1
37 | Force check imports: FORCE_CHECK_IMPORTS=1
38 | Force using torchrun: FORCE_TORCHRUN=1
39 | Set logging verbosity: LLAMAFACTORY_VERBOSITY=WARN
40 | Use modelscope: USE_MODELSCOPE_HUB=1
41 | Use openmind: USE_OPENMIND_HUB=1
42 | """
43 | 
44 | from .extras.env import VERSION
45 | 
46 | 
47 | __version__ = VERSION
48 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/__pycache__/cli.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/__pycache__/cli.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/__pycache__/launcher.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/__pycache__/launcher.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/api/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/api/__init__.py


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/api/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/api/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/api/__pycache__/app.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/api/__pycache__/app.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/api/__pycache__/chat.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/api/__pycache__/chat.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/api/__pycache__/common.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/api/__pycache__/common.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/api/__pycache__/protocol.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/api/__pycache__/protocol.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/api/common.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import json
16 | from typing import TYPE_CHECKING, Any, Dict
17 | 
18 | 
19 | if TYPE_CHECKING:
20 |     from pydantic import BaseModel
21 | 
22 | 
23 | def dictify(data: "BaseModel") -> Dict[str, Any]:  # model -> plain dict; dumps with exclude_unset=True
24 |     try:  # pydantic v2 API
25 |         return data.model_dump(exclude_unset=True)
26 |     except AttributeError:  # pydantic v1: taken whenever `model_dump` raises AttributeError (e.g. is missing)
27 |         return data.dict(exclude_unset=True)
28 | 
29 | 
30 | def jsonify(data: "BaseModel") -> str:  # model -> JSON text; exclude_unset=True, non-ASCII left unescaped
31 |     try:  # pydantic v2 API: dump to a dict first, then serialize with the stdlib json module
32 |         return json.dumps(data.model_dump(exclude_unset=True), ensure_ascii=False)
33 |     except AttributeError:  # pydantic v1: taken whenever the v2 path raises AttributeError
34 |         return data.json(exclude_unset=True, ensure_ascii=False)
35 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/chat/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .base_engine import BaseEngine
16 | from .chat_model import ChatModel
17 | 
18 | 
19 | __all__ = ["BaseEngine", "ChatModel"]
20 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/base_engine.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/base_engine.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/chat_model.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/chat_model.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/hf_engine.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/hf_engine.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/vllm_engine.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/chat/__pycache__/vllm_engine.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/eval/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/eval/__init__.py


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/eval/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/eval/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/eval/__pycache__/evaluator.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/eval/__pycache__/evaluator.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/eval/__pycache__/template.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/eval/__pycache__/template.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/extras/__init__.py


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/constants.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/constants.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/env.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/env.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/logging.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/logging.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/misc.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/misc.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/packages.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/packages.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/ploting.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/extras/__pycache__/ploting.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/extras/env.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 HuggingFace Inc. and the LlamaFactory team.
 2 | #
 3 | # This code is inspired by the HuggingFace's transformers library.
 4 | # https://github.com/huggingface/transformers/blob/v4.40.0/src/transformers/commands/env.py
 5 | #
 6 | # Licensed under the Apache License, Version 2.0 (the "License");
 7 | # you may not use this file except in compliance with the License.
 8 | # You may obtain a copy of the License at
 9 | #
10 | #     http://www.apache.org/licenses/LICENSE-2.0
11 | #
12 | # Unless required by applicable law or agreed to in writing, software
13 | # distributed under the License is distributed on an "AS IS" BASIS,
14 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 | # See the License for the specific language governing permissions and
16 | # limitations under the License.
17 | 
18 | import platform
19 | 
20 | import accelerate
21 | import datasets
22 | import peft
23 | import torch
24 | import transformers
25 | import trl
26 | from transformers.utils import is_torch_cuda_available, is_torch_npu_available
27 | 
28 | 
29 | VERSION = "0.9.2.dev0"
30 | 
31 | 
32 | def print_env() -> None:
33 |     info = {
34 |         "`llamafactory` version": VERSION,
35 |         "Platform": platform.platform(),
36 |         "Python version": platform.python_version(),
37 |         "PyTorch version": torch.__version__,
38 |         "Transformers version": transformers.__version__,
39 |         "Datasets version": datasets.__version__,
40 |         "Accelerate version": accelerate.__version__,
41 |         "PEFT version": peft.__version__,
42 |         "TRL version": trl.__version__,
43 |     }
44 | 
45 |     if is_torch_cuda_available():
46 |         info["PyTorch version"] += " (GPU)"
47 |         info["GPU type"] = torch.cuda.get_device_name()
48 | 
49 |     if is_torch_npu_available():
50 |         info["PyTorch version"] += " (NPU)"
51 |         info["NPU type"] = torch.npu.get_device_name()
52 |         info["CANN version"] = torch.version.cann
53 | 
54 |     try:
55 |         import deepspeed  # type: ignore
56 | 
57 |         info["DeepSpeed version"] = deepspeed.__version__
58 |     except Exception:
59 |         pass
60 | 
61 |     try:
62 |         import bitsandbytes
63 | 
64 |         info["Bitsandbytes version"] = bitsandbytes.__version__
65 |     except Exception:
66 |         pass
67 | 
68 |     try:
69 |         import vllm
70 | 
71 |         info["vLLM version"] = vllm.__version__
72 |     except Exception:
73 |         pass
74 | 
75 |     print("\n" + "\n".join([f"- {key}: {value}" for key, value in info.items()]) + "\n")
76 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .data_args import DataArguments
16 | from .evaluation_args import EvaluationArguments
17 | from .finetuning_args import FinetuningArguments
18 | from .generating_args import GeneratingArguments
19 | from .model_args import ModelArguments
20 | from .parser import get_eval_args, get_infer_args, get_train_args
21 | 
22 | 
23 | __all__ = [
24 |     "DataArguments",
25 |     "EvaluationArguments",
26 |     "FinetuningArguments",
27 |     "GeneratingArguments",
28 |     "ModelArguments",
29 |     "get_eval_args",
30 |     "get_infer_args",
31 |     "get_train_args",
32 | ]
33 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/data_args.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/data_args.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/evaluation_args.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/evaluation_args.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/finetuning_args.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/finetuning_args.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/generating_args.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/generating_args.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/model_args.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/model_args.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/parser.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/hparams/__pycache__/parser.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/hparams/evaluation_args.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | from dataclasses import dataclass, field
17 | from typing import Literal, Optional
18 | 
19 | from datasets import DownloadMode
20 | 
21 | 
22 | @dataclass
23 | class EvaluationArguments:
24 |     r"""
25 |     Arguments pertaining to specify the evaluation parameters.
26 |     """
27 | 
28 |     task: str = field(
29 |         metadata={"help": "Name of the evaluation task."},
30 |     )
31 |     task_dir: str = field(
32 |         default="evaluation",
33 |         metadata={"help": "Path to the folder containing the evaluation datasets."},
34 |     )
35 |     batch_size: int = field(
36 |         default=4,
37 |         metadata={"help": "The batch size per GPU for evaluation."},
38 |     )
39 |     seed: int = field(
40 |         default=42,
41 |         metadata={"help": "Random seed to be used with data loaders."},
42 |     )
43 |     lang: Literal["en", "zh"] = field(
44 |         default="en",
45 |         metadata={"help": "Language used at evaluation."},
46 |     )
47 |     n_shot: int = field(
48 |         default=5,
49 |         metadata={"help": "Number of examplars for few-shot learning."},
50 |     )
51 |     save_dir: Optional[str] = field(
52 |         default=None,
53 |         metadata={"help": "Path to save the evaluation results."},
54 |     )
55 |     download_mode: DownloadMode = field(
56 |         default=DownloadMode.REUSE_DATASET_IF_EXISTS,
57 |         metadata={"help": "Download mode used for the evaluation datasets."},
58 |     )
59 | 
60 |     def __post_init__(self):
61 |         if self.save_dir is not None and os.path.exists(self.save_dir):
62 |             raise ValueError("`save_dir` already exists, use another one.")
63 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/launcher.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from llamafactory.train.tuner import run_exp  # use absolute import
16 | 
17 | 
18 | def launch():  # script entry point; invoked by the ``__main__`` guard below
19 |     run_exp()  # called without arguments
20 | 
21 | 
22 | if __name__ == "__main__":
23 |     launch()
24 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .loader import load_config, load_model, load_tokenizer
16 | from .model_utils.misc import find_all_linear_modules
17 | from .model_utils.quantization import QuantizationMethod
18 | from .model_utils.valuehead import load_valuehead_params
19 | 
20 | 
21 | __all__ = [
22 |     "QuantizationMethod",
23 |     "load_config",
24 |     "load_model",
25 |     "load_tokenizer",
26 |     "find_all_linear_modules",
27 |     "load_valuehead_params",
28 | ]
29 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/__pycache__/adapter.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/__pycache__/adapter.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/__pycache__/loader.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/__pycache__/loader.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/__pycache__/patcher.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/__pycache__/patcher.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__init__.py


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/attention.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/attention.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/checkpointing.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/checkpointing.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/embedding.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/embedding.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/liger_kernel.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/liger_kernel.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/longlora.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/longlora.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/misc.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/misc.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/mod.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/mod.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/moe.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/moe.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/packing.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/packing.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/quantization.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/quantization.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/rope.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/rope.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/unsloth.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/unsloth.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/valuehead.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/valuehead.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/visual.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/model/model_utils/__pycache__/visual.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/model/model_utils/mod.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from typing import TYPE_CHECKING
16 | 
17 | from ...extras.constants import MOD_SUPPORTED_MODELS
18 | 
19 | 
20 | if TYPE_CHECKING:
21 |     from transformers import PretrainedConfig, PreTrainedModel
22 | 
23 |     from ...hparams import ModelArguments
24 | 
25 | 
26 | def load_mod_pretrained_model(**init_kwargs) -> "PreTrainedModel":
27 |     from MoD import AutoMoDModelForCausalLM
28 | 
29 |     return AutoMoDModelForCausalLM.from_pretrained(**init_kwargs)
30 | 
31 | 
32 | def convert_pretrained_model_to_mod(
33 |     model: "PreTrainedModel", config: "PretrainedConfig", model_args: "ModelArguments"
34 | ) -> "PreTrainedModel":
35 |     from MoD import apply_mod_to_hf
36 | 
37 |     if getattr(config, "model_type", None) not in MOD_SUPPORTED_MODELS:
38 |         raise ValueError("Current model is not supported by mixture-of-depth.")
39 | 
40 |     model = apply_mod_to_hf(model)
41 |     model = model.to(model_args.compute_dtype)
42 |     return model
43 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/__init__.py


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/__pycache__/callbacks.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/__pycache__/callbacks.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/__pycache__/trainer_utils.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/__pycache__/trainer_utils.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/__pycache__/tuner.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/__pycache__/tuner.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/dpo/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_dpo
16 | 
17 | 
18 | __all__ = ["run_dpo"]
19 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/dpo/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/dpo/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/dpo/__pycache__/trainer.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/dpo/__pycache__/trainer.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/dpo/__pycache__/workflow.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/dpo/__pycache__/workflow.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/kto/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_kto
16 | 
17 | 
18 | __all__ = ["run_kto"]
19 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/kto/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/kto/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/kto/__pycache__/trainer.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/kto/__pycache__/trainer.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/kto/__pycache__/workflow.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/kto/__pycache__/workflow.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/ppo/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_ppo
16 | 
17 | 
18 | __all__ = ["run_ppo"]
19 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/ppo/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/ppo/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/ppo/__pycache__/ppo_utils.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/ppo/__pycache__/ppo_utils.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/ppo/__pycache__/trainer.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/ppo/__pycache__/trainer.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/ppo/__pycache__/workflow.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/ppo/__pycache__/workflow.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/pt/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_pt
16 | 
17 | 
18 | __all__ = ["run_pt"]
19 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/pt/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/pt/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/pt/__pycache__/trainer.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/pt/__pycache__/trainer.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/pt/__pycache__/workflow.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/pt/__pycache__/workflow.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/rm/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_rm
16 | 
17 | 
18 | __all__ = ["run_rm"]
19 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/rm/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/rm/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/rm/__pycache__/metric.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/rm/__pycache__/metric.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/rm/__pycache__/trainer.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/rm/__pycache__/trainer.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/rm/__pycache__/workflow.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/rm/__pycache__/workflow.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/rm/metric.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from dataclasses import dataclass
16 | from typing import TYPE_CHECKING, Dict, Optional
17 | 
18 | import numpy as np
19 | 
20 | from ...extras.misc import numpify
21 | 
22 | 
23 | if TYPE_CHECKING:
24 |     from transformers import EvalPrediction
25 | 
26 | 
27 | @dataclass
28 | class ComputeAccuracy:
29 |     r"""
30 |     Computes reward accuracy and supports `batch_eval_metrics`.
31 |     """
32 | 
33 |     def _dump(self) -> Optional[Dict[str, float]]:
34 |         result = None
35 |         if hasattr(self, "score_dict"):
36 |             result = {k: float(np.mean(v)) for k, v in self.score_dict.items()}
37 | 
38 |         self.score_dict = {"accuracy": []}
39 |         return result
40 | 
41 |     def __post_init__(self):
42 |         self._dump()
43 | 
44 |     def __call__(self, eval_preds: "EvalPrediction", compute_result: bool = True) -> Optional[Dict[str, float]]:
45 |         chosen_scores, rejected_scores = numpify(eval_preds.predictions[0]), numpify(eval_preds.predictions[1])
46 |         if not chosen_scores.shape:
47 |             self.score_dict["accuracy"].append(chosen_scores > rejected_scores)
48 |         else:
49 |             for i in range(len(chosen_scores)):
50 |                 self.score_dict["accuracy"].append(chosen_scores[i] > rejected_scores[i])
51 | 
52 |         if compute_result:
53 |             return self._dump()
54 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/sft/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_sft
16 | 
17 | 
18 | __all__ = ["run_sft"]
19 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/sft/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/sft/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/sft/__pycache__/metric.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/sft/__pycache__/metric.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/sft/__pycache__/trainer.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/sft/__pycache__/trainer.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/train/sft/__pycache__/workflow.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/train/sft/__pycache__/workflow.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__init__.py


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/chatter.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/chatter.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/common.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/common.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/css.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/css.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/engine.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/engine.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/interface.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/interface.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/manager.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/manager.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/runner.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/runner.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/utils.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/__pycache__/utils.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .chatbot import create_chat_box
16 | from .eval import create_eval_tab
17 | from .export import create_export_tab
18 | from .infer import create_infer_tab
19 | from .top import create_top
20 | from .train import create_train_tab
21 | 
22 | 
23 | __all__ = [
24 |     "create_chat_box",
25 |     "create_eval_tab",
26 |     "create_export_tab",
27 |     "create_infer_tab",
28 |     "create_top",
29 |     "create_train_tab",
30 | ]
31 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/__init__.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/__init__.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/chatbot.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/chatbot.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/data.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/data.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/eval.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/eval.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/export.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/export.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/infer.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/infer.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/top.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/top.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/train.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/TIGER-AI-Lab/CritiqueFineTuning/6715b3ca3606b86141515f1918cc95b353609607/train/LLaMA-Factory/src/llamafactory/webui/components/__pycache__/train.cpython-311.pyc


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/llamafactory/webui/css.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | CSS = r"""
16 | .duplicate-button {
17 |   margin: auto !important;
18 |   color: white !important;
19 |   background: black !important;
20 |   border-radius: 100vh !important;
21 | }
22 | 
23 | .modal-box {
24 |   position: fixed !important;
25 |   top: 50%;
26 |   left: 50%;
27 |   transform: translate(-50%, -50%); /* center horizontally */
28 |   max-width: 1000px;
29 |   max-height: 750px;
30 |   overflow-y: auto;
31 |   background-color: var(--input-background-fill);
32 |   flex-wrap: nowrap !important;
33 |   border: 2px solid black !important;
34 |   z-index: 1000;
35 |   padding: 10px;
36 | }
37 | 
38 | .dark .modal-box {
39 |   border: 2px solid white !important;
40 | }
41 | """
42 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/train.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from llamafactory.train.tuner import run_exp
16 | 
17 | 
18 | def main():
19 |     run_exp()  # called without arguments; how run_exp obtains its settings is defined in llamafactory.train.tuner
20 | 
21 | 
22 | def _mp_fn(index):
23 |     # Entry point for xla_spawn (TPUs); `index` is accepted but not used.
24 |     run_exp()
25 | 
26 | 
27 | if __name__ == "__main__":
28 |     main()
29 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/src/webui.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | from llamafactory.webui.interface import create_ui
18 | 
19 | 
20 | def main():
21 |     gradio_ipv6 = os.getenv("GRADIO_IPV6", "0").lower() in ["true", "1"]
22 |     gradio_share = os.getenv("GRADIO_SHARE", "0").lower() in ["true", "1"]
23 |     server_name = os.getenv("GRADIO_SERVER_NAME", "[::]" if gradio_ipv6 else "0.0.0.0")
24 |     create_ui().queue().launch(share=gradio_share, server_name=server_name, inbrowser=True)
25 | 
26 | 
27 | if __name__ == "__main__":
28 |     main()
29 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/tests/e2e/test_chat.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | from llamafactory.chat import ChatModel
18 | 
19 | 
20 | TINY_LLAMA = os.getenv("TINY_LLAMA", "llamafactory/tiny-random-Llama-3")  # overridable via the TINY_LLAMA env var
21 | 
22 | INFER_ARGS = {  # passed to ChatModel by both tests in this file
23 |     "model_name_or_path": TINY_LLAMA,
24 |     "finetuning_type": "lora",
25 |     "template": "llama3",
26 |     "infer_dtype": "float16",
27 |     "do_sample": False,
28 |     "max_new_tokens": 1,  # presumably limits generation to a single new token — confirm against ChatModel
29 | }
30 | 
31 | MESSAGES = [
32 |     {"role": "user", "content": "Hi"},
33 | ]
34 | 
35 | EXPECTED_RESPONSE = "_rho"  # exact text both tests compare the model output against
36 | 
37 | 
38 | def test_chat():
39 |     chat_model = ChatModel(INFER_ARGS)
40 |     assert chat_model.chat(MESSAGES)[0].response_text == EXPECTED_RESPONSE
41 | 
42 | 
43 | def test_stream_chat():
44 |     chat_model = ChatModel(INFER_ARGS)
45 |     response = ""
46 |     for token in chat_model.stream_chat(MESSAGES):
47 |         response += token
48 | 
49 |     assert response == EXPECTED_RESPONSE
50 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/tests/e2e/test_train.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import pytest
18 | 
19 | from llamafactory.train.tuner import export_model, run_exp
20 | 
21 | 
22 | DEMO_DATA = os.getenv("DEMO_DATA", "llamafactory/demo_data")  # each id below can be overridden via its env var
23 | 
24 | TINY_LLAMA = os.getenv("TINY_LLAMA", "llamafactory/tiny-random-Llama-3")
25 | 
26 | TINY_LLAMA_ADAPTER = os.getenv("TINY_LLAMA_ADAPTER", "llamafactory/tiny-random-Llama-3-lora")
27 | 
28 | TRAIN_ARGS = {  # shared by every test_run_exp case; stage, dataset and output_dir are added per case
29 |     "model_name_or_path": TINY_LLAMA,
30 |     "do_train": True,
31 |     "finetuning_type": "lora",
32 |     "dataset_dir": "REMOTE:" + DEMO_DATA,
33 |     "template": "llama3",
34 |     "cutoff_len": 1,
35 |     "overwrite_cache": False,
36 |     "overwrite_output_dir": True,
37 |     "per_device_train_batch_size": 1,
38 |     "max_steps": 1,
39 | }
40 | 
41 | INFER_ARGS = {  # passed to export_model by test_export, together with export_dir
42 |     "model_name_or_path": TINY_LLAMA,
43 |     "adapter_name_or_path": TINY_LLAMA_ADAPTER,
44 |     "finetuning_type": "lora",
45 |     "template": "llama3",
46 |     "infer_dtype": "float16",
47 | }
48 | 
49 | OS_NAME = os.getenv("OS_NAME", "")  # the "rm" case is marked xfail when this starts with "windows"
50 | 
51 | 
52 | @pytest.mark.parametrize(
53 |     "stage,dataset",
54 |     [
55 |         ("pt", "c4_demo"),
56 |         ("sft", "alpaca_en_demo"),
57 |         ("dpo", "dpo_en_demo"),
58 |         ("kto", "kto_en_demo"),
59 |         pytest.param("rm", "dpo_en_demo", marks=pytest.mark.xfail(OS_NAME.startswith("windows"), reason="OS error.")),
60 |     ],
61 | )
62 | def test_run_exp(stage: str, dataset: str):
63 |     output_dir = os.path.join("output", f"train_{stage}")
64 |     run_exp({"stage": stage, "dataset": dataset, "output_dir": output_dir, **TRAIN_ARGS})
65 |     assert os.path.exists(output_dir)
66 | 
67 | 
68 | def test_export():
69 |     export_dir = os.path.join("output", "llama3_export")
70 |     export_model({"export_dir": export_dir, **INFER_ARGS})
71 |     assert os.path.exists(export_dir)
72 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/tests/model/model_utils/test_attention.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | from transformers.utils import is_flash_attn_2_available, is_torch_sdpa_available
18 | 
19 | from llamafactory.train.test_utils import load_infer_model
20 | 
21 | 
22 | TINY_LLAMA = os.getenv("TINY_LLAMA", "llamafactory/tiny-random-Llama-3")  # overridable via the TINY_LLAMA env var
23 | 
24 | INFER_ARGS = {  # forwarded to load_infer_model along with the flash_attn setting under test
25 |     "model_name_or_path": TINY_LLAMA,
26 |     "template": "llama3",
27 | }
28 | 
29 | 
30 | def test_attention():
31 |     attention_available = ["disabled"]
32 |     if is_torch_sdpa_available():
33 |         attention_available.append("sdpa")
34 | 
35 |     if is_flash_attn_2_available():
36 |         attention_available.append("fa2")
37 | 
38 |     llama_attention_classes = {
39 |         "disabled": "LlamaAttention",
40 |         "sdpa": "LlamaSdpaAttention",
41 |         "fa2": "LlamaFlashAttention2",
42 |     }
43 |     for requested_attention in attention_available:
44 |         model = load_infer_model(flash_attn=requested_attention, **INFER_ARGS)
45 |         for module in model.modules():
46 |             if "Attention" in module.__class__.__name__:
47 |                 assert module.__class__.__name__ == llama_attention_classes[requested_attention]
48 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/tests/model/model_utils/test_packing.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import pytest
16 | import torch
17 | 
18 | from llamafactory.model.model_utils.packing import get_seqlens_in_batch, get_unpad_data
19 | 
20 | 
21 | @pytest.mark.parametrize(
22 |     "attention_mask,golden_seq_lens",
23 |     [
24 |         (
25 |             [
26 |                 [1, 1, 2, 2, 2, 0],
27 |                 [1, 2, 2, 3, 3, 3],
28 |             ],
29 |             [2, 3, 1, 2, 3],
30 |         ),
31 |         (
32 |             [[1]],
33 |             [1],
34 |         ),
35 |     ],
36 | )
37 | def test_get_seqlens_in_batch(attention_mask, golden_seq_lens):
38 |     attention_mask_with_indices = torch.tensor(attention_mask)
39 |     seqlens_in_batch = get_seqlens_in_batch(attention_mask_with_indices)
40 |     assert torch.all(seqlens_in_batch == torch.tensor(golden_seq_lens))
41 | 
42 | 
43 | @pytest.mark.parametrize(
44 |     "attention_mask,golden_indices,golden_cu_seqlens,golden_max_seqlen",
45 |     [
46 |         (
47 |             [
48 |                 [1, 1, 2, 2, 2, 0],
49 |                 [1, 2, 2, 3, 3, 3],
50 |             ],
51 |             [0, 1, 2, 3, 4, 6, 7, 8, 9, 10, 11],
52 |             [0, 2, 5, 6, 8, 11],
53 |             3,
54 |         ),
55 |         (
56 |             [[1]],
57 |             [0],
58 |             [0, 1],
59 |             1,
60 |         ),
61 |     ],
62 | )
63 | def test_get_unpad_data(attention_mask, golden_indices, golden_cu_seqlens, golden_max_seqlen):
64 |     attention_mask_with_indices = torch.tensor(attention_mask)
65 |     indices, cu_seqlens, max_seqlen_in_batch = get_unpad_data(attention_mask_with_indices)
66 |     assert torch.all(indices == torch.tensor(golden_indices))
67 |     assert torch.all(cu_seqlens == torch.tensor(golden_cu_seqlens, dtype=torch.int32))
68 |     assert max_seqlen_in_batch == golden_max_seqlen
69 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/tests/model/test_base.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import pytest
18 | 
19 | from llamafactory.train.test_utils import compare_model, load_infer_model, load_reference_model, patch_valuehead_model
20 | 
21 | 
22 | TINY_LLAMA = os.getenv("TINY_LLAMA", "llamafactory/tiny-random-Llama-3")  # overridable via the TINY_LLAMA env var
23 | 
24 | TINY_LLAMA_VALUEHEAD = os.getenv("TINY_LLAMA_VALUEHEAD", "llamafactory/tiny-random-Llama-3-valuehead")
25 | 
26 | INFER_ARGS = {  # keyword arguments for load_infer_model in both tests below
27 |     "model_name_or_path": TINY_LLAMA,
28 |     "template": "llama3",
29 |     "infer_dtype": "float16",
30 | }
31 | 
32 | 
33 | @pytest.fixture
34 | def fix_valuehead_cpu_loading():
35 |     patch_valuehead_model()  # applied before the requesting test runs; this fixture has no teardown step
36 | 
37 | 
38 | def test_base():
39 |     model = load_infer_model(**INFER_ARGS)
40 |     ref_model = load_reference_model(TINY_LLAMA)
41 |     compare_model(model, ref_model)
42 | 
43 | 
44 | @pytest.mark.usefixtures("fix_valuehead_cpu_loading")
45 | def test_valuehead():
46 |     model = load_infer_model(add_valuehead=True, **INFER_ARGS)
47 |     ref_model = load_reference_model(TINY_LLAMA_VALUEHEAD, add_valuehead=True)
48 |     compare_model(model, ref_model)
49 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/tests/model/test_full.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import torch
18 | 
19 | from llamafactory.train.test_utils import load_infer_model, load_train_model
20 | 
21 | 
22 | TINY_LLAMA = os.getenv("TINY_LLAMA", "llamafactory/tiny-random-Llama-3")
23 | 
24 | TRAIN_ARGS = {
25 |     "model_name_or_path": TINY_LLAMA,
26 |     "stage": "sft",
27 |     "do_train": True,
28 |     "finetuning_type": "full",
29 |     "dataset": "llamafactory/tiny-supervised-dataset",
30 |     "dataset_dir": "ONLINE",
31 |     "template": "llama3",
32 |     "cutoff_len": 1024,
33 |     "overwrite_cache": True,
34 |     "output_dir": "dummy_dir",
35 |     "overwrite_output_dir": True,
36 |     "fp16": True,
37 | }
38 | 
39 | INFER_ARGS = {
40 |     "model_name_or_path": TINY_LLAMA,
41 |     "finetuning_type": "full",
42 |     "template": "llama3",
43 |     "infer_dtype": "float16",
44 | }
45 | 
46 | 
47 | def test_full_train():
48 |     model = load_train_model(**TRAIN_ARGS)
49 |     for param in model.parameters():
50 |         assert param.requires_grad is True
51 |         assert param.dtype == torch.float32
52 | 
53 | 
54 | def test_full_inference():
55 |     model = load_infer_model(**INFER_ARGS)
56 |     for param in model.parameters():
57 |         assert param.requires_grad is False
58 |         assert param.dtype == torch.float16
59 | 


--------------------------------------------------------------------------------
/train/LLaMA-Factory/tests/model/test_pissa.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import pytest
18 | 
19 | from llamafactory.train.test_utils import compare_model, load_infer_model, load_reference_model, load_train_model
20 | 
21 | 
22 | TINY_LLAMA = os.getenv("TINY_LLAMA", "llamafactory/tiny-random-Llama-3")
23 | 
24 | TINY_LLAMA_PISSA = os.getenv("TINY_LLAMA_ADAPTER", "llamafactory/tiny-random-Llama-3-pissa")
25 | 
26 | TRAIN_ARGS = {
27 |     "model_name_or_path": TINY_LLAMA,
28 |     "stage": "sft",
29 |     "do_train": True,
30 |     "finetuning_type": "lora",
31 |     "pissa_init": True,
32 |     "pissa_iter": -1,
33 |     "dataset": "llamafactory/tiny-supervised-dataset",
34 |     "dataset_dir": "ONLINE",
35 |     "template": "llama3",
36 |     "cutoff_len": 1024,
37 |     "overwrite_cache": True,
38 |     "output_dir": "dummy_dir",
39 |     "overwrite_output_dir": True,
40 |     "fp16": True,
41 | }
42 | 
43 | INFER_ARGS = {
44 |     "model_name_or_path": TINY_LLAMA_PISSA,
45 |     "adapter_name_or_path": TINY_LLAMA_PISSA,
46 |     "adapter_folder": "pissa_init",
47 |     "finetuning_type": "lora",
48 |     "template": "llama3",
49 |     "infer_dtype": "float16",
50 | }
51 | 
52 | OS_NAME = os.getenv("OS_NAME", "")
53 | 
54 | 
55 | @pytest.mark.xfail(reason="PiSSA initialization is not stable in different platform.")
56 | def test_pissa_train():
57 |     model = load_train_model(**TRAIN_ARGS)
58 |     ref_model = load_reference_model(TINY_LLAMA_PISSA, TINY_LLAMA_PISSA, use_pissa=True, is_trainable=True)
59 |     compare_model(model, ref_model)
60 | 
61 | 
62 | @pytest.mark.xfail(OS_NAME.startswith("windows"), reason="Known connection error on Windows.")
63 | def test_pissa_inference():
64 |     """Compare the model loaded with INFER_ARGS against the PiSSA reference after merge_and_unload()."""
65 |     loaded = load_infer_model(**INFER_ARGS)
66 |     peft_reference = load_reference_model(TINY_LLAMA_PISSA, TINY_LLAMA_PISSA, use_pissa=True, is_trainable=False)
67 |     compare_model(loaded, peft_reference.merge_and_unload())
68 | 


--------------------------------------------------------------------------------
/train/Validation/start_validate.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | # Runs validate_single.sh on every checkpoint-<N> directory (1 <= N < 100) under $models_dir.
 3 | set -ex
 4 | 
 5 | export CUDA_VISIBLE_DEVICES=0,1,2,3
 6 | 
 7 | models_dir="/path/to/models"
 8 | summary_path="../../Validation/validation_summary.txt"
 9 | 
10 | models_dir_name=$(basename "$models_dir")
11 | summary_parent_dir=$(dirname "$summary_path")
12 | 
13 | for checkpoint_dir in "${models_dir}"/checkpoint-*; do
14 |     if [ -d "$checkpoint_dir" ]; then
15 | 
16 |         # Directory names look like checkpoint-<N>; keep only the <N> part.
17 |         checkpoint_num=$(basename "$checkpoint_dir" | cut -d'-' -f2)
18 |         if [ "$checkpoint_num" -ge 1 ] && [ "$checkpoint_num" -lt 100 ]; then
19 | 
20 |             output_dir="${summary_parent_dir}/${models_dir_name}-checkpoint-${checkpoint_num}/"
21 | 
22 |             echo "Processing checkpoint-${checkpoint_num}"
23 |             echo "Model path: ${checkpoint_dir}"
24 |             echo "Output dir: ${output_dir}"
25 | 
26 |             bash validate_single.sh "$checkpoint_dir" "$output_dir" "$summary_path"
27 |         else
28 |             echo "Skipping checkpoint-${checkpoint_num} as it's outside [1, 100)"
29 |         fi
30 |     fi
31 | done


--------------------------------------------------------------------------------
/train/Validation/validate_single.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | # Usage: bash validate_single.sh <model_name_or_path> <output_dir> <summary_path>
 3 | set -ex
 4 | 
 5 | PROMPT_TYPE="qwen25-math-cot"
 6 | MODEL_NAME_OR_PATH=$1
 7 | OUTPUT_DIR=$2
 8 | SUMMARY_PATH=$3
 9 | SPLIT="test"
10 | NUM_TEST_SAMPLE=-1
11 | 
12 | # NOTE: a relative path is resolved against the current directory for mkdir, but
13 | # against tools/evaluate_math (after the cd below) when passed to math_eval.py.
14 | mkdir -p "$OUTPUT_DIR"
15 | cd ../../tools/evaluate_math
16 | 
17 | DATA_NAME="math-500"
18 | TOKENIZERS_PARALLELISM=false \
19 | python3 -u math_eval.py \
20 |     --model_name_or_path "${MODEL_NAME_OR_PATH}" \
21 |     --data_name "${DATA_NAME}" \
22 |     --output_dir "${OUTPUT_DIR}" \
23 |     --summary_path "${SUMMARY_PATH}" \
24 |     --split "${SPLIT}" \
25 |     --prompt_type "${PROMPT_TYPE}" \
26 |     --num_test_sample "${NUM_TEST_SAMPLE}" \
27 |     --seed 0 \
28 |     --temperature 0 \
29 |     --n_sampling 1 \
30 |     --top_p 1 \
31 |     --start 0 \
32 |     --end -1 \
33 |     --use_vllm \
34 |     --save_outputs
35 |     # --overwrite  (disabled; append it to the command above to enable)


--------------------------------------------------------------------------------
/train/Validation/validation_on_math-500.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | import shutil
 3 | 
 4 | 
 5 | def main(summary_path, model_dir, output_dir):
 6 |     os.makedirs(output_dir, exist_ok=True)
 7 |     curr_accu = 60.0
 8 |     curr_ckpt = None
 9 |     with open(summary_path, 'r') as f:
10 |         for line in f.readlines():
11 |             segs = line.strip().split(" Final Accuracy: ")
12 |             accu = float(segs[1])
13 |             ckpt_num = segs[0].split("-checkpoint-")[1].split("/")[0]
14 |             if accu > curr_accu:
15 |                 curr_accu = accu
16 |                 curr_ckpt = ckpt_num
17 |     if not curr_ckpt:
18 |         print("Validation error")
19 |         return
20 |     source_folder = os.path.join(model_dir, f"checkpoint-{str(curr_ckpt)}")
21 |     shutil.copytree(source_folder, output_dir)
22 | 
23 | 
24 | if __name__ == "__main__":
25 |     main(
26 |         "",
27 |         "",
28 |         ""
29 |     )
30 | 
31 | 
32 | 


--------------------------------------------------------------------------------
/train/scripts/train_qwen2_5-32b-instruct-cft/qwen2.5-32b-cft-webinstruct-4k.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: /path/to/Qwen2.5-32B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | do_eval: false
 9 | finetuning_type: full
10 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
11 | 
12 | ### dataset
13 | dataset: WebInstruct-CFT-4K
14 | template: qwen
15 | cutoff_len: 2048
16 | max_samples: 100000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | 
20 | ### output
21 | output_dir: output_models/qwen2.5-32B-instruct-cft_WebInstruct-CFT-4K  # named after this config's base model and dataset
22 | logging_steps: 1
23 | save_steps: 2
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | save_only_model: true
27 | 
28 | ### train
29 | per_device_train_batch_size: 8
30 | gradient_accumulation_steps: 8
31 | learning_rate: 5.0e-6
32 | num_train_epochs: 1.0
33 | lr_scheduler_type: cosine
34 | warmup_ratio: 0.1
35 | bf16: true
36 | ddp_timeout: 180000000
37 | 


--------------------------------------------------------------------------------
/train/scripts/train_qwen2_5-32b-instruct-cft/train.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | # Launches llamafactory-cli training with the Qwen2.5-32B-Instruct CFT config.
 3 | cd ../../LLaMA-Factory || exit 1  # the YAML path below is relative to this directory
 4 | PROJECT_NAME="CFT"
 5 | export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
 6 | # WANDB_API_KEY is taken from the caller's environment; never commit a key to the repository.
 7 | export WANDB_PROJECT=$PROJECT_NAME
 8 | export WANDB_MODE=disabled
 9 | MASTER_PORT=$(shuf -i 20000-30000 -n 1)
10 | export MASTER_PORT
11 | export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
12 | 
13 | MODEL_NAME="critique-model"
14 | export WANDB_RUN_NAME=$MODEL_NAME
15 | 
16 | FORCE_TORCHRUN=1 llamafactory-cli train ../scripts/train_qwen2_5-32b-instruct-cft/qwen2.5-32b-cft-webinstruct-4k.yaml
17 | 


--------------------------------------------------------------------------------
/train/scripts/train_qwen2_5-math-7b-cft/qwen2.5-math-7b-cft-webinstruct-50k.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: /path/to/Qwen2.5-Math-7B
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | do_eval: false
 9 | finetuning_type: full
10 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
11 | 
12 | ### dataset
13 | dataset: WebInstruct-CFT-50K
14 | template: qwen
15 | cutoff_len: 2048
16 | max_samples: 100000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | 
20 | ### output
21 | output_dir: output_models/qwen2.5-math-7B-cft_WebInstruct-CFT-50K
22 | logging_steps: 1
23 | save_steps: 2
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | save_only_model: true
27 | 
28 | ### train
29 | per_device_train_batch_size: 8
30 | gradient_accumulation_steps: 8
31 | learning_rate: 5.0e-6
32 | num_train_epochs: 1.0
33 | lr_scheduler_type: cosine
34 | warmup_ratio: 0.1
35 | bf16: true
36 | ddp_timeout: 180000000
37 | 


--------------------------------------------------------------------------------
/train/scripts/train_qwen2_5-math-7b-cft/train.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | # Launches llamafactory-cli training with the Qwen2.5-Math-7B CFT config.
 3 | cd ../../LLaMA-Factory || exit 1  # the YAML path below is relative to this directory
 4 | PROJECT_NAME="CFT"
 5 | export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
 6 | # WANDB_API_KEY is taken from the caller's environment; never commit a key to the repository.
 7 | export WANDB_PROJECT=$PROJECT_NAME
 8 | export WANDB_MODE=disabled
 9 | MASTER_PORT=$(shuf -i 20000-30000 -n 1)
10 | export MASTER_PORT
11 | export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True
12 | 
13 | MODEL_NAME="critique-model"
14 | export WANDB_RUN_NAME=$MODEL_NAME
15 | 
16 | FORCE_TORCHRUN=1 llamafactory-cli train ../scripts/train_qwen2_5-math-7b-cft/qwen2.5-math-7b-cft-webinstruct-50k.yaml
17 | 


--------------------------------------------------------------------------------