├── .gitignore ├── README.md ├── assets ├── demo-vlthinker.png ├── iterative.png ├── keyword_evol.png └── overview.png ├── evaluation ├── eval_openvlthinker.py ├── eval_qwen.py ├── run_evaluation.py └── verify_mathverse_gpt4.py ├── generation ├── __init__.py └── generate_reasoning_thinker.py ├── paper └── OpenVLThinker_report.pdf ├── requirements.txt ├── train ├── README.md ├── easyr1 │ ├── .gitignore │ ├── Dockerfile │ ├── Dockerfile.legacy │ ├── LICENSE │ ├── Makefile │ ├── README.md │ ├── examples │ │ ├── config.yaml │ │ ├── format_prompt │ │ │ └── math_format.jinja │ │ ├── openvlthinker_grpo_hard.sh │ │ ├── openvlthinker_grpo_medium.sh │ │ ├── reward_function │ │ │ └── r1v.py │ │ └── runtime_env.yaml │ ├── pyproject.toml │ ├── requirements.txt │ ├── scripts │ │ └── model_merger.py │ ├── setup.py │ └── verl │ │ ├── __init__.py │ │ ├── models │ │ ├── __init__.py │ │ ├── monkey_patch.py │ │ └── transformers │ │ │ ├── __init__.py │ │ │ ├── flash_attention_utils.py │ │ │ └── qwen2_vl.py │ │ ├── protocol.py │ │ ├── single_controller │ │ ├── __init__.py │ │ ├── base │ │ │ ├── __init__.py │ │ │ ├── decorator.py │ │ │ ├── register_center │ │ │ │ ├── __init__.py │ │ │ │ └── ray.py │ │ │ ├── worker.py │ │ │ └── worker_group.py │ │ └── ray │ │ │ ├── __init__.py │ │ │ └── base.py │ │ ├── trainer │ │ ├── __init__.py │ │ ├── config.py │ │ ├── core_algos.py │ │ ├── data_loader.py │ │ ├── main.py │ │ ├── metrics.py │ │ └── ray_trainer.py │ │ ├── utils │ │ ├── __init__.py │ │ ├── checkpoint │ │ │ ├── __init__.py │ │ │ ├── checkpoint_manager.py │ │ │ └── fsdp_checkpoint_manager.py │ │ ├── dataset.py │ │ ├── flops_counter.py │ │ ├── fsdp_utils.py │ │ ├── logger │ │ │ ├── __init__.py │ │ │ ├── gen_logger.py │ │ │ └── logger.py │ │ ├── model_utils.py │ │ ├── py_functional.py │ │ ├── seqlen_balancing.py │ │ ├── tokenizer.py │ │ ├── torch_dtypes.py │ │ ├── torch_functional.py │ │ └── ulysses.py │ │ └── workers │ │ ├── __init__.py │ │ ├── actor │ │ ├── __init__.py │ │ ├── base.py │ │ ├── config.py │ │ └── dp_actor.py │ │ ├── config.py │ │ ├── critic │ │ ├── __init__.py │ │ ├── base.py │ │ ├── config.py │ │ └── dp_critic.py │ │ ├── fsdp_workers.py │ │ ├── reward │ │ ├── __init__.py │ │ ├── config.py │ │ └── function.py │ │ ├── rollout │ │ ├── __init__.py │ │ ├── base.py │ │ ├── config.py │ │ └── vllm_rollout_spmd.py │ │ └── sharding_manager │ │ ├── __init__.py │ │ ├── base.py │ │ ├── fsdp_ulysses.py │ │ └── fsdp_vllm.py └── llama-factory │ ├── .gitignore │ ├── Makefile │ ├── README.md │ ├── data │ └── dataset_info.json │ ├── examples │ └── deepspeed │ │ └── ds_z3_config.json │ ├── pyproject.toml │ ├── requirements.txt │ ├── scripts │ ├── api_example │ │ ├── test_image.py │ │ └── test_toolcall.py │ ├── convert_ckpt │ │ ├── llamafy_baichuan2.py │ │ └── llamafy_qwen.py │ ├── llama_pro.py │ ├── loftq_init.py │ ├── pissa_init.py │ ├── stat_utils │ │ ├── cal_flops.py │ │ ├── cal_lr.py │ │ ├── cal_mfu.py │ │ ├── cal_ppl.py │ │ └── length_cdf.py │ └── vllm_infer.py │ ├── setup.py │ ├── sft.yaml │ └── src │ ├── api.py │ ├── llamafactory.egg-info │ ├── PKG-INFO │ ├── SOURCES.txt │ ├── dependency_links.txt │ ├── entry_points.txt │ ├── requires.txt │ └── top_level.txt │ ├── llamafactory │ ├── __init__.py │ ├── api │ │ ├── __init__.py │ │ ├── app.py │ │ ├── chat.py │ │ ├── common.py │ │ └── protocol.py │ ├── chat │ │ ├── __init__.py │ │ ├── base_engine.py │ │ ├── chat_model.py │ │ ├── hf_engine.py │ │ └── vllm_engine.py │ ├── cli.py │ ├── data │ │ ├── __init__.py │ │ ├── collator.py │ │ ├── converter.py │ │ ├── data_utils.py │ │ ├── formatter.py │ │ ├── loader.py │ │ ├── mm_plugin.py │ │ ├── parser.py │ │ ├── processor │ │ │ ├── __init__.py │ │ │ ├── feedback.py │ │ │ ├── pairwise.py │ │ │ ├── pretrain.py │ │ │ ├── processor_utils.py │ │ │ ├── supervised.py │ │ │ └── unsupervised.py │ │ ├── template.py │ │ └── tool_utils.py │ ├── eval │ │ ├── __init__.py │ │ ├── evaluator.py │ │ └── template.py │ ├── extras │ │ ├── __init__.py │ │ ├── constants.py │ │ ├── env.py │ │ ├── logging.py │ │ ├── misc.py │ │ ├── packages.py │ │ └── ploting.py │ ├── hparams │ │ ├── __init__.py │ │ ├── data_args.py │ │ ├── evaluation_args.py │ │ ├── finetuning_args.py │ │ ├── generating_args.py │ │ ├── model_args.py │ │ ├── parser.py │ │ └── training_args.py │ ├── launcher.py │ ├── model │ │ ├── __init__.py │ │ ├── adapter.py │ │ ├── loader.py │ │ ├── model_utils │ │ │ ├── __init__.py │ │ │ ├── attention.py │ │ │ ├── checkpointing.py │ │ │ ├── embedding.py │ │ │ ├── liger_kernel.py │ │ │ ├── longlora.py │ │ │ ├── misc.py │ │ │ ├── mod.py │ │ │ ├── moe.py │ │ │ ├── packing.py │ │ │ ├── quantization.py │ │ │ ├── rope.py │ │ │ ├── unsloth.py │ │ │ ├── valuehead.py │ │ │ └── visual.py │ │ └── patcher.py │ ├── train │ │ ├── __init__.py │ │ ├── callbacks.py │ │ ├── dpo │ │ │ ├── __init__.py │ │ │ ├── trainer.py │ │ │ └── workflow.py │ │ ├── kto │ │ │ ├── __init__.py │ │ │ ├── trainer.py │ │ │ └── workflow.py │ │ ├── ppo │ │ │ ├── __init__.py │ │ │ ├── ppo_utils.py │ │ │ ├── trainer.py │ │ │ └── workflow.py │ │ ├── pt │ │ │ ├── __init__.py │ │ │ ├── trainer.py │ │ │ └── workflow.py │ │ ├── rm │ │ │ ├── __init__.py │ │ │ ├── metric.py │ │ │ ├── trainer.py │ │ │ └── workflow.py │ │ ├── sft │ │ │ ├── __init__.py │ │ │ ├── metric.py │ │ │ ├── trainer.py │ │ │ └── workflow.py │ │ ├── test_utils.py │ │ ├── trainer_utils.py │ │ └── tuner.py │ └── webui │ │ ├── __init__.py │ │ ├── chatter.py │ │ ├── common.py │ │ ├── components │ │ ├── __init__.py │ │ ├── chatbot.py │ │ ├── data.py │ │ ├── eval.py │ │ ├── export.py │ │ ├── infer.py │ │ ├── top.py │ │ └── train.py │ │ ├── control.py │ │ ├── css.py │ │ ├── engine.py │ │ ├── interface.py │ │ ├── locales.py │ │ ├── manager.py │ │ └── runner.py │ ├── train.py │ └── webui.py └── utils ├── __init__.py ├── clean_answer.py └── upload_model.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/README.md -------------------------------------------------------------------------------- /assets/demo-vlthinker.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/assets/demo-vlthinker.png -------------------------------------------------------------------------------- /assets/iterative.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/assets/iterative.png -------------------------------------------------------------------------------- /assets/keyword_evol.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/assets/keyword_evol.png -------------------------------------------------------------------------------- /assets/overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/assets/overview.png -------------------------------------------------------------------------------- /evaluation/eval_openvlthinker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/evaluation/eval_openvlthinker.py -------------------------------------------------------------------------------- /evaluation/eval_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/evaluation/eval_qwen.py -------------------------------------------------------------------------------- /evaluation/run_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/evaluation/run_evaluation.py -------------------------------------------------------------------------------- /evaluation/verify_mathverse_gpt4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/evaluation/verify_mathverse_gpt4.py -------------------------------------------------------------------------------- /generation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /generation/generate_reasoning_thinker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/generation/generate_reasoning_thinker.py -------------------------------------------------------------------------------- /paper/OpenVLThinker_report.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/paper/OpenVLThinker_report.pdf -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/requirements.txt -------------------------------------------------------------------------------- /train/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/README.md -------------------------------------------------------------------------------- /train/easyr1/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/.gitignore -------------------------------------------------------------------------------- /train/easyr1/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/Dockerfile -------------------------------------------------------------------------------- /train/easyr1/Dockerfile.legacy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/Dockerfile.legacy -------------------------------------------------------------------------------- /train/easyr1/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/LICENSE -------------------------------------------------------------------------------- /train/easyr1/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/Makefile -------------------------------------------------------------------------------- /train/easyr1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/README.md -------------------------------------------------------------------------------- /train/easyr1/examples/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/examples/config.yaml -------------------------------------------------------------------------------- /train/easyr1/examples/format_prompt/math_format.jinja: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/examples/format_prompt/math_format.jinja -------------------------------------------------------------------------------- /train/easyr1/examples/openvlthinker_grpo_hard.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/examples/openvlthinker_grpo_hard.sh -------------------------------------------------------------------------------- /train/easyr1/examples/openvlthinker_grpo_medium.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/examples/openvlthinker_grpo_medium.sh -------------------------------------------------------------------------------- /train/easyr1/examples/reward_function/r1v.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/examples/reward_function/r1v.py -------------------------------------------------------------------------------- /train/easyr1/examples/runtime_env.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/examples/runtime_env.yaml -------------------------------------------------------------------------------- /train/easyr1/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/pyproject.toml -------------------------------------------------------------------------------- /train/easyr1/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/requirements.txt -------------------------------------------------------------------------------- /train/easyr1/scripts/model_merger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/scripts/model_merger.py -------------------------------------------------------------------------------- /train/easyr1/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/setup.py -------------------------------------------------------------------------------- /train/easyr1/verl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/models/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/models/monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/models/monkey_patch.py -------------------------------------------------------------------------------- /train/easyr1/verl/models/transformers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/models/transformers/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/models/transformers/flash_attention_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/models/transformers/flash_attention_utils.py -------------------------------------------------------------------------------- /train/easyr1/verl/models/transformers/qwen2_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/models/transformers/qwen2_vl.py -------------------------------------------------------------------------------- /train/easyr1/verl/protocol.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/protocol.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/base/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/base/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/base/decorator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/base/decorator.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/base/register_center/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/base/register_center/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/base/register_center/ray.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/base/register_center/ray.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/base/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/base/worker.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/base/worker_group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/base/worker_group.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/ray/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/ray/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/single_controller/ray/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/single_controller/ray/base.py -------------------------------------------------------------------------------- /train/easyr1/verl/trainer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/trainer/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/trainer/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/trainer/config.py -------------------------------------------------------------------------------- /train/easyr1/verl/trainer/core_algos.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/trainer/core_algos.py -------------------------------------------------------------------------------- /train/easyr1/verl/trainer/data_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/trainer/data_loader.py -------------------------------------------------------------------------------- /train/easyr1/verl/trainer/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/trainer/main.py -------------------------------------------------------------------------------- /train/easyr1/verl/trainer/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/trainer/metrics.py -------------------------------------------------------------------------------- /train/easyr1/verl/trainer/ray_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/trainer/ray_trainer.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/checkpoint/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/checkpoint/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/checkpoint/checkpoint_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/checkpoint/checkpoint_manager.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/checkpoint/fsdp_checkpoint_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/checkpoint/fsdp_checkpoint_manager.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/dataset.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/flops_counter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/flops_counter.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/fsdp_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/fsdp_utils.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/logger/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/logger/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/logger/gen_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/logger/gen_logger.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/logger/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/logger/logger.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/model_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/model_utils.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/py_functional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/py_functional.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/seqlen_balancing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/seqlen_balancing.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/tokenizer.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/torch_dtypes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/torch_dtypes.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/torch_functional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/torch_functional.py -------------------------------------------------------------------------------- /train/easyr1/verl/utils/ulysses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/utils/ulysses.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/actor/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/actor/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/actor/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/actor/base.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/actor/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/actor/config.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/actor/dp_actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/actor/dp_actor.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/config.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/critic/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/critic/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/critic/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/critic/base.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/critic/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/critic/config.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/critic/dp_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/critic/dp_critic.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/fsdp_workers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/fsdp_workers.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/reward/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/reward/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/reward/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/reward/config.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/reward/function.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/reward/function.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/rollout/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/rollout/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/rollout/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/rollout/base.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/rollout/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/rollout/config.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/rollout/vllm_rollout_spmd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/rollout/vllm_rollout_spmd.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/sharding_manager/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/sharding_manager/__init__.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/sharding_manager/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/sharding_manager/base.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/sharding_manager/fsdp_ulysses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/sharding_manager/fsdp_ulysses.py -------------------------------------------------------------------------------- /train/easyr1/verl/workers/sharding_manager/fsdp_vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/easyr1/verl/workers/sharding_manager/fsdp_vllm.py -------------------------------------------------------------------------------- /train/llama-factory/.gitignore: -------------------------------------------------------------------------------- 1 | saves/ 2 | wandb/ -------------------------------------------------------------------------------- /train/llama-factory/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/Makefile -------------------------------------------------------------------------------- /train/llama-factory/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/README.md -------------------------------------------------------------------------------- /train/llama-factory/data/dataset_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/data/dataset_info.json -------------------------------------------------------------------------------- /train/llama-factory/examples/deepspeed/ds_z3_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/examples/deepspeed/ds_z3_config.json -------------------------------------------------------------------------------- /train/llama-factory/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/pyproject.toml -------------------------------------------------------------------------------- /train/llama-factory/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/requirements.txt -------------------------------------------------------------------------------- /train/llama-factory/scripts/api_example/test_image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/api_example/test_image.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/api_example/test_toolcall.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/api_example/test_toolcall.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/convert_ckpt/llamafy_baichuan2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/convert_ckpt/llamafy_baichuan2.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/convert_ckpt/llamafy_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/convert_ckpt/llamafy_qwen.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/llama_pro.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/llama_pro.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/loftq_init.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/loftq_init.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/pissa_init.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/pissa_init.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/stat_utils/cal_flops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/stat_utils/cal_flops.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/stat_utils/cal_lr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/stat_utils/cal_lr.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/stat_utils/cal_mfu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/stat_utils/cal_mfu.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/stat_utils/cal_ppl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/stat_utils/cal_ppl.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/stat_utils/length_cdf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/stat_utils/length_cdf.py -------------------------------------------------------------------------------- /train/llama-factory/scripts/vllm_infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/scripts/vllm_infer.py -------------------------------------------------------------------------------- /train/llama-factory/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/setup.py -------------------------------------------------------------------------------- /train/llama-factory/sft.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/sft.yaml -------------------------------------------------------------------------------- /train/llama-factory/src/api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/api.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory.egg-info/PKG-INFO: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory.egg-info/PKG-INFO -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory.egg-info/SOURCES.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory.egg-info/SOURCES.txt -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory.egg-info/dependency_links.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory.egg-info/entry_points.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory.egg-info/entry_points.txt -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory.egg-info/requires.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory.egg-info/requires.txt -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory.egg-info/top_level.txt: -------------------------------------------------------------------------------- 1 | llamafactory 2 | -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/api/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/api/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/api/app.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/api/chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/api/chat.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/api/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/api/common.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/api/protocol.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/api/protocol.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/chat/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/chat/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/chat/base_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/chat/base_engine.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/chat/chat_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/chat/chat_model.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/chat/hf_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/chat/hf_engine.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/chat/vllm_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/chat/vllm_engine.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/cli.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/collator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/collator.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/converter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/converter.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/data_utils.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/formatter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/formatter.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/loader.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/mm_plugin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/mm_plugin.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/parser.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/processor/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/processor/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/processor/feedback.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/processor/feedback.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/processor/pairwise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/processor/pairwise.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/processor/pretrain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/processor/pretrain.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/processor/processor_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/processor/processor_utils.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/processor/supervised.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/processor/supervised.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/processor/unsupervised.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/processor/unsupervised.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/template.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/data/tool_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/data/tool_utils.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/eval/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/eval/evaluator.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/eval/template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/eval/template.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/extras/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/extras/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/extras/constants.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/extras/env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/extras/env.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/extras/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/extras/logging.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/extras/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/extras/misc.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/extras/packages.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/extras/packages.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/extras/ploting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/extras/ploting.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/hparams/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/hparams/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/hparams/data_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/hparams/data_args.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/hparams/evaluation_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/hparams/evaluation_args.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/hparams/finetuning_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/hparams/finetuning_args.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/hparams/generating_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/hparams/generating_args.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/hparams/model_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/hparams/model_args.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/hparams/parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/hparams/parser.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/hparams/training_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/hparams/training_args.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/launcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/launcher.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/adapter.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/loader.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/attention.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/checkpointing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/checkpointing.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/embedding.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/liger_kernel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/liger_kernel.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/longlora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/longlora.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/misc.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/mod.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/mod.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/moe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/moe.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/packing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/packing.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/quantization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/quantization.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/rope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/rope.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/unsloth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/unsloth.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/valuehead.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/valuehead.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/model_utils/visual.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/model_utils/visual.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/model/patcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/model/patcher.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/callbacks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/callbacks.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/dpo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/dpo/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/dpo/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/dpo/trainer.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/dpo/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/dpo/workflow.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/kto/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/kto/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/kto/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/kto/trainer.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/kto/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/kto/workflow.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/ppo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/ppo/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/ppo/ppo_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/ppo/ppo_utils.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/ppo/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/ppo/trainer.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/ppo/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/ppo/workflow.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/pt/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/pt/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/pt/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/pt/trainer.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/pt/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/pt/workflow.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/rm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/rm/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/rm/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/rm/metric.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/rm/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/rm/trainer.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/rm/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/rm/workflow.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/sft/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/sft/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/sft/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/sft/metric.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/sft/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/sft/trainer.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/sft/workflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/sft/workflow.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/test_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/test_utils.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/trainer_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/trainer_utils.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/train/tuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/train/tuner.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/chatter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/chatter.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/common.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/components/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/components/__init__.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/components/chatbot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/components/chatbot.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/components/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/components/data.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/components/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/components/eval.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/components/export.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/components/export.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/components/infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/components/infer.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/components/top.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/components/top.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/components/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/components/train.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/control.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/control.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/css.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/css.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/engine.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/interface.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/locales.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/locales.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/manager.py -------------------------------------------------------------------------------- /train/llama-factory/src/llamafactory/webui/runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/llamafactory/webui/runner.py -------------------------------------------------------------------------------- /train/llama-factory/src/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/train.py -------------------------------------------------------------------------------- /train/llama-factory/src/webui.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/train/llama-factory/src/webui.py -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /utils/clean_answer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/utils/clean_answer.py -------------------------------------------------------------------------------- /utils/upload_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yihedeng9/OpenVLThinker/HEAD/utils/upload_model.py --------------------------------------------------------------------------------