├── api
    ├── rag
    │   ├── r1rag
    │   │   └── __init__.py
    │   ├── .gitignore
    │   ├── configs
    │   │   └── egolife.yaml
    │   └── pyproject.toml
    └── visual_tools
    │   ├── configs.yaml
    │   ├── egoschema_videollm_llava
    │       └── video_llm.py
    │   ├── videomme_videollm_llava
    │       └── video_llm.py
    │   ├── egoschema_vlm
    │       ├── vlm.py
    │       └── api.py
    │   ├── videomme_vlm
    │       ├── vlm.py
    │       └── api.py
    │   ├── egor1_vlm
    │       ├── vlm.py
    │       └── api.py
    │   └── egor1_videollm_llava
    │       └── video_llm.py
├── Ego-R1-Agent
    ├── verl
    │   ├── version
    │   │   └── version
    │   ├── single_controller
    │   │   ├── version
    │   │   │   └── version
    │   │   ├── base
    │   │   │   ├── megatron
    │   │   │   │   ├── __init__.py
    │   │   │   │   └── worker.py
    │   │   │   ├── register_center
    │   │   │   │   ├── __init__.py
    │   │   │   │   └── ray.py
    │   │   │   └── __init__.py
    │   │   ├── ray
    │   │   │   └── __init__.py
    │   │   └── __init__.py
    │   ├── trainer
    │   │   ├── runtime_env.yaml
    │   │   ├── config
    │   │   │   ├── evaluation.yaml
    │   │   │   ├── generation.yaml
    │   │   │   └── sft_trainer.yaml
    │   │   ├── __init__.py
    │   │   └── ppo
    │   │   │   └── __init__.py
    │   ├── models
    │   │   ├── __init__.py
    │   │   ├── llama
    │   │   │   ├── __init__.py
    │   │   │   └── megatron
    │   │   │   │   ├── checkpoint_utils
    │   │   │   │       └── __init__.py
    │   │   │   │   ├── layers
    │   │   │   │       ├── __init__.py
    │   │   │   │       └── parallel_rmsnorm.py
    │   │   │   │   └── __init__.py
    │   │   ├── transformers
    │   │   │   └── __init__.py
    │   │   ├── weight_loader_registry.py
    │   │   └── README.md
    │   ├── workers
    │   │   ├── __init__.py
    │   │   ├── reward_model
    │   │   │   ├── __init__.py
    │   │   │   ├── megatron
    │   │   │   │   └── __init__.py
    │   │   │   └── base.py
    │   │   ├── rollout
    │   │   │   ├── naive
    │   │   │   │   └── __init__.py
    │   │   │   ├── vllm_rollout
    │   │   │   │   └── __init__.py
    │   │   │   ├── __init__.py
    │   │   │   └── base.py
    │   │   ├── actor
    │   │   │   └── __init__.py
    │   │   ├── critic
    │   │   │   ├── __init__.py
    │   │   │   └── base.py
    │   │   └── sharding_manager
    │   │   │   ├── base.py
    │   │   │   └── __init__.py
    │   ├── third_party
    │   │   ├── __init__.py
    │   │   └── vllm
    │   │   │   ├── vllm_v_0_3_1
    │   │   │       └── __init__.py
    │   │   │   ├── vllm_v_0_4_2
    │   │   │       └── __init__.py
    │   │   │   ├── vllm_v_0_5_4
    │   │   │       ├── __init__.py
    │   │   │       └── hf_weight_loader.py
    │   │   │   ├── vllm_v_0_6_3
    │   │   │       ├── __init__.py
    │   │   │       ├── tokenizer.py
    │   │   │       └── hf_weight_loader.py
    │   │   │   └── __init__.py
    │   ├── utils
    │   │   ├── logger
    │   │   │   ├── __init__.py
    │   │   │   └── aggregate_logger.py
    │   │   ├── megatron
    │   │   │   ├── __init__.py
    │   │   │   ├── memory.py
    │   │   │   └── sequence_parallel.py
    │   │   ├── rendezvous
    │   │   │   └── __init__.py
    │   │   ├── reward_score
    │   │   │   └── __init__.py
    │   │   ├── debug
    │   │   │   ├── __init__.py
    │   │   │   └── performance.py
    │   │   ├── dataset
    │   │   │   ├── __init__.py
    │   │   │   └── README.md
    │   │   ├── __init__.py
    │   │   ├── config.py
    │   │   ├── logging_utils.py
    │   │   ├── distributed.py
    │   │   ├── import_utils.py
    │   │   ├── ray_utils.py
    │   │   └── py_functional.py
    │   └── __init__.py
    ├── ego_r1
    │   ├── llm_agent
    │   │   └── __init__.py
    │   └── search
    │   │   ├── retrieval_request.py
    │   │   ├── build_index.sh
    │   │   └── retrieval.sh
    ├── utils
    │   └── serve.sh
    ├── README.md
    ├── eval
    │   └── infer_bench_summ.sh
    ├── .gitignore
    └── setup.py
├── LLaMA-Factory
    ├── src
    │   ├── llamafactory
    │   │   ├── api
    │   │   │   ├── __init__.py
    │   │   │   └── common.py
    │   │   ├── eval
    │   │   │   └── __init__.py
    │   │   ├── train
    │   │   │   ├── __init__.py
    │   │   │   ├── pt
    │   │   │   │   └── __init__.py
    │   │   │   ├── rm
    │   │   │   │   ├── __init__.py
    │   │   │   │   └── metric.py
    │   │   │   ├── dpo
    │   │   │   │   └── __init__.py
    │   │   │   ├── kto
    │   │   │   │   └── __init__.py
    │   │   │   ├── ppo
    │   │   │   │   └── __init__.py
    │   │   │   └── sft
    │   │   │   │   └── __init__.py
    │   │   ├── webui
    │   │   │   ├── __init__.py
    │   │   │   ├── components
    │   │   │   │   └── __init__.py
    │   │   │   └── css.py
    │   │   ├── extras
    │   │   │   └── __init__.py
    │   │   ├── third_party
    │   │   │   ├── __init__.py
    │   │   │   └── muon
    │   │   │   │   └── __init__.py
    │   │   ├── model
    │   │   │   ├── model_utils
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── mod.py
    │   │   │   │   └── kv_cache.py
    │   │   │   └── __init__.py
    │   │   ├── chat
    │   │   │   └── __init__.py
    │   │   ├── launcher.py
    │   │   ├── __init__.py
    │   │   ├── data
    │   │   │   ├── processor
    │   │   │   │   └── __init__.py
    │   │   │   └── __init__.py
    │   │   └── hparams
    │   │   │   └── __init__.py
    │   ├── train.py
    │   ├── api.py
    │   └── webui.py
    ├── MANIFEST.in
    ├── .github
    │   ├── ISSUE_TEMPLATE
    │   │   ├── config.yml
    │   │   └── 2-feature-request.yml
    │   ├── PULL_REQUEST_TEMPLATE.md
    │   ├── SECURITY.md
    │   └── workflows
    │   │   ├── publish.yml
    │   │   └── label_issue.yml
    ├── .gitattributes
    ├── data
    │   ├── mllm_demo_data
    │   │   ├── 1.jpg
    │   │   ├── 1.mp3
    │   │   ├── 1.mp4
    │   │   ├── 2.avi
    │   │   ├── 2.jpg
    │   │   ├── 2.wav
    │   │   ├── 3.flac
    │   │   ├── 3.jpg
    │   │   ├── 3.mp4
    │   │   ├── 4.mp3
    │   │   └── 4.mp4
    │   ├── mllm_video_demo.json
    │   ├── mllm_audio_demo.json
    │   └── mllm_video_audio_demo.json
    ├── examples
    │   ├── extras
    │   │   ├── pissa
    │   │   │   ├── init.sh
    │   │   │   └── llama3_lora_sft.yaml
    │   │   ├── llama_pro
    │   │   │   ├── expand.sh
    │   │   │   └── llama3_freeze_sft.yaml
    │   │   ├── fsdp_qlora
    │   │   │   ├── train.sh
    │   │   │   └── llama3_lora_sft.yaml
    │   │   ├── nlg_eval
    │   │   │   └── llama3_lora_predict.yaml
    │   │   ├── muon
    │   │   │   └── qwen2_full_sft.yaml
    │   │   ├── adam_mini
    │   │   │   └── qwen2_full_sft.yaml
    │   │   ├── mod
    │   │   │   └── llama3_full_sft.yaml
    │   │   ├── loraplus
    │   │   │   └── llama3_lora_sft.yaml
    │   │   ├── badam
    │   │   │   └── llama3_full_sft.yaml
    │   │   ├── galore
    │   │   │   └── llama3_full_sft.yaml
    │   │   └── apollo
    │   │   │   └── llama3_full_sft.yaml
    │   ├── inference
    │   │   ├── llama3_full_sft.yaml
    │   │   ├── qwen2_vl.yaml
    │   │   ├── llama3.yaml
    │   │   └── llama3_lora_sft.yaml
    │   ├── merge_lora
    │   │   ├── llama3_full_sft.yaml
    │   │   ├── llama3_gptq.yaml
    │   │   ├── llama3_lora_sft.yaml
    │   │   └── qwen2vl_lora_sft.yaml
    │   ├── train_lora
    │   │   ├── llama3_lora_eval.yaml
    │   │   ├── llama3_preprocess.yaml
    │   │   ├── llama3_lora_ppo.yaml
    │   │   ├── llama3_lora_kto.yaml
    │   │   ├── llama3_lora_sft.sh
    │   │   ├── llama3_lora_pretrain.yaml
    │   │   ├── llama3_lora_reward.yaml
    │   │   ├── llama3_lora_sft.yaml
    │   │   ├── qwen2vl_lora_sft.yaml
    │   │   ├── llama3_lora_dpo.yaml
    │   │   ├── qwen2vl_lora_dpo.yaml
    │   │   ├── llama3_lora_sft_ds3.yaml
    │   │   ├── llama4_lora_sft_ds3.yaml
    │   │   └── llama3_lora_sft_ray.yaml
    │   ├── accelerate
    │   │   ├── fsdp_config.yaml
    │   │   └── fsdp_config_offload.yaml
    │   ├── train_qlora
    │   │   ├── llama3_lora_sft_awq.yaml
    │   │   ├── llama3_lora_sft_gptq.yaml
    │   │   ├── llama3_lora_sft_aqlm.yaml
    │   │   ├── llama3_lora_sft_bnb_npu.yaml
    │   │   └── llama3_lora_sft_otfq.yaml
    │   └── train_full
    │   │   ├── llama3_full_sft.yaml
    │   │   ├── qwen2vl_full_sft.yaml
    │   │   └── qwen.yaml
    ├── .dockerignore
    ├── Makefile
    ├── .pre-commit-config.yaml
    ├── .env.local
    ├── docker
    │   ├── docker-npu
    │   │   └── docker-compose.yml
    │   ├── docker-cuda
    │   │   └── docker-compose.yml
    │   └── docker-rocm
    │   │   └── docker-compose.yml
    ├── tests
    │   ├── data
    │   │   ├── processor
    │   │   │   └── test_processor_utils.py
    │   │   └── test_loader.py
    │   ├── check_license.py
    │   ├── e2e
    │   │   └── test_chat.py
    │   └── model
    │   │   ├── test_base.py
    │   │   ├── model_utils
    │   │       ├── test_misc.py
    │   │       ├── test_add_tokens.py
    │   │       └── test_attention.py
    │   │   └── test_full.py
    ├── CITATION.cff
    └── scripts
    │   ├── convert_ckpt
    │       └── tiny_llama4.py
    │   └── stat_utils
    │       └── cal_flops.py
├── assets
    └── teaser.png
├── .gitignore
└── cott_gen
    └── __init__.py


/api/rag/r1rag/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/version/version:
--------------------------------------------------------------------------------
1 | 0.1


--------------------------------------------------------------------------------
/Ego-R1-Agent/ego_r1/llm_agent/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/api/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/eval/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/train/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/webui/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/extras/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/single_controller/version/version:
--------------------------------------------------------------------------------
1 | 0.0.2


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/third_party/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/MANIFEST.in:
--------------------------------------------------------------------------------
1 | include LICENSE requirements.txt
2 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/model/model_utils/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/.github/ISSUE_TEMPLATE/config.yml:
--------------------------------------------------------------------------------
1 | blank_issues_enabled: false
2 | 


--------------------------------------------------------------------------------
/assets/teaser.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/assets/teaser.png


--------------------------------------------------------------------------------
/LLaMA-Factory/.gitattributes:
--------------------------------------------------------------------------------
1 | # Auto detect text files and perform LF normalization
2 | * text=auto
3 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/1.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/1.jpg


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/1.mp3:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/1.mp3


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/1.mp4:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/1.mp4


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/2.avi:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/2.avi


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/2.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/2.jpg


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/2.wav:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/2.wav


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/3.flac:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/3.flac


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/3.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/3.jpg


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/3.mp4:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/3.mp4


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/4.mp3:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/4.mp3


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_demo_data/4.mp4:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/egolife-ai/Ego-R1/HEAD/LLaMA-Factory/data/mllm_demo_data/4.mp4


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/trainer/runtime_env.yaml:
--------------------------------------------------------------------------------
1 | working_dir: ./
2 | excludes: ["/.git/"]
3 | env_vars:
4 |   TORCH_NCCL_AVOID_RECORD_STREAMS: "1"
5 |   VLLM_ATTENTION_BACKEND: "XFORMERS"


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/pissa/init.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | # Run scripts/pissa_init.py on Meta-Llama-3-8B-Instruct; output goes to models/llama3-8b-pissa
3 | python scripts/pissa_init.py \
4 |     --model_name_or_path meta-llama/Meta-Llama-3-8B-Instruct \
5 |     --output_dir models/llama3-8b-pissa
6 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/inference/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: saves/llama3-8b/full/sft
2 | template: llama3
3 | infer_backend: huggingface  # choices: [huggingface, vllm, sglang]
4 | trust_remote_code: true
5 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/inference/qwen2_vl.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: Qwen/Qwen2.5-VL-7B-Instruct
2 | template: qwen2_vl
3 | infer_backend: huggingface  # choices: [huggingface, vllm, sglang]
4 | trust_remote_code: true
5 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/trainer/config/evaluation.yaml:
--------------------------------------------------------------------------------
1 | data:
2 |   path: /tmp/math_Qwen2-7B-Instruct.parquet
3 |   prompt_key: prompt
4 |   response_key: responses
5 |   data_source_key: data_source
6 |   reward_model_key: reward_model


--------------------------------------------------------------------------------
/LLaMA-Factory/.dockerignore:
--------------------------------------------------------------------------------
 1 | .vscode
 2 | .git
 3 | .github
 4 | .venv
 5 | cache
 6 | data
 7 | docker
 8 | saves
 9 | hf_cache
10 | ms_cache
11 | om_cache
12 | output
13 | .dockerignore
14 | .gitattributes
15 | .gitignore
16 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/inference/llama3.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
2 | template: llama3
3 | infer_backend: huggingface  # choices: [huggingface, vllm, sglang]
4 | trust_remote_code: true
5 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/llama_pro/expand.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | # Run scripts/llama_pro.py on Meta-Llama-3-8B-Instruct with --num_expand 8; output goes to models/llama3-8b-pro
3 | python scripts/llama_pro.py \
4 |     --model_name_or_path meta-llama/Meta-Llama-3-8B-Instruct \
5 |     --output_dir models/llama3-8b-pro \
6 |     --num_expand 8
7 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/inference/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
1 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
2 | adapter_name_or_path: saves/llama3-8b/lora/sft
3 | template: llama3
4 | infer_backend: huggingface  # choices: [huggingface, vllm, sglang]
5 | trust_remote_code: true
6 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/fsdp_qlora/train.sh:
--------------------------------------------------------------------------------
1 | #!/bin/bash
2 | # DO NOT use GPTQ/AWQ models with FSDP+QLoRA
3 | # Launch src/train.py through accelerate on GPUs 0 and 1 using the FSDP accelerate config
4 | CUDA_VISIBLE_DEVICES=0,1 accelerate launch \
5 |     --config_file examples/accelerate/fsdp_config.yaml \
6 |     src/train.py examples/extras/fsdp_qlora/llama3_lora_sft.yaml
7 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/.github/PULL_REQUEST_TEMPLATE.md:
--------------------------------------------------------------------------------
1 | # What does this PR do?
2 | 
3 | Fixes # (issue)
4 | 
5 | ## Before submitting
6 | 
7 | - [ ] Did you read the [contributor guideline](https://github.com/hiyouga/LLaMA-Factory/blob/main/.github/CONTRIBUTING.md)?
8 | - [ ] Did you write any new necessary tests?
9 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/merge_lora/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: saves/llama3-8b/full/sft
 3 | template: llama3
 4 | trust_remote_code: true
 5 | 
 6 | ### export
 7 | export_dir: output/llama3_full_sft
 8 | export_size: 5
 9 | export_device: cpu  # choices: [cpu, auto]
10 | export_legacy_format: false
11 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
 1 | *.json
 2 | *.jpg
 3 | *.png
 4 | *.mp4
 5 | *.pt
 6 | *.pth
 7 | *.safetensors
 8 | __pycache__
 9 | *.pyc
10 | *.log
11 | *.txt
12 | *.csv
13 | *.jsonl
14 | *.sample
15 | *.xlsx
16 | *.avi
17 | *.mp3
18 | *.wav
19 | *.flac
20 | *.zip
21 | *.tar
22 | *.gz
23 | api/hmguo/NVIDIA-Linux-x86_64-*.run
24 | api/hmguo/fastrag/database/JAKE/*.pkl
25 | Search_R1/tmp
26 | api/


--------------------------------------------------------------------------------
/Ego-R1-Agent/utils/serve.sh:
--------------------------------------------------------------------------------
 1 | export CUDA_VISIBLE_DEVICES=0,1
 2 | # Disabled alternative: serve Qwen/Qwen2.5-3B-Instruct on port 23332 with the same flags
 3 | # vllm serve Qwen/Qwen2.5-3B-Instruct --port=23332 \
 4 | #     --tensor-parallel-size=2 \
 5 | #     --gpu-memory-utilization=0.7 \
 6 | #     --disable-custom-all-reduce
 7 | 
 8 | # Serve Ego-R1/Ego-R1-Agent-3B on port 23333, tensor-parallel across the two GPUs exposed above
 9 | vllm serve Ego-R1/Ego-R1-Agent-3B --port=23333 \
10 |     --tensor-parallel-size=2 \
11 |     --gpu-memory-utilization=0.7 \
12 |     --disable-custom-all-reduce


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/merge_lora/llama3_gptq.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | template: llama3
 4 | trust_remote_code: true
 5 | 
 6 | ### export
 7 | export_dir: output/llama3_gptq
 8 | export_quantization_bit: 4
 9 | export_quantization_dataset: data/c4_demo.jsonl
10 | export_size: 5
11 | export_device: cpu  # choices: [cpu, auto]
12 | export_legacy_format: false
13 | 


--------------------------------------------------------------------------------
/api/rag/.gitignore:
--------------------------------------------------------------------------------
 1 | # Ignore logs directory
 2 | logs/
 3 | logs/*
 4 | 
 5 | # Ignore data directory
 6 | data/
 7 | data/*
 8 | 
 9 | # Python specific ignores
10 | __pycache__/
11 | *.py[cod]
12 | *$py.class
13 | *.so
14 | .Python
15 | build/
16 | develop-eggs/
17 | dist/
18 | downloads/
19 | eggs/
20 | .eggs/
21 | lib/
22 | lib64/
23 | parts/
24 | sdist/
25 | var/
26 | wheels/
27 | *.egg-info/
28 | .installed.cfg
29 | *.egg


--------------------------------------------------------------------------------
/api/rag/configs/egolife.yaml:
--------------------------------------------------------------------------------
 1 | # API configurations
 2 | apis:
 3 |   A1:
 4 |     identity: JAKE
 5 |     port: 8001
 6 |   A2:
 7 |     identity: ALICE
 8 |     port: 8002
 9 |   A3:
10 |     identity: TASHA
11 |     port: 8003
12 |   A4:
13 |     identity: LUCIA
14 |     port: 8004
15 |   A5:
16 |     identity: KATRINA
17 |     port: 8005
18 |   A6:
19 |     identity: SHURE
20 |     port: 8006
21 | 
22 | # Base settings
23 | base:
24 |   data_dir: data/egolife
25 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/merge_lora/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### Note: DO NOT use a quantized model or quantization_bit when merging LoRA adapters
 2 | 
 3 | ### model
 4 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 5 | adapter_name_or_path: saves/llama3-8b/lora/sft
 6 | template: llama3
 7 | trust_remote_code: true
 8 | 
 9 | ### export
10 | export_dir: output/llama3_lora_sft
11 | export_size: 5
12 | export_device: cpu  # choices: [cpu, auto]
13 | export_legacy_format: false
14 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/merge_lora/qwen2vl_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### Note: DO NOT use a quantized model or quantization_bit when merging LoRA adapters
 2 | 
 3 | ### model
 4 | model_name_or_path: Qwen/Qwen2.5-VL-7B-Instruct
 5 | adapter_name_or_path: saves/qwen2_vl-7b/lora/sft
 6 | template: qwen2_vl
 7 | trust_remote_code: true
 8 | 
 9 | ### export
10 | export_dir: output/qwen2_vl_lora_sft
11 | export_size: 5
12 | export_device: cpu  # choices: [cpu, auto]
13 | export_legacy_format: false
14 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_eval.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | adapter_name_or_path: saves/llama3-8b/lora/sft
 4 | trust_remote_code: true
 5 | 
 6 | ### method
 7 | finetuning_type: lora
 8 | 
 9 | ### dataset
10 | task: mmlu_test  # choices: [mmlu_test, ceval_validation, cmmlu_test]
11 | template: fewshot
12 | lang: en
13 | n_shot: 5
14 | 
15 | ### output
16 | save_dir: saves/llama3-8b/lora/eval
17 | 
18 | ### eval
19 | batch_size: 4
20 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/Makefile:
--------------------------------------------------------------------------------
 1 | .PHONY: build commit license quality style test
 2 | # Paths handed to the license checker and to ruff in the targets below
 3 | check_dirs := scripts src tests setup.py
 4 | # Install the `build` package, then run it to build the project
 5 | build:
 6 | 	pip3 install build && python3 -m build
 7 | # Install the pre-commit hooks and run them against every file
 8 | commit:
 9 | 	pre-commit install
10 | 	pre-commit run --all-files
11 | # Run tests/check_license.py over check_dirs
12 | license:
13 | 	python3 tests/check_license.py $(check_dirs)
14 | # Lint with ruff and check formatting (no --fix, format runs with --check)
15 | quality:
16 | 	ruff check $(check_dirs)
17 | 	ruff format --check $(check_dirs)
18 | # Run ruff with --fix and reformat check_dirs
19 | style:
20 | 	ruff check $(check_dirs) --fix
21 | 	ruff format $(check_dirs)
22 | # Run pytest on tests/ with CUDA_VISIBLE_DEVICES emptied and WANDB_DISABLED=true
23 | test:
24 | 	CUDA_VISIBLE_DEVICES= WANDB_DISABLED=true pytest -vv tests/
25 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/.github/SECURITY.md:
--------------------------------------------------------------------------------
1 | # Reporting Security Issues
2 | 
3 | To report a security issue, please use the GitHub Security Advisory ["Report a Vulnerability"](https://github.com/hiyouga/LLaMA-Factory/security/advisories/new) tab.
4 | 
5 | We will send a response indicating the next steps in handling your report. After the initial reply to your report, the security team will keep you informed of the progress towards a fix and full announcement, and may ask for additional information or guidance.
6 | 
7 | Report security bugs in third-party modules to the person or team maintaining the module.
8 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_preprocess.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | tokenized_path: saves/llama3-8b/dataset/sft
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b/lora/sft
23 | overwrite_output_dir: true
24 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/ego_r1/search/retrieval_request.py:
--------------------------------------------------------------------------------
 1 | import requests
 2 | 
 3 | # URL for your local FastAPI server
 4 | url = "http://127.0.0.1:8000/retrieve"
 5 | 
 6 | # Example payload
 7 | payload = {
 8 |     "queries": ["What is the capital of France?", "Explain neural networks."] * 200,
 9 |     "topk": 5,
10 |     "return_scores": True
11 | }
12 | 
13 | # Send POST request
14 | response = requests.post(url, json=payload)
15 | 
16 | # Raise an exception if the request failed
17 | response.raise_for_status()
18 | 
19 | # Get the JSON response
20 | retrieved_data = response.json()
21 | 
22 | print("Response from server:")
23 | print(retrieved_data)
24 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/trainer/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/llama/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/trainer/ppo/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/logger/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/megatron/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/rendezvous/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/transformers/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/reward_score/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/single_controller/base/megatron/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/vllm/vllm_v_0_3_1/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/vllm/vllm_v_0_4_2/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/vllm/vllm_v_0_5_4/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/vllm/vllm_v_0_6_3/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/llama/megatron/checkpoint_utils/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/single_controller/base/register_center/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/debug/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .performance import log_gpu_memory_usage


--------------------------------------------------------------------------------
/api/rag/pyproject.toml:
--------------------------------------------------------------------------------
 1 | [build-system]
 2 | requires = ["hatchling"]
 3 | build-backend = "hatchling.build"
 4 | 
 5 | [project]
 6 | name = "r1rag"
 7 | version = "0.1.0"
 8 | description = "A RAG system for video captions with temporal indexing"
 9 | requires-python = ">=3.8"
10 | license = "MIT"
11 | authors = [
12 |     { name = "Hongming", email = "ghm0221@bupt.edu.cn" }
13 | ]
14 | dependencies = [
15 |     "numpy>=1.21.0,<1.27.0",
16 |     "pandas>=1.3.0,<2.0.0",
17 |     "nltk>=3.6.0",
18 |     "fastapi",
19 |     "uvicorn[standard]",
20 |     "pillow>=9.2.0",
21 |     "PyYAML",
22 |     "psutil",
23 |     "openai>=1.0.0", 
24 |     "requests",
25 |     "google-genai",  
26 |     "ffmpeg-python",
27 |     "opencv-python"
28 | ]
29 | 
30 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/reward_model/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .base import BasePPORewardModel
16 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/rollout/naive/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .naive_rollout import NaiveRollout
16 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/rollout/vllm_rollout/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .vllm_rollout import vLLMRollout


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/reward_model/megatron/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .reward_model import MegatronRewardModel
16 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/third_party/muon/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .muon import Muon
16 | 
17 | 
18 | __all__ = ["Muon"]
19 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/train/pt/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_pt
16 | 
17 | 
18 | __all__ = ["run_pt"]
19 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/train/rm/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_rm
16 | 
17 | 
18 | __all__ = ["run_rm"]
19 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/train/dpo/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_dpo
16 | 
17 | 
18 | __all__ = ["run_dpo"]
19 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/train/kto/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_kto
16 | 
17 | 
18 | __all__ = ["run_kto"]
19 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/train/ppo/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_ppo
16 | 
17 | 
18 | __all__ = ["run_ppo"]
19 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/train/sft/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .workflow import run_sft
16 | 
17 | 
18 | __all__ = ["run_sft"]
19 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/dataset/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .rl_dataset import RLHFDataset
16 | from .rm_dataset import RMDataset


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from . import tokenizer
16 | from .tokenizer import *
17 | 
18 | __all__ = tokenizer.__all__


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/single_controller/base/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .worker import Worker
16 | from .worker_group import WorkerGroup, ClassWithInitArgs, ResourcePool
17 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/.github/workflows/publish.yml:
--------------------------------------------------------------------------------
 1 | name: publish
 2 | 
 3 | on:
 4 |   workflow_dispatch:  # allows the workflow to be started manually
 5 |   release:
 6 |     types:
 7 |       - published  # also runs whenever a release is published
 8 | 
 9 | jobs:
10 |   publish:
11 |     name: Upload release to PyPI
12 | 
13 |     runs-on: ubuntu-latest
14 | 
15 |     environment:
16 |       name: release
17 |       url: https://pypi.org/p/llamafactory
18 | 
19 |     permissions:
20 |       id-token: write  # lets the job request an OIDC token; presumably for PyPI trusted publishing, since the publish step is given no API token -- confirm
21 | 
22 |     steps:
23 |       - name: Checkout
24 |         uses: actions/checkout@v4
25 | 
26 |       - name: Set up Python
27 |         uses: actions/setup-python@v5
28 |         with:
29 |           python-version: "3.9"
30 | 
31 |       - name: Build package  # NOTE(review): depends on a "build" target in the repo Makefile, which is not shown here
32 |         run: |
33 |           make build
34 | 
35 |       - name: Publish package  # no inputs are passed; the action's defaults decide what gets uploaded
36 |         uses: pypa/gh-action-pypi-publish@release/v1
37 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/chat/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .base_engine import BaseEngine
16 | from .chat_model import ChatModel
17 | 
18 | 
19 | __all__ = ["BaseEngine", "ChatModel"]
20 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/actor/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .base import BasePPOActor
16 | from .dp_actor import DataParallelPPOActor
17 | 
18 | __all__ = ["BasePPOActor", "DataParallelPPOActor"]
19 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/critic/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .base import BasePPOCritic
16 | from .dp_critic import DataParallelPPOCritic
17 | 
18 | __all__ = ["BasePPOCritic", "DataParallelPPOCritic"]
19 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/ego_r1/search/build_index.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | corpus_file=example/corpus.jsonl
 3 | save_dir=data
 4 | retriever_name=e5 # this is for indexing naming
 5 | retriever_model=intfloat/e5-base-v2
 6 | 
10 | # change faiss_type to HNSW32/64/128 for ANN indexing
11 | # change retriever_name to bm25 for BM25 indexing
12 | CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python index_builder.py \
14 |     --retrieval_method $retriever_name \
15 |     --model_path $retriever_model \
16 |     --corpus_path $corpus_file \
17 |     --save_dir $save_dir \
18 |     --use_fp16 \
19 |     --max_length 256 \
20 |     --batch_size 512 \
21 |     --pooling_method mean \
22 |     --faiss_type Flat \
23 |     --save_embedding
24 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/accelerate/fsdp_config.yaml:
--------------------------------------------------------------------------------
 1 | compute_environment: LOCAL_MACHINE
 2 | debug: false
 3 | distributed_type: FSDP
 4 | downcast_bf16: 'no'
 5 | fsdp_config:
 6 |   fsdp_auto_wrap_policy: TRANSFORMER_BASED_WRAP
 7 |   fsdp_backward_prefetch: BACKWARD_PRE
 8 |   fsdp_forward_prefetch: false
 9 |   fsdp_cpu_ram_efficient_loading: true
10 |   fsdp_offload_params: false
11 |   fsdp_sharding_strategy: FULL_SHARD
12 |   fsdp_state_dict_type: FULL_STATE_DICT
13 |   fsdp_sync_module_states: true
14 |   fsdp_use_orig_params: true
15 | machine_rank: 0
16 | main_training_function: main
17 | mixed_precision: bf16  # or fp16
18 | num_machines: 1  # the number of nodes
19 | num_processes: 2  # the number of GPUs in all nodes
20 | rdzv_backend: static
21 | same_network: true
22 | tpu_env: []
23 | tpu_use_cluster: false
24 | tpu_use_sudo: false
25 | use_cpu: false
26 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/launcher.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from llamafactory.train.tuner import run_exp  # use absolute import
16 | 
17 | 
def launch():
    """Start a run by delegating to ``run_exp`` with no arguments.

    Nothing is returned; whatever ``run_exp`` returns is discarded.
    """
    run_exp()
20 | 
21 | 
22 | if __name__ == "__main__":
23 |     launch()
24 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/.pre-commit-config.yaml:
--------------------------------------------------------------------------------
 1 | repos:
 2 | -   repo: https://github.com/pre-commit/pre-commit-hooks
 3 |     rev: v5.0.0
 4 |     hooks:
 5 |     -   id: check-ast
 6 |     -   id: check-added-large-files
 7 |         args: ['--maxkb=25000']
 8 |     -   id: check-merge-conflict
 9 |     -   id: check-yaml
10 |     -   id: debug-statements
11 |     -   id: end-of-file-fixer
12 |     -   id: trailing-whitespace
13 |         args: [--markdown-linebreak-ext=md]
14 |     -   id: no-commit-to-branch
15 |         args: ['--branch', 'main']
16 | 
17 | -   repo: https://github.com/asottile/pyupgrade
18 |     rev: v3.17.0
19 |     hooks:
20 |     -   id: pyupgrade
21 |         args: [--py38-plus]
22 | 
23 | -   repo: https://github.com/astral-sh/ruff-pre-commit
24 |     rev: v0.6.9
25 |     hooks:
26 |     -   id: ruff
27 |         args: [--fix]
28 |     -   id: ruff-format
29 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/rollout/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .base import BaseRollout
16 | from .naive import NaiveRollout
17 | from .hf_rollout import HFRollout
18 | 
19 | __all__ = ["BaseRollout", "NaiveRollout", "HFRollout"]
20 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/single_controller/ray/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .base import RayResourcePool, RayClassWithInitArgs, RayWorkerGroup, create_colocated_worker_cls
16 | from .megatron import (MegatronRayWorkerGroup, DistRankInfo, DistGlobalInfo)


--------------------------------------------------------------------------------
/api/visual_tools/configs.yaml:
--------------------------------------------------------------------------------
 1 | 
 2 | egolife:
 3 |   videollm:
 4 |     gemini_api_keys: ["your-gemini-api-key-1", "your-gemini-api-key-2","..."]
 5 |     data_dir: "/path/to/egolife"
 6 |     gemini_port: 8060
 7 |     llava_port: 8010
 8 |   vlm:
 9 |     data_dir: "/path/to/egolife"
10 |     vlm_port: 8080
11 | 
12 | videomme:
13 |   videollm:
14 |     gemini_api_keys: ["your-gemini-api-key-1", "your-gemini-api-key-2","..."]
15 |     data_dir: "/path/to/videomme"
16 |     gemini_port: 7060
17 |     llava_port: 7010
18 |   vlm:
19 |     data_dir: "/path/to/videomme"
20 |     vlm_port: 7080
21 | 
22 | egoschema:
23 |   videollm:
24 |     gemini_api_keys: ["your-gemini-api-key-1", "your-gemini-api-key-2","..."]
25 |     data_dir: "/path/to/egoschema"
26 |     gemini_port: 6060
27 |     llava_port: 6010
28 |   vlm:
29 |     data_dir: "/path/to/egoschema"
30 |     vlm_port: 6080
31 | 
32 | 
33 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/.env.local:
--------------------------------------------------------------------------------
 1 | # Note: .env files are not actually supported; this file is for reference only
 2 | # api
 3 | API_HOST=
 4 | API_PORT=
 5 | API_KEY=
 6 | API_MODEL_NAME=
 7 | API_VERBOSE=
 8 | FASTAPI_ROOT_PATH=
 9 | MAX_CONCURRENT=
10 | # general
11 | DISABLE_VERSION_CHECK=
12 | FORCE_CHECK_IMPORTS=
13 | ALLOW_EXTRA_ARGS=
14 | LLAMAFACTORY_VERBOSITY=
15 | USE_MODELSCOPE_HUB=
16 | USE_OPENMIND_HUB=
17 | USE_RAY=
18 | RECORD_VRAM=
19 | OPTIM_TORCH=
20 | NPU_JIT_COMPILE=
21 | # torchrun
22 | FORCE_TORCHRUN=
23 | MASTER_ADDR=
24 | MASTER_PORT=
25 | NNODES=
26 | NODE_RANK=
27 | NPROC_PER_NODE=
28 | # wandb
29 | WANDB_DISABLED=
30 | WANDB_PROJECT=
31 | WANDB_API_KEY=
32 | # gradio ui
33 | GRADIO_SHARE=
34 | GRADIO_SERVER_NAME=
35 | GRADIO_SERVER_PORT=
36 | GRADIO_ROOT_PATH=
37 | GRADIO_IPV6=
38 | # setup
39 | ENABLE_SHORT_CONSOLE=
40 | # reserved (do not use)
41 | LLAMABOARD_ENABLED=
42 | LLAMABOARD_WORKDIR=
43 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/dataset/README.md:
--------------------------------------------------------------------------------
 1 | # Dataset Format
 2 | ## RLHF dataset
 3 | We combine all the data sources into a single parquet file. We directly organize the prompt into the chat format so that multi-turn chats can be easily incorporated. In the prompt, we may add instruction-following text to guide the model to output the answers in a particular format so that we can extract the answers.
 4 | 
 5 | Math problems
 6 | ```json
 7 | {
 8 |     "data_source": "openai/gsm8k",
 9 |     "prompt": [{"role": "user", "content": "Natalia sold clips to 48 of her friends in April, and then she sold half as many clips in May. How many clips did Natalia sell altogether in April and May? Let's think step by step and output the final answer after \"####\""}],
10 |     "ability": "math",
11 |     "reward_model": {
12 |         "style": "rule",
13 |         "ground_truth": ["72"]
14 |     }
15 | }
16 | ```
17 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/accelerate/fsdp_config_offload.yaml:
--------------------------------------------------------------------------------
 1 | compute_environment: LOCAL_MACHINE
 2 | debug: false
 3 | distributed_type: FSDP
 4 | downcast_bf16: 'no'
 5 | fsdp_config:
 6 |   fsdp_auto_wrap_policy: TRANSFORMER_BASED_WRAP
 7 |   fsdp_backward_prefetch: BACKWARD_PRE
 8 |   fsdp_forward_prefetch: false
 9 |   fsdp_cpu_ram_efficient_loading: true
10 |   fsdp_offload_params: true  # offload may affect training speed
11 |   fsdp_sharding_strategy: FULL_SHARD
12 |   fsdp_state_dict_type: FULL_STATE_DICT
13 |   fsdp_sync_module_states: true
14 |   fsdp_use_orig_params: true
15 | machine_rank: 0
16 | main_training_function: main
17 | mixed_precision: bf16  # or fp16
18 | num_machines: 1  # the number of nodes
19 | num_processes: 2  # the number of GPUs in all nodes
20 | rdzv_backend: static
21 | same_network: true
22 | tpu_env: []
23 | tpu_use_cluster: false
24 | tpu_use_sudo: false
25 | use_cpu: false
26 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/train.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from llamafactory.train.tuner import run_exp
16 | 
17 | 
def main():
    """Script entry point: invoke ``run_exp`` with no arguments.

    Nothing is returned; whatever ``run_exp`` returns is discarded.
    """
    run_exp()
20 | 
21 | 
def _mp_fn(index):
    """Entry point used by xla_spawn (TPUs).

    ``index`` is accepted to satisfy the spawner's calling convention but is
    not used; the function simply invokes ``run_exp`` with no arguments.
    """
    run_exp()
25 | 
26 | 
27 | if __name__ == "__main__":
28 |     main()
29 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/single_controller/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
# Absolute path of the directory that contains this module.
version_folder = os.path.dirname(os.path.abspath(__file__))

# The package version is stored as text in ``version/version`` next to this
# module; surrounding whitespace (e.g. a trailing newline) is stripped.
with open(os.path.join(version_folder, 'version/version')) as f:
    __version__ = f.read().strip()
21 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/nlg_eval/llama3_lora_predict.yaml:
--------------------------------------------------------------------------------
 1 | # Batch generation can be SLOW with this config.
 2 | # For faster inference, we recommend using `scripts/vllm_infer.py`.
 3 | 
 4 | ### model
 5 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 6 | adapter_name_or_path: saves/llama3-8b/lora/sft
 7 | trust_remote_code: true
 8 | 
 9 | ### method
10 | stage: sft
11 | do_predict: true
12 | finetuning_type: lora
13 | 
14 | ### dataset
15 | eval_dataset: identity,alpaca_en_demo
16 | template: llama3
17 | cutoff_len: 2048
18 | max_samples: 50
19 | overwrite_cache: true
20 | preprocessing_num_workers: 16
21 | dataloader_num_workers: 4
22 | 
23 | ### output
24 | output_dir: saves/llama3-8b/lora/predict
25 | overwrite_output_dir: true
26 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
27 | 
28 | ### eval
29 | per_device_eval_batch_size: 1
30 | predict_with_generate: true
31 | ddp_timeout: 180000000
32 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/llama/megatron/layers/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .parallel_attention import ParallelLlamaAttention
16 | from .parallel_decoder import ParallelLlamaDecoderLayer, ParallelLlamaDecoderLayerRmPad
17 | from .parallel_mlp import ParallelLlamaMLP
18 | from .parallel_rmsnorm import ParallelLlamaRMSNorm
19 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/config.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from typing import Dict
16 | 
17 | from omegaconf import DictConfig
18 | 
19 | 
def update_dict_with_config(dictionary: Dict, config: DictConfig):
    """Overwrite values in ``dictionary`` with same-named attributes of ``config``.

    Only keys already present in ``dictionary`` are considered: for each key
    that ``config`` exposes as an attribute, the dictionary value is replaced
    by that attribute's value. Keys without a matching attribute are left
    untouched, and no new keys are added.

    Args:
        dictionary: Mapping to update; it is modified in place.
        config: Object whose attributes supply the replacement values.

    Returns:
        None.
    """
    for name in dictionary:
        if not hasattr(config, name):
            # No override provided for this key; keep the existing value.
            continue
        dictionary[name] = getattr(config, name)
24 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/trainer/config/generation.yaml:
--------------------------------------------------------------------------------
 1 | trainer:
 2 |   nnodes: 1
 3 |   n_gpus_per_node: 8
 4 | 
 5 | data:
 6 |   path: ~/data/rlhf/math/test.parquet
 7 |   prompt_key: prompt
 8 |   n_samples: 5
 9 |   output_path: /opt/tiger/math_Qwen2-7B-Instruct.parquet
10 |   batch_size: 128
11 | 
12 | model:
13 |   path: ~/models/Qwen2-7B-Instruct
14 |   external_lib: null
15 | rollout:
16 |   name: vllm
17 |   temperature: 1.0
18 |   top_k: 50 # 0 for hf rollout, -1 for vllm rollout
19 |   top_p: 0.7
20 |   prompt_length: 1536
21 |   response_length: 512
22 |   # for vllm rollout
23 |   dtype: bfloat16 # should align with FSDP
24 |   gpu_memory_utilization: 0.5
25 |   ignore_eos: False
26 |   micro_batch_size: 256
27 |   enforce_eager: True
28 |   free_cache_engine: True
29 |   load_format: dummy_dtensor
30 |   tensor_model_parallel_size: 1
31 |   max_num_batched_tokens: 8192
32 |   max_num_seqs: 1024
33 |   log_prob_micro_batch_size: 8
34 |   # for hf rollout
35 |   do_sample: True


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/logging_utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import logging
16 | 
17 | 
def set_basic_config(level):
    """Set the global logging format and level via ``logging.basicConfig``.

    Records are formatted as ``LEVEL:timestamp:message``. This is invoked
    when the ``verl`` package is imported.

    Args:
        level: Logging level forwarded to ``logging.basicConfig``.
    """
    log_format = '%(levelname)s:%(asctime)s:%(message)s'
    logging.basicConfig(level=level, format=log_format)
23 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/.github/workflows/label_issue.yml:
--------------------------------------------------------------------------------
 1 | name: label_issue
 2 | 
 3 | on:
 4 |   issues:
 5 |     types:
 6 |       - opened
 7 | 
 8 | jobs:
 9 |   label_issue:
10 |     runs-on: ubuntu-latest
11 | 
12 |     permissions:
13 |       issues: write
14 | 
15 |     steps:
16 |       - env:
17 |           GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
18 |           ISSUE_URL: ${{ github.event.issue.html_url }}
19 |           ISSUE_TITLE: ${{ github.event.issue.title }}
20 |         run: |
21 |           LABEL=""
22 |           NPU_KEYWORDS=(npu huawei ascend 华为 昇腾)
23 |           ISSUE_TITLE_LOWER=$(echo $ISSUE_TITLE | tr '[:upper:]' '[:lower:]')
24 |           for KEYWORD in ${NPU_KEYWORDS[@]}; do
25 |             if [[ $ISSUE_TITLE_LOWER == *$KEYWORD* ]] && [[ $ISSUE_TITLE_LOWER != *input* ]]; then
26 |               LABEL="npu"
27 |               break
28 |             fi
29 |           done
30 |           if [ -n "$LABEL" ]; then
31 |             gh issue edit $ISSUE_URL --add-label $LABEL
32 |           fi
33 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/ego_r1/search/retrieval.sh:
--------------------------------------------------------------------------------
 1 | 
 2 | DATA_NAME=nq
 3 | 
 4 | DATASET_PATH="/home/peterjin/mnt/data/$DATA_NAME"
 5 | 
 6 | SPLIT='test'
 7 | TOPK=3
 8 | 
 9 | INDEX_PATH=/home/peterjin/mnt/index/wiki-18
10 | CORPUS_PATH=/home/peterjin/mnt/data/retrieval-corpus/wiki-18.jsonl
11 | SAVE_NAME=e5_${TOPK}_wiki18.json
12 | 
13 | # INDEX_PATH=/home/peterjin/rm_retrieval_corpus/index/wiki-21
14 | # CORPUS_PATH=/home/peterjin/rm_retrieval_corpus/corpora/wiki/enwiki-dec2021/text-list-100-sec.jsonl
15 | # SAVE_NAME=e5_${TOPK}_wiki21.json
16 | 
17 | CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 python retrieval.py --retrieval_method e5 \
18 |                     --retrieval_topk $TOPK \
19 |                     --index_path $INDEX_PATH \
20 |                     --corpus_path $CORPUS_PATH \
21 |                     --dataset_path $DATASET_PATH \
22 |                     --data_split $SPLIT \
23 |                     --retrieval_model_path "intfloat/e5-base-v2" \
24 |                     --retrieval_pooling_method "mean" \
25 |                     --retrieval_batch_size 512 \
26 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
# Absolute path of the directory that contains this module.
version_folder = os.path.dirname(os.path.abspath(__file__))

# The package version is stored as text in ``version/version`` next to this
# module; surrounding whitespace (e.g. a trailing newline) is stripped.
with open(os.path.join(version_folder, 'version/version')) as f:
    __version__ = f.read().strip()
21 | 
22 | from .protocol import DataProto
23 | 
24 | from .utils.logging_utils import set_basic_config
25 | import logging
26 | 
27 | set_basic_config(level=logging.WARNING)
28 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_video_demo.json:
--------------------------------------------------------------------------------
 1 | [
 2 |   {
 3 |     "messages": [
 4 |       {
 5 |         "content": "<video>Why is this video funny?",
 6 |         "role": "user"
 7 |       },
 8 |       {
 9 |         "content": "Because a baby is reading, and he is so cute!",
10 |         "role": "assistant"
11 |       }
12 |     ],
13 |     "videos": [
14 |       "mllm_demo_data/1.mp4"
15 |     ]
16 |   },
17 |   {
18 |     "messages": [
19 |       {
20 |         "content": "<video>What is she doing?",
21 |         "role": "user"
22 |       },
23 |       {
24 |         "content": "She is cooking.",
25 |         "role": "assistant"
26 |       }
27 |     ],
28 |     "videos": [
29 |       "mllm_demo_data/2.avi"
30 |     ]
31 |   },
32 |   {
33 |     "messages": [
34 |       {
35 |         "content": "<video>What's in the video?",
36 |         "role": "user"
37 |       },
38 |       {
39 |         "content": "A baby is playing in the living room.",
40 |         "role": "assistant"
41 |       }
42 |     ],
43 |     "videos": [
44 |       "mllm_demo_data/3.mp4"
45 |     ]
46 |   }
47 | ]
48 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/llama/megatron/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .modeling_llama_megatron import (
16 |     # original model with megatron
17 |     ParallelLlamaModel,
18 |     ParallelLlamaForCausalLM,
19 |     # rmpad with megatron
20 |     ParallelLlamaForCausalLMRmPad,
21 |     ParallelLlamaForValueRmPad,
22 |     # rmpad with megatron and pipeline parallelism
23 |     ParallelLlamaForCausalLMRmPadPP,
24 |     ParallelLlamaForValueRmPadPP)
25 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/muon/qwen2_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2-1.5B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | use_muon: true
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: qwen
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | dataloader_num_workers: 4
19 | 
20 | ### output
21 | output_dir: saves/qwen2-1_5b/full/sft
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | save_only_model: false
27 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
28 | 
29 | ### train
30 | per_device_train_batch_size: 1
31 | gradient_accumulation_steps: 8
32 | learning_rate: 1.0e-5
33 | num_train_epochs: 3.0
34 | lr_scheduler_type: cosine
35 | warmup_ratio: 0.1
36 | bf16: true
37 | ddp_timeout: 180000000
38 | 
39 | ### eval
40 | # val_size: 0.1
41 | # per_device_eval_batch_size: 1
42 | # eval_strategy: steps
43 | # eval_steps: 500
44 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_ppo.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | reward_model: saves/llama3-8b/lora/reward
 4 | trust_remote_code: true
 5 | 
 6 | ### method
 7 | stage: ppo
 8 | do_train: true
 9 | finetuning_type: lora
10 | lora_rank: 8
11 | lora_target: all
12 | 
13 | ### dataset
14 | dataset: identity,alpaca_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | dataloader_num_workers: 4
21 | 
22 | ### output
23 | output_dir: saves/llama3-8b/lora/ppo
24 | logging_steps: 10
25 | save_steps: 500
26 | plot_loss: true
27 | overwrite_output_dir: true
28 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
29 | 
30 | ### train
31 | per_device_train_batch_size: 1
32 | gradient_accumulation_steps: 8
33 | learning_rate: 1.0e-5
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | bf16: true
38 | ddp_timeout: 180000000
39 | 
40 | ### generate
41 | max_new_tokens: 512
42 | top_k: 0
43 | top_p: 0.9
44 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/adam_mini/qwen2_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2-1.5B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | use_adam_mini: true
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: qwen
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | dataloader_num_workers: 4
19 | 
20 | ### output
21 | output_dir: saves/qwen2-1_5b/full/sft
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | save_only_model: false
27 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
28 | 
29 | ### train
30 | per_device_train_batch_size: 1
31 | gradient_accumulation_steps: 8
32 | learning_rate: 1.0e-5
33 | num_train_epochs: 3.0
34 | lr_scheduler_type: cosine
35 | warmup_ratio: 0.1
36 | bf16: true
37 | ddp_timeout: 180000000
38 | 
39 | ### eval
40 | # val_size: 0.1
41 | # per_device_eval_batch_size: 1
42 | # eval_strategy: steps
43 | # eval_steps: 500
44 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_kto.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: kto
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | pref_beta: 0.1
12 | 
13 | ### dataset
14 | dataset: kto_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | dataloader_num_workers: 4
21 | 
22 | ### output
23 | output_dir: saves/llama3-8b/lora/kto
24 | logging_steps: 10
25 | save_steps: 500
26 | plot_loss: true
27 | overwrite_output_dir: true
28 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
29 | 
30 | ### train
31 | per_device_train_batch_size: 1
32 | gradient_accumulation_steps: 8
33 | learning_rate: 5.0e-6
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | bf16: true
38 | ddp_timeout: 180000000
39 | 
40 | ### eval
41 | # val_size: 0.1
42 | # per_device_eval_batch_size: 1
43 | # eval_strategy: steps
44 | # eval_steps: 500
45 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_sft.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | set -x
 4 | 
 5 | MODEL_PATH=meta-llama/Meta-Llama-3-8B-Instruct
 6 | 
 7 | llamafactory-cli train \
 8 |     --model_name_or_path ${MODEL_PATH} \
 9 |     --trust_remote_code \
10 |     --stage sft \
11 |     --do_train \
12 |     --finetuning_type lora \
13 |     --lora_rank 8 \
14 |     --lora_target all \
15 |     --dataset identity,alpaca_en_demo \
16 |     --template llama3 \
17 |     --cutoff_len 2048 \
18 |     --max_samples 1000 \
19 |     --overwrite_cache \
20 |     --preprocessing_num_workers 16 \
21 |     --dataloader_num_workers 4 \
22 |     --output_dir saves/llama3-8b/lora/sft \
23 |     --logging_steps 10 \
24 |     --save_steps 500 \
25 |     --plot_loss \
26 |     --overwrite_output_dir \
27 |     --save_only_model false \
28 |     --report_to none \
29 |     --per_device_train_batch_size 1 \
30 |     --gradient_accumulation_steps 8 \
31 |     --learning_rate 1e-4 \
32 |     --num_train_epochs 3.0 \
33 |     --lr_scheduler_type cosine \
34 |     --warmup_ratio 0.1 \
35 |     --bf16 \
36 |     --ddp_timeout 180000000
37 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/single_controller/base/register_center/ray.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import ray
16 | 
17 | 
@ray.remote
class WorkerGroupRegisterCenter:
    """Ray actor that keeps a single ``rank_zero_info`` value and returns it on request."""

    def __init__(self, rank_zero_info):
        """Store ``rank_zero_info`` on the actor.

        Args:
            rank_zero_info: Value to keep; it is stored as given and not inspected here.
        """
        self.rank_zero_info = rank_zero_info

    def get_rank_zero_info(self):
        """Return the ``rank_zero_info`` value supplied at construction."""
        return self.rank_zero_info
26 | 
27 | 
def create_worker_group_register_center(name, info):
    """Create a ``WorkerGroupRegisterCenter`` actor registered under ``name``.

    Args:
        name: Name handed to the actor class via ``options(name=...)``.
        info: Value forwarded to the actor constructor as ``rank_zero_info``.

    Returns:
        The result of ``.remote(info)`` on the named actor class.
    """
    named_center_cls = WorkerGroupRegisterCenter.options(name=name)
    return named_center_cls.remote(info)
30 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/docker/docker-npu/docker-compose.yml:
--------------------------------------------------------------------------------
 1 | services:
 2 |   llamafactory:
 3 |     build:
 4 |       dockerfile: ./docker/docker-npu/Dockerfile
 5 |       context: ../..
 6 |       args:
 7 |         INSTALL_DEEPSPEED: "false"
 8 |         PIP_INDEX: https://pypi.org/simple
 9 |     container_name: llamafactory
10 |     volumes:
11 |       - ../../hf_cache:/root/.cache/huggingface
12 |       - ../../ms_cache:/root/.cache/modelscope
13 |       - ../../om_cache:/root/.cache/openmind
14 |       - ../../data:/app/data
15 |       - ../../output:/app/output
16 |       - /usr/local/dcmi:/usr/local/dcmi
17 |       - /usr/local/bin/npu-smi:/usr/local/bin/npu-smi
18 |       - /usr/local/Ascend/driver:/usr/local/Ascend/driver
19 |       - /etc/ascend_install.info:/etc/ascend_install.info
20 |     ports:
21 |       - "7860:7860"
22 |       - "8000:8000"
23 |     ipc: host
24 |     tty: true
25 |     shm_size: "16gb"
26 |     stdin_open: true
27 |     command: bash
28 |     devices:
29 |       - /dev/davinci0
30 |       - /dev/davinci_manager
31 |       - /dev/devmm_svm
32 |       - /dev/hisi_hdc
33 |     restart: unless-stopped
34 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_audio_demo.json:
--------------------------------------------------------------------------------
 1 | [
 2 |   {
 3 |     "messages": [
 4 |       {
 5 |         "content": "<audio>What's that sound?",
 6 |         "role": "user"
 7 |       },
 8 |       {
 9 |         "content": "It is the sound of glass shattering.",
10 |         "role": "assistant"
11 |       }
12 |     ],
13 |     "audios": [
14 |       "mllm_demo_data/1.mp3"
15 |     ]
16 |   },
17 |   {
18 |     "messages": [
19 |       {
20 |         "content": "<audio>What can you hear?",
21 |         "role": "user"
22 |       },
23 |       {
24 |         "content": "A woman is coughing.",
25 |         "role": "assistant"
26 |       }
27 |     ],
28 |     "audios": [
29 |       "mllm_demo_data/2.wav"
30 |     ]
31 |   },
32 |   {
33 |     "messages": [
34 |       {
35 |         "content": "<audio>What does the person say?",
36 |         "role": "user"
37 |       },
38 |       {
39 |         "content": "Mister Quiller is the apostle of the middle classes and we are glad to welcome his gospel.",
40 |         "role": "assistant"
41 |       }
42 |     ],
43 |     "audios": [
44 |       "mllm_demo_data/3.flac"
45 |     ]
46 |   }
47 | ]
48 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_awq.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: TechxGenus/Meta-Llama-3-8B-Instruct-AWQ
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | dataloader_num_workers: 4
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b/lora/sft
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | save_only_model: false
28 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
29 | 
30 | ### train
31 | per_device_train_batch_size: 1
32 | gradient_accumulation_steps: 8
33 | learning_rate: 1.0e-4
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | bf16: true
38 | ddp_timeout: 180000000
39 | 
40 | ### eval
41 | # val_size: 0.1
42 | # per_device_eval_batch_size: 1
43 | # eval_strategy: steps
44 | # eval_steps: 500
45 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_gptq.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: TechxGenus/Meta-Llama-3-8B-Instruct-GPTQ
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | dataloader_num_workers: 4
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b/lora/sft
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | save_only_model: false
28 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
29 | 
30 | ### train
31 | per_device_train_batch_size: 1
32 | gradient_accumulation_steps: 8
33 | learning_rate: 1.0e-4
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | bf16: true
38 | ddp_timeout: 180000000
39 | 
40 | ### eval
41 | # val_size: 0.1
42 | # per_device_eval_batch_size: 1
43 | # eval_strategy: steps
44 | # eval_steps: 500
45 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/webui/components/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .chatbot import create_chat_box
16 | from .eval import create_eval_tab
17 | from .export import create_export_tab
18 | from .infer import create_infer_tab
19 | from .top import create_top
20 | from .train import create_train_tab
21 | 
22 | 
23 | __all__ = [
24 |     "create_chat_box",
25 |     "create_eval_tab",
26 |     "create_export_tab",
27 |     "create_infer_tab",
28 |     "create_top",
29 |     "create_train_tab",
30 | ]
31 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_aqlm.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: ISTA-DASLab/Meta-Llama-3-8B-Instruct-AQLM-2Bit-1x16
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | dataloader_num_workers: 4
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b/lora/sft
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | save_only_model: false
28 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
29 | 
30 | ### train
31 | per_device_train_batch_size: 1
32 | gradient_accumulation_steps: 8
33 | learning_rate: 1.0e-4
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | bf16: true
38 | ddp_timeout: 180000000
39 | 
40 | ### eval
41 | # val_size: 0.1
42 | # per_device_eval_batch_size: 1
43 | # eval_strategy: steps
44 | # eval_steps: 500
45 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/model/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .loader import load_config, load_model, load_tokenizer
16 | from .model_utils.misc import find_all_linear_modules
17 | from .model_utils.quantization import QuantizationMethod
18 | from .model_utils.valuehead import load_valuehead_params
19 | 
20 | 
21 | __all__ = [
22 |     "QuantizationMethod",
23 |     "find_all_linear_modules",
24 |     "load_config",
25 |     "load_model",
26 |     "load_tokenizer",
27 |     "load_valuehead_params",
28 | ]
29 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/fsdp_qlora/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | quantization_bit: 4
 4 | trust_remote_code: true
 5 | 
 6 | ### method
 7 | stage: sft
 8 | do_train: true
 9 | finetuning_type: lora
10 | lora_rank: 8
11 | lora_target: all
12 | 
13 | ### dataset
14 | dataset: identity,alpaca_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | dataloader_num_workers: 4
21 | 
22 | ### output
23 | output_dir: saves/llama3-8b/lora/sft
24 | logging_steps: 10
25 | save_steps: 500
26 | plot_loss: true
27 | overwrite_output_dir: true
28 | save_only_model: false
29 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
30 | 
31 | ### train
32 | per_device_train_batch_size: 1
33 | gradient_accumulation_steps: 8
34 | learning_rate: 1.0e-4
35 | num_train_epochs: 3.0
36 | lr_scheduler_type: cosine
37 | warmup_ratio: 0.1
38 | bf16: true
39 | ddp_timeout: 180000000
40 | 
41 | ### eval
42 | # val_size: 0.1
43 | # per_device_eval_batch_size: 1
44 | # eval_strategy: steps
45 | # eval_steps: 500
46 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/mod/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | mixture_of_depths: convert
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | dataloader_num_workers: 4
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b-mod/full/sft
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | save_only_model: false
27 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
28 | 
29 | ### train
30 | per_device_train_batch_size: 1
31 | gradient_accumulation_steps: 8
32 | optim: paged_adamw_8bit
33 | learning_rate: 1.0e-5
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | pure_bf16: true
38 | ddp_timeout: 180000000
39 | 
40 | ### eval
41 | # val_size: 0.1
42 | # per_device_eval_batch_size: 1
43 | # eval_strategy: steps
44 | # eval_steps: 500
45 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/loraplus/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | loraplus_lr_ratio: 16.0
12 | 
13 | ### dataset
14 | dataset: identity,alpaca_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | dataloader_num_workers: 4
21 | 
22 | ### output
23 | output_dir: saves/llama3-8b/lora/sft
24 | logging_steps: 10
25 | save_steps: 500
26 | plot_loss: true
27 | overwrite_output_dir: true
28 | save_only_model: false
29 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
30 | 
31 | ### train
32 | per_device_train_batch_size: 1
33 | gradient_accumulation_steps: 8
34 | learning_rate: 1.0e-4
35 | num_train_epochs: 3.0
36 | lr_scheduler_type: cosine
37 | warmup_ratio: 0.1
38 | bf16: true
39 | ddp_timeout: 180000000
40 | 
41 | ### eval
42 | # val_size: 0.1
43 | # per_device_eval_batch_size: 1
44 | # eval_strategy: steps
45 | # eval_steps: 500
46 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_pretrain.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: pt
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: c4_demo
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | dataloader_num_workers: 4
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b/lora/pretrain
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | save_only_model: false
27 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
28 | 
29 | ### train
30 | per_device_train_batch_size: 1
31 | gradient_accumulation_steps: 8
32 | learning_rate: 1.0e-4
33 | num_train_epochs: 3.0
34 | lr_scheduler_type: cosine
35 | warmup_ratio: 0.1
36 | bf16: true
37 | ddp_timeout: 180000000
38 | resume_from_checkpoint: null
39 | 
40 | ### eval
41 | # eval_dataset: c4_demo
42 | # val_size: 0.1
43 | # per_device_eval_batch_size: 1
44 | # eval_strategy: steps
45 | # eval_steps: 500
46 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/sharding_manager/base.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | """
15 | Sharding manager to implement HybridEngine
16 | """
17 | 
18 | from verl import DataProto
19 | 
20 | 
class BaseShardingManager:
    """No-op sharding manager usable as a context manager.

    Entering and leaving the context do nothing, and both data hooks hand
    their argument back untouched.
    """

    def __enter__(self):
        """Enter the context; performs no work and yields ``None``."""
        return None

    def __exit__(self, exc_type, exc_value, traceback):
        """Leave the context; performs no work.

        Returns ``None``, so an exception raised inside the ``with`` body is
        not suppressed.
        """
        return None

    def preprocess_data(self, data: DataProto) -> DataProto:
        """Return ``data`` unchanged."""
        return data

    def postprocess_data(self, data: DataProto) -> DataProto:
        """Return ``data`` unchanged."""
        return data
34 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/docker/docker-cuda/docker-compose.yml:
--------------------------------------------------------------------------------
 1 | services:
 2 |   llamafactory:
 3 |     build:
 4 |       dockerfile: ./docker/docker-cuda/Dockerfile
 5 |       context: ../..
 6 |       args:
 7 |         INSTALL_BNB: "false"
 8 |         INSTALL_VLLM: "false"
 9 |         INSTALL_DEEPSPEED: "false"
10 |         INSTALL_FLASHATTN: "false"
11 |         INSTALL_LIGER_KERNEL: "false"
12 |         INSTALL_HQQ: "false"
13 |         INSTALL_EETQ: "false"
14 |         PIP_INDEX: https://pypi.org/simple
15 |     container_name: llamafactory
16 |     volumes:
17 |       - ../../hf_cache:/root/.cache/huggingface
18 |       - ../../ms_cache:/root/.cache/modelscope
19 |       - ../../om_cache:/root/.cache/openmind
20 |       - ../../data:/app/data
21 |       - ../../output:/app/output
22 |     ports:
23 |       - "7860:7860"
24 |       - "8000:8000"
25 |     ipc: host
26 |     tty: true
27 |     shm_size: "16gb"
28 |     stdin_open: true
29 |     command: bash
30 |     deploy:
31 |       resources:
32 |         reservations:
33 |           devices:
34 |           - driver: nvidia
35 |             count: "all"
36 |             capabilities: [gpu]
37 |     restart: unless-stopped
38 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/docker/docker-rocm/docker-compose.yml:
--------------------------------------------------------------------------------
 1 | services:
 2 |   llamafactory:
 3 |     build:
 4 |       dockerfile: ./docker/docker-rocm/Dockerfile
 5 |       context: ../..
 6 |       args:
 7 |         INSTALL_BNB: "false"
 8 |         INSTALL_VLLM: "false"
 9 |         INSTALL_DEEPSPEED: "false"
10 |         INSTALL_FLASHATTN: "false"
11 |         INSTALL_LIGER_KERNEL: "false"
12 |         INSTALL_PYTORCH: "true"
13 |         INSTALL_HQQ: "false"
14 |         PIP_INDEX: https://pypi.org/simple
15 |         PYTORCH_INDEX: https://download.pytorch.org/whl/nightly/rocm6.3
16 |     container_name: llamafactory
17 |     volumes:
18 |       - ../../hf_cache:/root/.cache/huggingface
19 |       - ../../ms_cache:/root/.cache/modelscope
20 |       - ../../om_cache:/root/.cache/openmind
21 |       - ../../data:/app/data
22 |       - ../../output:/app/output
23 |       - ../../saves:/app/saves
24 |     ports:
25 |       - "7860:7860"
26 |       - "8000:8000"
27 |     ipc: host
28 |     tty: true
29 |     shm_size: "16gb"
30 |     stdin_open: true
31 |     command: bash
32 |     devices:
33 |       - /dev/kfd:/dev/kfd
34 |       - /dev/dri:/dev/dri
35 |     restart: unless-stopped
36 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/llama_pro/llama3_freeze_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: models/llama3-8b-pro
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: freeze
 9 | freeze_trainable_layers: 8
10 | freeze_trainable_modules: all
11 | use_llama_pro: true
12 | 
13 | ### dataset
14 | dataset: identity,alpaca_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | dataloader_num_workers: 4
21 | 
22 | ### output
23 | output_dir: saves/llama3-8b-pro/freeze/sft
24 | logging_steps: 10
25 | save_steps: 500
26 | plot_loss: true
27 | overwrite_output_dir: true
28 | save_only_model: false
29 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
30 | 
31 | ### train
32 | per_device_train_batch_size: 1
33 | gradient_accumulation_steps: 8
34 | learning_rate: 1.0e-4
35 | num_train_epochs: 3.0
36 | lr_scheduler_type: cosine
37 | warmup_ratio: 0.1
38 | bf16: true
39 | ddp_timeout: 180000000
40 | 
41 | ### eval
42 | # val_size: 0.1
43 | # per_device_eval_batch_size: 1
44 | # eval_strategy: steps
45 | # eval_steps: 500
46 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_reward.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: rm
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: dpo_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | dataloader_num_workers: 4
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b/lora/reward
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | save_only_model: false
28 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
29 | 
30 | ### train
31 | per_device_train_batch_size: 1
32 | gradient_accumulation_steps: 8
33 | learning_rate: 1.0e-4
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | bf16: true
38 | ddp_timeout: 180000000
39 | resume_from_checkpoint: null
40 | 
41 | ### eval
42 | # eval_dataset: dpo_en_demo
43 | # val_size: 0.1
44 | # per_device_eval_batch_size: 1
45 | # eval_strategy: steps
46 | # eval_steps: 500
47 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/pissa/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | pissa_init: true
12 | pissa_iter: 16
13 | pissa_convert: true
14 | 
15 | ### dataset
16 | dataset: identity,alpaca_en_demo
17 | template: llama3
18 | cutoff_len: 2048
19 | max_samples: 1000
20 | overwrite_cache: true
21 | preprocessing_num_workers: 16
22 | dataloader_num_workers: 4
23 | 
24 | ### output
25 | output_dir: saves/llama3-8b/lora/sft
26 | logging_steps: 10
27 | save_steps: 500
28 | plot_loss: true
29 | overwrite_output_dir: true
30 | save_only_model: false
31 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
32 | 
33 | ### train
34 | per_device_train_batch_size: 1
35 | gradient_accumulation_steps: 8
36 | learning_rate: 1.0e-4
37 | num_train_epochs: 3.0
38 | lr_scheduler_type: cosine
39 | warmup_ratio: 0.1
40 | bf16: true
41 | ddp_timeout: 180000000
42 | 
43 | ### eval
44 | # val_size: 0.1
45 | # per_device_eval_batch_size: 1
46 | # eval_strategy: steps
47 | # eval_steps: 500
48 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | template: llama3
15 | cutoff_len: 2048
16 | max_samples: 1000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | dataloader_num_workers: 4
20 | 
21 | ### output
22 | output_dir: saves/llama3-8b/lora/sft
23 | logging_steps: 10
24 | save_steps: 500
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | save_only_model: false
28 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
29 | 
30 | ### train
31 | per_device_train_batch_size: 1
32 | gradient_accumulation_steps: 8
33 | learning_rate: 1.0e-4
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | bf16: true
38 | ddp_timeout: 180000000
39 | resume_from_checkpoint: null
40 | 
41 | ### eval
42 | # eval_dataset: alpaca_en_demo
43 | # val_size: 0.1
44 | # per_device_eval_batch_size: 1
45 | # eval_strategy: steps
46 | # eval_steps: 500
47 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | r"""Efficient fine-tuning of large language models.
16 | 
17 | Level:
18 |   api, webui > chat, eval, train > data, model > hparams > extras
19 | 
20 | Disable version checking: DISABLE_VERSION_CHECK=1
21 | Enable VRAM recording: RECORD_VRAM=1
22 | Force using torchrun: FORCE_TORCHRUN=1
23 | Set logging verbosity: LLAMAFACTORY_VERBOSITY=WARN
24 | Use modelscope: USE_MODELSCOPE_HUB=1
25 | Use openmind: USE_OPENMIND_HUB=1
26 | """
27 | 
28 | from .extras.env import VERSION
29 | 
30 | 
31 | __version__ = VERSION
32 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/api.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import uvicorn
18 | 
19 | from llamafactory.api.app import create_app
20 | from llamafactory.chat import ChatModel
21 | 
22 | 
def main():
    """Build the API app around a ``ChatModel`` and serve it with uvicorn.

    The bind host is read from the ``API_HOST`` environment variable
    (default ``"0.0.0.0"``) and the port from ``API_PORT`` (default
    ``"8000"``, converted to ``int``). A hint pointing at the ``/docs``
    page is printed before the server starts.
    """
    # The model is constructed before the environment is read, so a bad
    # API_PORT value only surfaces after model construction.
    app = create_app(ChatModel())
    api_host = os.environ.get("API_HOST", "0.0.0.0")
    api_port = int(os.environ.get("API_PORT", "8000"))
    print(f"Visit http://localhost:{api_port}/docs for API document.")
    uvicorn.run(app, host=api_host, port=api_port)
30 | 
31 | 
32 | if __name__ == "__main__":
33 |     main()
34 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_bnb_npu.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | quantization_bit: 4
 4 | quantization_method: bnb
 5 | double_quantization: false
 6 | trust_remote_code: true
 7 | 
 8 | ### method
 9 | stage: sft
10 | do_train: true
11 | finetuning_type: lora
12 | lora_rank: 8
13 | lora_target: all
14 | 
15 | ### dataset
16 | dataset: identity,alpaca_en_demo
17 | template: llama3
18 | cutoff_len: 2048
19 | max_samples: 1000
20 | overwrite_cache: true
21 | preprocessing_num_workers: 16
22 | dataloader_num_workers: 4
23 | 
24 | ### output
25 | output_dir: saves/llama3-8b/lora/sft
26 | logging_steps: 10
27 | save_steps: 500
28 | plot_loss: true
29 | overwrite_output_dir: true
30 | save_only_model: false
31 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
32 | 
33 | ### train
34 | per_device_train_batch_size: 1
35 | gradient_accumulation_steps: 8
36 | learning_rate: 1.0e-4
37 | num_train_epochs: 3.0
38 | lr_scheduler_type: cosine
39 | warmup_ratio: 0.1
40 | bf16: true
41 | ddp_timeout: 180000000
42 | 
43 | ### eval
44 | # val_size: 0.1
45 | # per_device_eval_batch_size: 1
46 | # eval_strategy: steps
47 | # eval_steps: 500
48 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/badam/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | use_badam: true
10 | badam_mode: layer
11 | badam_switch_mode: ascending
12 | badam_switch_interval: 50
13 | badam_verbose: 2
14 | # deepspeed: examples/deepspeed/ds_z3_config.json
15 | 
16 | ### dataset
17 | dataset: identity,alpaca_en_demo
18 | template: llama3
19 | cutoff_len: 2048
20 | max_samples: 1000
21 | overwrite_cache: true
22 | preprocessing_num_workers: 16
23 | dataloader_num_workers: 4
24 | 
25 | ### output
26 | output_dir: saves/llama3-8b/full/sft
27 | logging_steps: 10
28 | save_steps: 500
29 | plot_loss: true
30 | overwrite_output_dir: true
31 | save_only_model: false
32 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
33 | 
34 | ### train
35 | per_device_train_batch_size: 1
36 | gradient_accumulation_steps: 8
37 | learning_rate: 1.0e-5
38 | num_train_epochs: 3.0
39 | lr_scheduler_type: cosine
40 | warmup_ratio: 0.1
41 | 
42 | ### eval
43 | # val_size: 0.1
44 | # per_device_eval_batch_size: 1
45 | # eval_strategy: steps
46 | # eval_steps: 500
47 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/qwen2vl_lora_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2.5-VL-7B-Instruct
 3 | image_max_pixels: 262144
 4 | video_max_pixels: 16384
 5 | trust_remote_code: true
 6 | 
 7 | ### method
 8 | stage: sft
 9 | do_train: true
10 | finetuning_type: lora
11 | lora_rank: 8
12 | lora_target: all
13 | 
14 | ### dataset
15 | dataset: mllm_demo,identity,alpaca_en_demo  # video: mllm_video_demo
16 | template: qwen2_vl
17 | cutoff_len: 2048
18 | max_samples: 1000
19 | overwrite_cache: true
20 | preprocessing_num_workers: 16
21 | dataloader_num_workers: 4
22 | 
23 | ### output
24 | output_dir: saves/qwen2_vl-7b/lora/sft
25 | logging_steps: 10
26 | save_steps: 500
27 | plot_loss: true
28 | overwrite_output_dir: true
29 | save_only_model: false
30 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
31 | 
32 | ### train
33 | per_device_train_batch_size: 1
34 | gradient_accumulation_steps: 8
35 | learning_rate: 1.0e-4
36 | num_train_epochs: 3.0
37 | lr_scheduler_type: cosine
38 | warmup_ratio: 0.1
39 | bf16: true
40 | ddp_timeout: 180000000
41 | resume_from_checkpoint: null
42 | 
43 | ### eval
44 | # val_size: 0.1
45 | # per_device_eval_batch_size: 1
46 | # eval_strategy: steps
47 | # eval_steps: 500
48 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_dpo.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: dpo
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | pref_beta: 0.1
12 | pref_loss: sigmoid  # choices: [sigmoid (dpo), orpo, simpo]
13 | 
14 | ### dataset
15 | dataset: dpo_en_demo
16 | template: llama3
17 | cutoff_len: 2048
18 | max_samples: 1000
19 | overwrite_cache: true
20 | preprocessing_num_workers: 16
21 | dataloader_num_workers: 4
22 | 
23 | ### output
24 | output_dir: saves/llama3-8b/lora/dpo
25 | logging_steps: 10
26 | save_steps: 500
27 | plot_loss: true
28 | overwrite_output_dir: true
29 | save_only_model: false
30 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
31 | 
32 | ### train
33 | per_device_train_batch_size: 1
34 | gradient_accumulation_steps: 8
35 | learning_rate: 5.0e-6
36 | num_train_epochs: 3.0
37 | lr_scheduler_type: cosine
38 | warmup_ratio: 0.1
39 | bf16: true
40 | ddp_timeout: 180000000
41 | resume_from_checkpoint: null
42 | 
43 | ### eval
44 | # eval_dataset: dpo_en_demo
45 | # val_size: 0.1
46 | # per_device_eval_batch_size: 1
47 | # eval_strategy: steps
48 | # eval_steps: 500
49 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_qlora/llama3_lora_sft_otfq.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | quantization_bit: 4  # choices: [8 (bnb/hqq/eetq), 4 (bnb/hqq), 3 (hqq), 2 (hqq)]
 4 | quantization_method: bnb  # choices: [bnb, hqq, eetq]
 5 | trust_remote_code: true
 6 | 
 7 | ### method
 8 | stage: sft
 9 | do_train: true
10 | finetuning_type: lora
11 | lora_rank: 8
12 | lora_target: all
13 | 
14 | ### dataset
15 | dataset: identity,alpaca_en_demo
16 | template: llama3
17 | cutoff_len: 2048
18 | max_samples: 1000
19 | overwrite_cache: true
20 | preprocessing_num_workers: 16
21 | dataloader_num_workers: 4
22 | 
23 | ### output
24 | output_dir: saves/llama3-8b/lora/sft
25 | logging_steps: 10
26 | save_steps: 500
27 | plot_loss: true
28 | overwrite_output_dir: true
29 | save_only_model: false
30 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
31 | 
32 | ### train
33 | per_device_train_batch_size: 1
34 | gradient_accumulation_steps: 8
35 | learning_rate: 1.0e-4
36 | num_train_epochs: 3.0
37 | lr_scheduler_type: cosine
38 | warmup_ratio: 0.1
39 | bf16: true
40 | ddp_timeout: 180000000
41 | 
42 | ### eval
43 | # val_size: 0.1
44 | # per_device_eval_batch_size: 1
45 | # eval_strategy: steps
46 | # eval_steps: 500
47 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/weight_loader_registry.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | 
def get_weight_loader(arch: str):
    """Return the Megatron weight-loading function registered for ``arch``.

    Args:
        arch: Model architecture name, e.g. ``'LlamaForCausalLM'``.

    Returns:
        The loader callable mapped to ``arch`` in the registry.

    Raises:
        ValueError: If ``arch`` has no entry in the registry.
    """
    # The loader is imported at call time rather than at module import time.
    from verl.models.llama.megatron.checkpoint_utils.llama_loader import load_state_dict_to_megatron_llama

    loaders = {'LlamaForCausalLM': load_state_dict_to_megatron_llama}

    loader = loaders.get(arch)
    if loader is None:
        raise ValueError(f"Model architectures {arch} are not supported for now. "
                         f"Supported architectures: {loaders.keys()}")
    return loader
24 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/distributed.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | """Utilities for distributed training."""
15 | import os
16 | 
17 | 
def initialize_global_process_group(timeout_second=36000):
    """Initialise the default ``nccl`` process group and select this process's CUDA device.

    The ranks and world size are read from the ``LOCAL_RANK``, ``RANK`` and
    ``WORLD_SIZE`` environment variables.

    Args:
        timeout_second: Timeout, in seconds, passed to ``init_process_group``.

    Returns:
        A ``(local_rank, rank, world_size)`` tuple of ints.

    Raises:
        KeyError: If one of the three environment variables is not set.
    """
    from datetime import timedelta

    import torch.distributed

    torch.distributed.init_process_group('nccl', timeout=timedelta(seconds=timeout_second))

    # Read in the same order as the variables are returned.
    local_rank, rank, world_size = (int(os.environ[key]) for key in ("LOCAL_RANK", "RANK", "WORLD_SIZE"))

    if torch.distributed.is_initialized():
        torch.cuda.set_device(local_rank)
    return local_rank, rank, world_size
29 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_full/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
10 | 
11 | ### dataset
12 | dataset: identity,alpaca_en_demo
13 | template: llama3
14 | cutoff_len: 2048
15 | max_samples: 1000
16 | overwrite_cache: true
17 | preprocessing_num_workers: 16
18 | dataloader_num_workers: 4
19 | 
20 | ### output
21 | output_dir: saves/llama3-8b/full/sft
22 | logging_steps: 10
23 | save_steps: 500
24 | plot_loss: true
25 | overwrite_output_dir: true
26 | save_only_model: false
27 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
28 | 
29 | ### train
30 | per_device_train_batch_size: 1
31 | gradient_accumulation_steps: 2
32 | learning_rate: 1.0e-5
33 | num_train_epochs: 3.0
34 | lr_scheduler_type: cosine
35 | warmup_ratio: 0.1
36 | bf16: true
37 | ddp_timeout: 180000000
38 | resume_from_checkpoint: null
39 | 
40 | ### eval
41 | # eval_dataset: alpaca_en_demo
42 | # val_size: 0.1
43 | # per_device_eval_batch_size: 1
44 | # eval_strategy: steps
45 | # eval_steps: 500
46 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/qwen2vl_lora_dpo.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2.5-VL-7B-Instruct
 3 | image_max_pixels: 262144
 4 | video_max_pixels: 16384
 5 | trust_remote_code: true
 6 | 
 7 | ### method
 8 | stage: dpo
 9 | do_train: true
10 | finetuning_type: lora
11 | lora_rank: 8
12 | lora_target: all
13 | pref_beta: 0.1
14 | pref_loss: sigmoid  # choices: [sigmoid (dpo), orpo, simpo]
15 | 
16 | ### dataset
17 | dataset: rlhf_v
18 | template: qwen2_vl
19 | cutoff_len: 2048
20 | max_samples: 1000
21 | overwrite_cache: true
22 | preprocessing_num_workers: 16
23 | dataloader_num_workers: 4
24 | 
25 | ### output
26 | output_dir: saves/qwen2_vl-7b/lora/dpo
27 | logging_steps: 10
28 | save_steps: 500
29 | plot_loss: true
30 | overwrite_output_dir: true
31 | save_only_model: false
32 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
33 | 
34 | ### train
35 | per_device_train_batch_size: 1
36 | gradient_accumulation_steps: 8
37 | learning_rate: 5.0e-6
38 | num_train_epochs: 3.0
39 | lr_scheduler_type: cosine
40 | warmup_ratio: 0.1
41 | bf16: true
42 | ddp_timeout: 180000000
43 | resume_from_checkpoint: null
44 | 
45 | ### eval
46 | # val_size: 0.1
47 | # per_device_eval_batch_size: 1
48 | # eval_strategy: steps
49 | # eval_steps: 500
50 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/galore/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | use_galore: true
10 | galore_layerwise: true  # choices: [true, false], use false for DDP training
11 | galore_target: all
12 | galore_rank: 128
13 | galore_scale: 2.0
14 | 
15 | ### dataset
16 | dataset: identity,alpaca_en_demo
17 | template: llama3
18 | cutoff_len: 2048
19 | max_samples: 1000
20 | overwrite_cache: true
21 | preprocessing_num_workers: 16
22 | dataloader_num_workers: 4
23 | 
24 | ### output
25 | output_dir: saves/llama3-8b/full/sft
26 | logging_steps: 10
27 | save_steps: 500
28 | plot_loss: true
29 | overwrite_output_dir: true
30 | save_only_model: false
31 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
32 | 
33 | ### train
34 | per_device_train_batch_size: 1
35 | gradient_accumulation_steps: 1  # use 1 for layerwise galore
36 | learning_rate: 1.0e-5
37 | num_train_epochs: 3.0
38 | lr_scheduler_type: cosine
39 | warmup_ratio: 0.1
40 | pure_bf16: true
41 | ddp_timeout: 180000000
42 | 
43 | ### eval
44 | # val_size: 0.1
45 | # per_device_eval_batch_size: 1
46 | # eval_strategy: steps
47 | # eval_steps: 500
48 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/critic/base.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | """
15 | Base class for a critic
16 | """
17 | from abc import ABC, abstractmethod
18 | 
19 | import torch
20 | 
21 | from verl import DataProto
22 | 
23 | __all__ = ['BasePPOCritic']
24 | 
25 | 
class BasePPOCritic(ABC):
    """Abstract interface that every PPO critic implementation must satisfy.

    Subclasses receive a configuration object at construction time and must
    provide both value computation and the critic update step.
    """

    def __init__(self, config):
        """Keep ``config`` on the instance so subclasses can read it."""
        super().__init__()
        self.config = config

    @abstractmethod
    def compute_values(self, data: DataProto) -> torch.Tensor:
        """Compute values for ``data`` and return them as a tensor."""

    @abstractmethod
    def update_critic(self, data: DataProto):
        """Update the critic using ``data``."""
41 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_sft_ds3.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
12 | 
13 | ### dataset
14 | dataset: identity,alpaca_en_demo
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | dataloader_num_workers: 4
21 | 
22 | ### output
23 | output_dir: saves/llama3-8b/lora/sft
24 | logging_steps: 10
25 | save_steps: 500
26 | plot_loss: true
27 | overwrite_output_dir: true
28 | save_only_model: false
29 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
30 | 
31 | ### train
32 | per_device_train_batch_size: 1
33 | gradient_accumulation_steps: 2
34 | learning_rate: 1.0e-4
35 | num_train_epochs: 3.0
36 | lr_scheduler_type: cosine
37 | warmup_ratio: 0.1
38 | bf16: true
39 | ddp_timeout: 180000000
40 | resume_from_checkpoint: null
41 | 
42 | ### eval
43 | # eval_dataset: alpaca_en_demo
44 | # val_size: 0.1
45 | # per_device_eval_batch_size: 1
46 | # eval_strategy: steps
47 | # eval_steps: 500
48 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/webui.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | from llamafactory.extras.misc import fix_proxy, is_env_enabled
18 | from llamafactory.webui.interface import create_ui
19 | 
20 | 
def main():
    """Build the web UI and launch it, configured from ``GRADIO_*`` environment variables.

    ``GRADIO_IPV6`` selects the default bind address (``[::]`` instead of
    ``0.0.0.0``), ``GRADIO_SERVER_NAME`` overrides that address, and
    ``GRADIO_SHARE`` is forwarded as the ``share`` launch option.
    """
    use_ipv6 = is_env_enabled("GRADIO_IPV6")
    share_enabled = is_env_enabled("GRADIO_SHARE")

    # An explicit GRADIO_SERVER_NAME wins over the IPv4/IPv6 default.
    default_host = "[::]" if use_ipv6 else "0.0.0.0"
    host = os.getenv("GRADIO_SERVER_NAME", default_host)

    print("Visit http://ip:port for Web UI, e.g., http://127.0.0.1:7860")
    fix_proxy(ipv6_enabled=use_ipv6)

    ui = create_ui().queue()
    ui.launch(share=share_enabled, server_name=host, inbrowser=True)
28 | 
29 | 
# Launch the web UI only when this file is executed as a script, not when it is imported.
if __name__ == "__main__":
    main()
32 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/extras/apollo/llama3_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: full
 9 | use_apollo: true
10 | apollo_layerwise: true  # choices: [true, false], use false for DDP training
11 | apollo_target: all
12 | apollo_rank: 128
13 | apollo_scale: 32.0
14 | apollo_scale_type: channel
15 | 
16 | ### dataset
17 | dataset: identity,alpaca_en_demo
18 | template: llama3
19 | cutoff_len: 2048
20 | max_samples: 1000
21 | overwrite_cache: true
22 | preprocessing_num_workers: 16
23 | dataloader_num_workers: 4
24 | 
25 | ### output
26 | output_dir: saves/llama3-8b/full/sft
27 | logging_steps: 10
28 | save_steps: 500
29 | plot_loss: true
30 | overwrite_output_dir: true
31 | save_only_model: false
32 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
33 | 
34 | ### train
35 | per_device_train_batch_size: 1
36 | gradient_accumulation_steps: 1  # use 1 for layerwise apollo
37 | learning_rate: 1.0e-5
38 | num_train_epochs: 3.0
39 | lr_scheduler_type: cosine
40 | warmup_ratio: 0.1
41 | pure_bf16: true
42 | ddp_timeout: 180000000
43 | 
44 | ### eval
45 | # val_size: 0.1
46 | # per_device_eval_batch_size: 1
47 | # eval_strategy: steps
48 | # eval_steps: 500
49 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_full/qwen2vl_full_sft.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
 3 | image_max_pixels: 262144
 4 | video_max_pixels: 16384
 5 | trust_remote_code: true
 6 | 
 7 | ### method
 8 | stage: sft
 9 | do_train: true
10 | finetuning_type: full
11 | freeze_vision_tower: true
12 | freeze_multi_modal_projector: true
13 | freeze_language_model: false
14 | deepspeed: examples/deepspeed/ds_z3_config.json
15 | 
16 | ### dataset
17 | dataset: mllm_demo,identity,alpaca_en_demo
18 | template: qwen2_vl
19 | cutoff_len: 2048
20 | max_samples: 1000
21 | overwrite_cache: true
22 | preprocessing_num_workers: 16
23 | dataloader_num_workers: 4
24 | 
25 | ### output
26 | output_dir: saves/qwen2_vl-7b/full/sft
27 | logging_steps: 10
28 | save_steps: 500
29 | plot_loss: true
30 | overwrite_output_dir: true
31 | save_only_model: false
32 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
33 | 
34 | ### train
35 | per_device_train_batch_size: 1
36 | gradient_accumulation_steps: 2
37 | learning_rate: 1.0e-5
38 | num_train_epochs: 3.0
39 | lr_scheduler_type: cosine
40 | warmup_ratio: 0.1
41 | bf16: true
42 | ddp_timeout: 180000000
43 | resume_from_checkpoint: null
44 | 
45 | ### eval
46 | # val_size: 0.1
47 | # per_device_eval_batch_size: 1
48 | # eval_strategy: steps
49 | # eval_steps: 500
50 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/rollout/base.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from abc import ABC, abstractmethod
16 | from typing import Iterable, Union
17 | 
18 | from verl import DataProto
19 | 
20 | __all__ = ['BaseRollout']
21 | 
22 | 
class BaseRollout(ABC):
    """Abstract interface for rollout implementations that generate sequences from prompts."""

    def __init__(self):
        """Initialise the base class; the constructor takes no arguments."""
        super().__init__()

    @abstractmethod
    def generate_sequences(self, prompts: DataProto) -> DataProto:
        """Generate sequences for ``prompts`` and return them as a ``DataProto``."""
38 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/data/processor/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .feedback import FeedbackDatasetProcessor
16 | from .pairwise import PairwiseDatasetProcessor
17 | from .pretrain import PretrainDatasetProcessor
18 | from .processor_utils import DatasetProcessor
19 | from .supervised import PackedSupervisedDatasetProcessor, SupervisedDatasetProcessor
20 | from .unsupervised import UnsupervisedDatasetProcessor
21 | 
22 | 
23 | __all__ = [
24 |     "DatasetProcessor",
25 |     "FeedbackDatasetProcessor",
26 |     "PackedSupervisedDatasetProcessor",
27 |     "PairwiseDatasetProcessor",
28 |     "PretrainDatasetProcessor",
29 |     "SupervisedDatasetProcessor",
30 |     "UnsupervisedDatasetProcessor",
31 | ]
32 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/api/common.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import json
16 | from typing import TYPE_CHECKING, Any
17 | 
18 | 
19 | if TYPE_CHECKING:
20 |     from pydantic import BaseModel
21 | 
22 | 
def dictify(data: "BaseModel") -> dict[str, Any]:
    """Convert a pydantic model to a plain dict, omitting fields that were never set.

    Works with both pydantic v2 (``model_dump``) and pydantic v1 (``dict``).

    Args:
        data: The model instance to convert.

    Returns:
        The result of the model's dump method called with ``exclude_unset=True``.
    """
    # Only the attribute lookup is guarded: an AttributeError raised *inside*
    # model_dump() must propagate instead of being mistaken for "pydantic v1"
    # and silently rerouted to the legacy method.
    try:  # pydantic v2
        dump = data.model_dump
    except AttributeError:  # pydantic v1
        dump = data.dict

    return dump(exclude_unset=True)
28 | 
29 | 
def jsonify(data: "BaseModel") -> str:
    """Serialise a pydantic model to a JSON string, omitting fields that were never set.

    With pydantic v2 the model is dumped via ``model_dump`` and encoded with
    ``json.dumps``; with pydantic v1 the model's own ``json`` method is used.
    Non-ASCII characters are emitted as-is (``ensure_ascii=False``) in both paths.

    Args:
        data: The model instance to serialise.

    Returns:
        The JSON text.
    """
    # Only the attribute lookup is guarded: an AttributeError raised while
    # dumping or encoding a v2 model must propagate rather than trigger the
    # v1 fallback.
    try:  # pydantic v2
        dump = data.model_dump
    except AttributeError:  # pydantic v1
        return data.json(exclude_unset=True, ensure_ascii=False)

    return json.dumps(dump(exclude_unset=True), ensure_ascii=False)
35 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/sharding_manager/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from verl.utils.import_utils import is_vllm_available, is_megatron_core_available
16 | 
17 | from .base import BaseShardingManager
18 | from .fsdp_ulysses import FSDPUlyssesShardingManager
19 | 
# The Megatron + vLLM sharding manager needs both optional dependencies.
# When either is unavailable the two names are still defined, bound to None.
if is_megatron_core_available() and is_vllm_available():
    from .megatron_vllm import AllGatherPPModel, MegatronVLLMShardingManager
else:
    AllGatherPPModel = None
    MegatronVLLMShardingManager = None

# The FSDP + vLLM sharding manager only needs vLLM; otherwise the name is bound to None.
if is_vllm_available():
    from .fsdp_vllm import FSDPVLLMShardingManager
else:
    FSDPVLLMShardingManager = None
34 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/.github/ISSUE_TEMPLATE/2-feature-request.yml:
--------------------------------------------------------------------------------
 1 | name: "\U0001F680 Feature request"
 2 | description: Submit a request for a new feature
 3 | labels: ["enhancement", "pending"]
 4 | body:
 5 |   - type: markdown
 6 |     attributes:
 7 |       value: |
 8 |         Please do not create issues that are not related to new features under this category.
 9 |         请勿在此分类下创建和新特性无关的 issues。
10 | 
11 |   - type: checkboxes
12 |     id: reminder
13 |     attributes:
14 |       label: Reminder
15 |       description: |
16 |         Please ensure you have read the above rules carefully and searched the existing issues.
17 |         请确保您已经认真阅读了上述规则并且搜索过现有的 issues。
18 | 
19 |       options:
20 |         - label: I have read the above rules and searched the existing issues.
21 |           required: true
22 | 
23 |   - type: textarea
24 |     id: description
25 |     validations:
26 |       required: true
27 |     attributes:
28 |       label: Description
29 |       description: |
30 |         A clear and concise description of the feature proposal.
31 |         请详细描述您希望加入的新功能特性。
32 | 
33 |   - type: textarea
34 |     id: contribution
35 |     validations:
36 |       required: false
37 |     attributes:
38 |       label: Pull Request
39 |       description: |
40 |         Have you already created the relevant PR and submitted the code?
41 |         您是否已经创建了相关 PR 并提交了代码？
42 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/data/mllm_video_audio_demo.json:
--------------------------------------------------------------------------------
 1 | [
 2 |   {
 3 |     "messages": [
 4 |       {
 5 |         "content": "<video><audio>What is the video describing?",
 6 |         "role": "user"
 7 |       },
 8 |       {
 9 |         "content": "A girl who is drawing a picture of a guitar and feel nervous.",
10 |         "role": "assistant"
11 |       }
12 |     ],
13 |     "videos": [
14 |       "mllm_demo_data/4.mp4"
15 |     ],
16 |     "audios": [
17 |       "mllm_demo_data/4.mp3"
18 |     ]
19 |   },
20 |   {
21 |     "messages": [
22 |       {
23 |         "content": "<video><audio>What does this girl say?",
24 |         "role": "user"
25 |       },
26 |       {
27 |         "content": "She says: 'Hello! Take a look at what am I drawing!'",
28 |         "role": "assistant"
29 |       }
30 |     ],
31 |     "videos": [
32 |       "mllm_demo_data/4.mp4"
33 |     ],
34 |     "audios": [
35 |       "mllm_demo_data/4.mp3"
36 |     ]
37 |   },
38 |   {
39 |     "messages": [
40 |       {
41 |         "content": "<video><audio>What is this girl drawing with?",
42 |         "role": "user"
43 |       },
44 |       {
45 |         "content": "She is drawing with an iPad.",
46 |         "role": "assistant"
47 |       }
48 |     ],
49 |     "videos": [
50 |       "mllm_demo_data/4.mp4"
51 |     ],
52 |     "audios": [
53 |       "mllm_demo_data/4.mp3"
54 |     ]
55 |   }
56 | ]
57 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/data/processor/test_processor_utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | 
16 | import pytest
17 | 
18 | from llamafactory.data.processor.processor_utils import infer_seqlen
19 | 
20 | 
@pytest.mark.parametrize(
    "test_input,test_output",
    [
        ((3000, 2000, 1000), (600, 400)),
        ((2000, 3000, 1000), (400, 600)),
        ((1000, 100, 1000), (900, 100)),
        ((100, 1000, 1000), (100, 900)),
        ((100, 500, 1000), (100, 500)),
        ((500, 100, 1000), (500, 100)),
        ((10, 10, 1000), (10, 10)),
    ],
)
def test_infer_seqlen(test_input: tuple[int, int, int], test_output: tuple[int, int]):
    """Check that ``infer_seqlen`` maps each argument triple to the expected pair."""
    # NOTE(review): the triples look like (source_len, target_len, cutoff_len) -- confirm against infer_seqlen.
    actual = infer_seqlen(*test_input)
    assert actual == test_output
35 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/trainer/config/sft_trainer.yaml:
--------------------------------------------------------------------------------
 1 | data:
 2 |   train_batch_size: 256
 3 |   micro_batch_size: 16  # this is also val batch size
 4 |   train_files: ~/data/gsm8k/train.parquet
 5 |   val_files: ~/data/gsm8k/test.parquet
 6 |   prompt_key: question
 7 |   response_key: answer
 8 |   max_length: 1024
 9 |   truncation: error
10 |   balance_dp_token: False
11 |   chat_template: null
12 | model:
13 |   partial_pretrain: ~/models/gemma-1.1-7b-it
14 |   fsdp_config:
15 |     wrap_policy:
16 |       min_num_params: 0
17 |     cpu_offload: False
18 |     offload_params: False
19 |   external_lib: null
20 |   enable_gradient_checkpointing: False
21 |   trust_remote_code: False
22 |   lora_rank: 0  # Set to positive value to enable LoRA (e.g., 32)
23 |   lora_alpha: 16  # LoRA scaling factor
24 |   target_modules: [q_proj, v_proj]  # Target modules for LoRA adaptation
25 | optim:
26 |   lr: 1e-5
27 |   betas: [0.9, 0.95]
28 |   weight_decay: 0.01
29 |   warmup_steps_ratio: 0.1
30 |   clip_grad: 1.0
31 | 
32 | trainer:
33 |   default_local_dir: /tmp/sft_model
34 |   default_hdfs_dir: hdfs://tmp/experiments/gsm8k/gemma-1.1-7b-it/ # change the hdfs path here
35 |   resume_path: null
36 |   project_name: gsm8k-sft
37 |   experiment_name: test
38 |   total_epochs: 4
39 |   total_training_steps: null
40 |   validate_before_training: False
41 |   logger: ['console']
42 |   seed: 1
43 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/debug/performance.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import torch
16 | import torch.distributed as dist
17 | import logging
18 | 
19 | 
def log_gpu_memory_usage(head: str, logger: logging.Logger = None, level=logging.DEBUG, rank: int = 0):
    """Report the CUDA memory currently allocated and reserved, in GB.

    The report is emitted when ``torch.distributed`` is not initialized, when
    ``rank`` is ``None``, or when this process's distributed rank equals
    ``rank``. In every other case the call does nothing.

    Args:
        head: Text placed at the start of the message.
        logger: Logger that receives the message; when ``None`` the message
            is printed instead.
        level: Logging level used when ``logger`` is given.
        rank: Distributed rank allowed to report, or ``None`` for all ranks.
    """
    # Stay silent only when running distributed, a target rank is set, and
    # this process is not that rank.
    if dist.is_initialized() and rank is not None and dist.get_rank() != rank:
        return

    bytes_per_gb = 1024**3
    allocated_gb = torch.cuda.memory_allocated() / bytes_per_gb
    reserved_gb = torch.cuda.memory_reserved() / bytes_per_gb
    report = f'{head}, memory allocated (GB): {allocated_gb}, memory reserved (GB): {reserved_gb}'

    if logger is not None:
        logger.log(level, report)
        return
    print(report)
31 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/data/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .collator import (
16 |     KTODataCollatorWithPadding,
17 |     MultiModalDataCollatorForSeq2Seq,
18 |     PairwiseDataCollatorWithPadding,
19 |     SFTDataCollatorWith4DAttentionMask,
20 | )
21 | from .data_utils import Role, split_dataset
22 | from .loader import get_dataset
23 | from .template import TEMPLATES, Template, get_template_and_fix_tokenizer
24 | 
25 | 
26 | __all__ = [
27 |     "TEMPLATES",
28 |     "KTODataCollatorWithPadding",
29 |     "MultiModalDataCollatorForSeq2Seq",
30 |     "PairwiseDataCollatorWithPadding",
31 |     "Role",
32 |     "SFTDataCollatorWith4DAttentionMask",
33 |     "Template",
34 |     "get_dataset",
35 |     "get_template_and_fix_tokenizer",
36 |     "split_dataset",
37 | ]
38 | 


--------------------------------------------------------------------------------
/api/visual_tools/egoschema_videollm_llava/video_llm.py:
--------------------------------------------------------------------------------
 1 | # videollm.py
 2 | from google import genai
 3 | from typing_extensions import Annotated
 4 | import time
 5 | import os
 6 | import ffmpeg
 7 | from utils import locate_videos, config_videos
 8 | import contextlib
 9 | import requests
10 | 
11 | 
12 | 
def video_llm(question: str, range: str,  cache_dir: str, data_dir: str) -> dict:
    """Ask the local video-LLM HTTP service a question about a span of video.

    Args:
        question: Prompt forwarded to the inference service.
        range: Query span written as ``<start>-<end>``; the error message
            documents the form ``DAYX_HHMMSSFF-DAYX_HHMMSSFF``. The name
            shadows the builtin but is kept so existing callers still work.
        cache_dir: Passed through to ``locate_videos`` and ``config_videos``.
        data_dir: Passed through to ``locate_videos``.

    Returns:
        A dict with the keys ``query_time`` (the ``range`` argument as given),
        ``question``, ``answer`` (the service's ``response`` field),
        ``exact_match`` (as returned by ``locate_videos``) and ``length``
        (as returned by ``config_videos``).

    Raises:
        ValueError: If ``range`` does not split into exactly two parts on "-".
        requests.HTTPError: If the inference service answers with an error
            status.
    """
    # Catch only the failures a malformed range can produce, so that
    # KeyboardInterrupt and SystemExit are no longer swallowed.
    try:
        start_time, end_time = range.split("-")
    except (ValueError, AttributeError) as err:
        raise ValueError("Invalid range format. Use DAYX_HHMMSSFF-DAYX_HHMMSSFF.") from err

    # locate_videos also returns a start time, which replaces the parsed one
    # before the clips are combined.
    file_paths, exact_match, start_time = locate_videos(
        start_time, end_time, data_dir=data_dir, cache_dir=cache_dir
    )
    combined_video, length = config_videos(file_paths, start_time, end_time, cache_dir=cache_dir)

    url = "http://localhost:8000/video/infer"
    pay_load = {
        "video_path": combined_video,
        "prompt": question,
        "max_frames": 64,
        "frame_step": 1
    }

    response = requests.post(url, json=pay_load)
    # Fail with the real HTTP error instead of a confusing JSON/KeyError later.
    response.raise_for_status()

    # Decode the body once and reuse it for both the log line and the result.
    answer = response.json()['response']
    print(answer)

    return {
        "query_time": range,
        "question": question,
        "answer": answer,
        "exact_match": exact_match,
        "length": length
    }
47 | 
48 | 
49 | 
50 | 


--------------------------------------------------------------------------------
/api/visual_tools/videomme_videollm_llava/video_llm.py:
--------------------------------------------------------------------------------
 1 | # videollm.py
 2 | from google import genai
 3 | from typing_extensions import Annotated
 4 | import time
 5 | import os
 6 | import ffmpeg
 7 | from utils import locate_videos, config_videos
 8 | import contextlib
 9 | import requests
10 | 
11 | 
12 | 
def video_llm(question: str, range: str,  cache_dir: str, data_dir: str) -> dict:
    """Ask the local video-LLM HTTP service a question about a span of video.

    Args:
        question: Prompt forwarded to the inference service.
        range: Query span written as ``<start>-<end>``; the error message
            documents the form ``DAYX_HHMMSSFF-DAYX_HHMMSSFF``. The name
            shadows the builtin but is kept so existing callers still work.
        cache_dir: Passed through to ``locate_videos`` and ``config_videos``.
        data_dir: Passed through to ``locate_videos``.

    Returns:
        A dict with the keys ``query_time`` (the ``range`` argument as given),
        ``question``, ``answer`` (the service's ``response`` field),
        ``exact_match`` (as returned by ``locate_videos``) and ``length``
        (as returned by ``config_videos``).

    Raises:
        ValueError: If ``range`` does not split into exactly two parts on "-".
        requests.HTTPError: If the inference service answers with an error
            status.
    """
    # Catch only the failures a malformed range can produce, so that
    # KeyboardInterrupt and SystemExit are no longer swallowed.
    try:
        start_time, end_time = range.split("-")
    except (ValueError, AttributeError) as err:
        raise ValueError("Invalid range format. Use DAYX_HHMMSSFF-DAYX_HHMMSSFF.") from err

    # locate_videos also returns a start time, which replaces the parsed one
    # before the clips are combined.
    file_paths, exact_match, start_time = locate_videos(
        start_time, end_time, data_dir=data_dir, cache_dir=cache_dir
    )
    combined_video, length = config_videos(file_paths, start_time, end_time, cache_dir=cache_dir)

    url = "http://localhost:8000/video/infer"
    pay_load = {
        "video_path": combined_video,
        "prompt": question,
        "max_frames": 64,
        "frame_step": 1
    }

    response = requests.post(url, json=pay_load)
    # Fail with the real HTTP error instead of a confusing JSON/KeyError later.
    response.raise_for_status()

    # Decode the body once and reuse it for both the log line and the result.
    answer = response.json()['response']
    print(answer)

    return {
        "query_time": range,
        "question": question,
        "answer": answer,
        "exact_match": exact_match,
        "length": length
    }
47 | 
48 | 
49 | 
50 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_full/qwen.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: Qwen/Qwen2.5-3B-Instruct
 3 | trust_remote_code: true
 4 | add_tokens: <think>,</think>,<tool>,</tool>,<answer>,</answer>,<information>,</information>
 5 | 
 6 | ### method
 7 | stage: sft
 8 | do_train: true
 9 | finetuning_type: full
10 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
11 | 
12 | ### dataset
13 | dataset: train-cott
14 | template: qwen
15 | cutoff_len: 4096
16 | max_samples: 100000
17 | overwrite_cache: true
18 | preprocessing_num_workers: 16
19 | dataloader_num_workers: 0
20 | 
21 | ### output
22 | output_dir: saves/qwen25-3b-sft-cott
23 | logging_steps: 10
24 | save_steps: 50
25 | plot_loss: true
26 | overwrite_output_dir: true
27 | save_only_model: false
28 | report_to: wandb  # choices: [none, wandb, tensorboard, swanlab, mlflow]
29 | 
30 | ### train
31 | per_device_train_batch_size: 8
32 | gradient_accumulation_steps: 4
33 | learning_rate: 1.0e-5
34 | num_train_epochs: 3.0
35 | lr_scheduler_type: cosine
36 | warmup_ratio: 0.1
37 | bf16: true
38 | ddp_timeout: 180000000
39 | resume_from_checkpoint: null
40 | optim: paged_adamw_8bit
41 | use_unsloth_gc: true
42 | enable_liger_kernel: true
43 | 
44 | ### eval
45 | # eval_dataset: alpaca_en_demo
46 | # val_size: 0.1
47 | # per_device_eval_batch_size: 1
48 | # eval_strategy: steps
49 | # eval_steps: 500
50 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama4_lora_sft_ds3.yaml:
--------------------------------------------------------------------------------
 1 | # pip install git+https://github.com/hiyouga/transformers.git@llama4_train
 2 | 
 3 | ### model
 4 | model_name_or_path: meta-llama/Llama-4-Scout-17B-16E-Instruct
 5 | trust_remote_code: true
 6 | 
 7 | ### method
 8 | stage: sft
 9 | do_train: true
10 | finetuning_type: lora
11 | lora_rank: 8
12 | lora_target: all
13 | deepspeed: examples/deepspeed/ds_z3_config.json  # choices: [ds_z0_config.json, ds_z2_config.json, ds_z3_config.json]
14 | 
15 | ### dataset
16 | dataset: mllm_demo,identity,alpaca_en_demo
17 | template: llama4
18 | cutoff_len: 2048
19 | max_samples: 1000
20 | overwrite_cache: true
21 | preprocessing_num_workers: 16
22 | dataloader_num_workers: 4
23 | 
24 | ### output
25 | output_dir: saves/llama4-8b/lora/sft
26 | logging_steps: 10
27 | save_steps: 500
28 | plot_loss: true
29 | overwrite_output_dir: true
30 | save_only_model: false
31 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
32 | 
33 | ### train
34 | per_device_train_batch_size: 1
35 | gradient_accumulation_steps: 2
36 | learning_rate: 1.0e-4
37 | num_train_epochs: 3.0
38 | lr_scheduler_type: cosine
39 | warmup_ratio: 0.1
40 | bf16: true
41 | ddp_timeout: 180000000
42 | resume_from_checkpoint: null
43 | 
44 | ### eval
45 | # eval_dataset: alpaca_en_demo
46 | # val_size: 0.1
47 | # per_device_eval_batch_size: 1
48 | # eval_strategy: steps
49 | # eval_steps: 500
50 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/check_license.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import sys
16 | from pathlib import Path
17 | 
18 | 
KEYWORDS = ("Copyright", "2025", "LlamaFactory")


def main():
    """Assert that every ``*.py`` file under the given directories has a license line.

    Directories come from ``sys.argv[1:]`` and are searched recursively. For
    each file the first line of its stripped content must contain every entry
    of ``KEYWORDS``; files whose stripped content starts with an empty line
    (including empty files) are skipped.

    Raises:
        AssertionError: For the first file whose first line lacks a keyword.
    """
    path_list: list[Path] = [
        found for check_dir in sys.argv[1:] for found in Path(check_dir).glob("**/*.py")
    ]

    for path in path_list:
        first_line = path.absolute().read_text(encoding="utf-8").strip().partition("\n")[0]
        if first_line == "":
            continue

        print(f"Check license: {path}")
        missing = [keyword for keyword in KEYWORDS if keyword not in first_line]
        assert not missing, f"File {path} does not contain license."


if __name__ == "__main__":
    main()
39 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/hparams/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from .data_args import DataArguments
16 | from .evaluation_args import EvaluationArguments
17 | from .finetuning_args import FinetuningArguments
18 | from .generating_args import GeneratingArguments
19 | from .model_args import ModelArguments
20 | from .parser import get_eval_args, get_infer_args, get_ray_args, get_train_args, read_args
21 | from .training_args import RayArguments, TrainingArguments
22 | 
23 | 
24 | __all__ = [
25 |     "DataArguments",
26 |     "EvaluationArguments",
27 |     "FinetuningArguments",
28 |     "GeneratingArguments",
29 |     "ModelArguments",
30 |     "RayArguments",
31 |     "TrainingArguments",
32 |     "get_eval_args",
33 |     "get_infer_args",
34 |     "get_ray_args",
35 |     "get_train_args",
36 |     "read_args",
37 | ]
38 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/e2e/test_chat.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | from llamafactory.chat import ChatModel
18 | 
19 | 
20 | TINY_LLAMA3 = os.getenv("TINY_LLAMA3", "llamafactory/tiny-random-Llama-3")
21 | 
22 | INFER_ARGS = {
23 |     "model_name_or_path": TINY_LLAMA3,
24 |     "finetuning_type": "lora",
25 |     "template": "llama3",
26 |     "infer_dtype": "float16",
27 |     "do_sample": False,
28 |     "max_new_tokens": 1,
29 | }
30 | 
31 | MESSAGES = [
32 |     {"role": "user", "content": "Hi"},
33 | ]
34 | 
35 | EXPECTED_RESPONSE = "_rho"
36 | 
37 | 
def test_chat():
    """A non-streaming chat call returns the pinned response text first."""
    model = ChatModel(INFER_ARGS)
    replies = model.chat(MESSAGES)
    assert replies[0].response_text == EXPECTED_RESPONSE
41 | 
42 | 
def test_stream_chat():
    """The concatenated streamed tokens equal the pinned response text."""
    model = ChatModel(INFER_ARGS)
    streamed = "".join(model.stream_chat(MESSAGES))

    assert streamed == EXPECTED_RESPONSE
50 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/CITATION.cff:
--------------------------------------------------------------------------------
 1 | cff-version: 1.2.0
 2 | date-released: 2024-03
 3 | message: "If you use this software, please cite it as below."
 4 | authors:
 5 | - family-names: "Zheng"
 6 |   given-names: "Yaowei"
 7 | - family-names: "Zhang"
 8 |   given-names: "Richong"
 9 | - family-names: "Zhang"
10 |   given-names: "Junhao"
11 | - family-names: "Ye"
12 |   given-names: "Yanhan"
13 | - family-names: "Luo"
14 |   given-names: "Zheyan"
15 | - family-names: "Feng"
16 |   given-names: "Zhangchi"
17 | - family-names: "Ma"
18 |   given-names: "Yongqiang"
19 | title: "LlamaFactory: Unified Efficient Fine-Tuning of 100+ Language Models"
20 | url: "https://arxiv.org/abs/2403.13372"
21 | preferred-citation:
22 |   type: conference-paper
23 |   conference:
24 |     name: "Proceedings of the 62nd Annual Meeting of the Association for Computational Linguistics (Volume 3: System Demonstrations)"
25 |   authors:
26 |     - family-names: "Zheng"
27 |       given-names: "Yaowei"
28 |     - family-names: "Zhang"
29 |       given-names: "Richong"
30 |     - family-names: "Zhang"
31 |       given-names: "Junhao"
32 |     - family-names: "Ye"
33 |       given-names: "Yanhan"
34 |     - family-names: "Luo"
35 |       given-names: "Zheyan"
36 |     - family-names: "Feng"
37 |       given-names: "Zhangchi"
38 |     - family-names: "Ma"
39 |       given-names: "Yongqiang"
40 |   title: "LlamaFactory: Unified Efficient Fine-Tuning of 100+ Language Models"
41 |   url: "https://arxiv.org/abs/2403.13372"
42 |   year: 2024
43 |   publisher: "Association for Computational Linguistics"
44 |   address: "Bangkok, Thailand"
45 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/import_utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | """
15 | Utilities to check if packages are available.
16 | We assume package availability won't change during runtime.
17 | """
18 | 
19 | from functools import cache
20 | from typing import List
21 | 
22 | 
@cache
def is_megatron_core_available():
    """Return True when ``megatron.core.parallel_state`` can be imported.

    The answer is memoized by ``functools.cache``, so the import is attempted
    only on the first call.
    """
    available = True
    try:
        from megatron.core import parallel_state as mpu
    except ImportError:
        available = False
    return available
30 | 
31 | 
@cache
def is_vllm_available():
    """Return True when ``vllm`` can be imported.

    The answer is memoized by ``functools.cache``, so the import is attempted
    only on the first call.
    """
    available = True
    try:
        import vllm
    except ImportError:
        available = False
    return available
39 | 
40 | 
def import_external_libs(external_libs=None):
    """Import one or more modules by name.

    Args:
        external_libs: ``None`` (nothing is imported), a single module name,
            or an iterable of module names. Any non-string iterable is
            accepted, so a tuple or another container of names works as well
            as a list.

    Raises:
        ImportError: Propagated from ``importlib.import_module`` when a named
            module cannot be imported.
    """
    if external_libs is None:
        return
    import importlib
    from collections.abc import Iterable

    # A string is itself iterable, so it has to be recognised as a single
    # module name before the generic iterable case.
    if isinstance(external_libs, (str, bytes)) or not isinstance(external_libs, Iterable):
        external_libs = [external_libs]
    for external_lib in external_libs:
        importlib.import_module(external_lib)
49 | 


--------------------------------------------------------------------------------
/cott_gen/__init__.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Data generation package for EgoLifeQA question answering tasks.
 3 | 
 4 | This package provides tools and utilities for processing egocentric video data,
 5 | generating question-answer pairs, and running AI agents to analyze the data.
 6 | """
 7 | 
 8 | # Import main components from modules
 9 | from .main import AgentResponse, arg_parser, load_qa_data, main
10 | from .prompts import sys_prompt_v0, sys_prompt_v1, thought_prompt
11 | from .tools import (
12 |     rag, 
13 |     video_llm, 
14 |     vlm, 
15 |     terminate, 
16 |     GPT
17 | )
18 | from .utils import (
19 |     setup_logging_and_config,
20 |     locate_video_url,
21 |     locate_image_url,
22 |     extract_json,
23 |     calculate_time_diff,
24 |     convert_seconds_to_time,
25 |     process_qa
26 | )
27 | 
28 | # Define what's available when using "from cott_gen import *"
29 | __all__ = [
30 |     # From main.py
31 |     'AgentResponse', 'arg_parser', 'load_qa_data', 'main',
32 |     
33 |     # From prompts.py
34 |     'sys_prompt_v0', 'sys_prompt_v1', 'thought_prompt',
35 |     
36 |     # From tools.py
37 |     'rag', 'video_llm', 'vlm', 'terminate', 'GPT',
38 |     
39 |     # From utils.py
40 |     'setup_logging_and_config', 'locate_video_url', 'locate_image_url',
41 |     'extract_json', 'calculate_time_diff', 'convert_seconds_to_time',
42 |     'process_qa'
43 | ]
44 | 
45 | # Package version
46 | __version__ = '0.1.0'
47 | 
48 | # Package metadata
49 | __author__ = 'Shulin Tian'
50 | __email__ = 'shulin002@e.ntu.edu.sg'
51 | __description__ = 'Tools for generating and processing EgoLifeQA data'
52 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/ray_utils.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | """
15 | Contains commonly used utilities for ray
16 | """
17 | 
18 | import ray
19 | 
20 | import concurrent.futures
21 | 
22 | 
def parallel_put(data_list, max_workers=None):
    """Call ``ray.put`` on every item concurrently and return the results in input order.

    Args:
        data_list: Sized collection of objects to pass to ``ray.put``.
        max_workers: Thread count for the pool. Defaults to
            ``min(len(data_list), 16)``.

    Returns:
        A list with one ``ray.put`` result per input item, in the same order
        as ``data_list``. An empty input yields an empty list.
    """
    # With no items the default worker count would be 0, which
    # ThreadPoolExecutor rejects with ValueError; there is nothing to do anyway.
    if len(data_list) == 0:
        return []

    if max_workers is None:
        max_workers = min(len(data_list), 16)

    with concurrent.futures.ThreadPoolExecutor(max_workers=max_workers) as executor:
        # executor.map yields results in submission order, so no index
        # bookkeeping is needed to restore the original ordering.
        return list(executor.map(ray.put, data_list))
44 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/logger/aggregate_logger.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | """
15 | A Ray logger will receive logging info from different processes.
16 | """
17 | import numbers
18 | from typing import Dict
19 | 
20 | 
def concat_dict_to_str(dict: Dict, step):
    """Render the numeric entries of a mapping as one ``' - '``-separated line.

    The line starts with ``step:<step>``. Every value that is a
    ``numbers.Number`` follows as ``<key>:<value>`` with three decimals;
    non-numeric values are left out.
    """
    numeric_parts = [
        f'{key}:{value:.3f}' for key, value in dict.items() if isinstance(value, numbers.Number)
    ]
    return ' - '.join([f'step:{step}', *numeric_parts])
28 | 
29 | 
class LocalLogger:
    """Logger that optionally echoes metric dictionaries to stdout.

    ``remote_logger`` and ``enable_wandb`` are accepted by the constructor
    but are not used by this class.
    """

    def __init__(self, remote_logger=None, enable_wandb=False, print_to_console=False):
        self.print_to_console = print_to_console
        if not print_to_console:
            return
        print('Using LocalLogger is deprecated. The constructor API will change ')

    def flush(self):
        """Do nothing; this logger keeps no buffered state."""
        return None

    def log(self, data, step):
        """Print ``data`` formatted by ``concat_dict_to_str`` when console output is on."""
        if not self.print_to_console:
            return
        print(concat_dict_to_str(data, step=step), flush=True)


--------------------------------------------------------------------------------
/LLaMA-Factory/scripts/convert_ckpt/tiny_llama4.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from transformers import Llama4Config, Llama4ForConditionalGeneration, Llama4TextConfig, Llama4VisionConfig
16 | 
17 | 
if __name__ == "__main__":
    # Build a small Llama 4 model (vision + text) purely from configuration
    # objects and save it to ./tiny-llama4. No pretrained checkpoint is loaded.
    text_hidden_size = 512
    text_attention_heads = 8

    vision_kwargs = {
        "hidden_size": 1408,
        "image_size": 336,
        "intermediate_size": 5632,
        "num_attention_heads": 16,
        "num_hidden_layers": 4,
        "vision_output_dim": 4096,
    }
    text_kwargs = {
        "hidden_size": text_hidden_size,
        "intermediate_size": 1024,
        "intermediate_size_mlp": 1024,
        "num_hidden_layers": 4,
        "num_attention_heads": text_attention_heads,
        "num_key_value_heads": 2,
        # Per-head width: hidden size split evenly across the attention heads.
        "head_dim": text_hidden_size // text_attention_heads,
        "num_local_experts": 2,
    }

    tiny_config = Llama4Config(
        vision_config=Llama4VisionConfig(**vision_kwargs),
        text_config=Llama4TextConfig(**text_kwargs),
    )
    tiny_model = Llama4ForConditionalGeneration._from_config(tiny_config)
    tiny_model.save_pretrained("tiny-llama4")
40 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/examples/train_lora/llama3_lora_sft_ray.yaml:
--------------------------------------------------------------------------------
 1 | ### model
 2 | model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct  # or use local absolute path
 3 | trust_remote_code: true
 4 | 
 5 | ### method
 6 | stage: sft
 7 | do_train: true
 8 | finetuning_type: lora
 9 | lora_rank: 8
10 | lora_target: all
11 | 
12 | ### dataset
13 | dataset: identity,alpaca_en_demo
14 | dataset_dir: REMOTE:llamafactory/demo_data  # or use local absolute path
15 | template: llama3
16 | cutoff_len: 2048
17 | max_samples: 1000
18 | overwrite_cache: true
19 | preprocessing_num_workers: 16
20 | dataloader_num_workers: 4
21 | 
22 | ### output
23 | output_dir: tmp_dir
24 | logging_steps: 10
25 | save_steps: 500
26 | plot_loss: true
27 | overwrite_output_dir: true
28 | save_only_model: false
29 | report_to: none  # choices: [none, wandb, tensorboard, swanlab, mlflow]
30 | 
31 | ### ray
32 | ray_run_name: llama3_8b_sft_lora
33 | ray_storage_path: ./saves
34 | ray_num_workers: 4  # Number of GPUs to use.
35 | placement_strategy: PACK
36 | resources_per_worker:
37 |   GPU: 1
38 | # ray_init_kwargs:
39 | #   runtime_env:
40 | #     env_vars:
41 | #       <YOUR-ENV-VAR-HERE>: "<YOUR-ENV-VAR-HERE>"
42 | #     pip:
43 | #       - emoji
44 | 
45 | ### train
46 | per_device_train_batch_size: 1
47 | gradient_accumulation_steps: 8
48 | learning_rate: 1.0e-4
49 | num_train_epochs: 3.0
50 | lr_scheduler_type: cosine
51 | warmup_ratio: 0.1
52 | bf16: true
53 | ddp_timeout: 180000000
54 | resume_from_checkpoint: null
55 | 
56 | ### eval
57 | # eval_dataset: alpaca_en_demo
58 | # val_size: 0.1
59 | # per_device_eval_batch_size: 1
60 | # eval_strategy: steps
61 | # eval_steps: 500
62 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/model/model_utils/mod.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from typing import TYPE_CHECKING
16 | 
17 | from ...extras.constants import MOD_SUPPORTED_MODELS
18 | 
19 | 
20 | if TYPE_CHECKING:
21 |     from transformers import PretrainedConfig, PreTrainedModel
22 | 
23 |     from ...hparams import ModelArguments
24 | 
25 | 
def load_mod_pretrained_model(**init_kwargs) -> "PreTrainedModel":
    """Load a model through ``MoD.AutoMoDModelForCausalLM.from_pretrained``.

    ``MoD`` is imported inside the function, so it is only required when this
    function is actually called. All keyword arguments are forwarded as given.
    """
    from MoD import AutoMoDModelForCausalLM as mod_model_cls

    loaded_model = mod_model_cls.from_pretrained(**init_kwargs)
    return loaded_model
30 | 
31 | 
def convert_pretrained_model_to_mod(
    model: "PreTrainedModel", config: "PretrainedConfig", model_args: "ModelArguments"
) -> "PreTrainedModel":
    """Apply ``MoD.apply_mod_to_hf`` to ``model`` and cast it to the compute dtype.

    Raises:
        ValueError: If ``config.model_type`` is missing or is not listed in
            ``MOD_SUPPORTED_MODELS``.
    """
    # Imported first, as before, so a missing MoD package fails ahead of the
    # model-type check.
    from MoD import apply_mod_to_hf

    model_type = getattr(config, "model_type", None)
    if model_type not in MOD_SUPPORTED_MODELS:
        raise ValueError("Current model is not supported by mixture-of-depth.")

    return apply_mod_to_hf(model).to(model_args.compute_dtype)
43 | 


--------------------------------------------------------------------------------
/api/visual_tools/egoschema_vlm/vlm.py:
--------------------------------------------------------------------------------
 1 | from utils import *
 2 | 
 3 | def vlm(question: Annotated[str, "The question you want to use the vision language model to answer. Note: The question does not necessarily need to be the same as the question given by the user. You should propose a question based on the available observations."], timestamp: Annotated[str, "The timestamp of the video to answer the question. The format should be DAYX_HHMMSSFF (X is the day number, HHMMSS is the hour, minute, second, and FF is the frame number(00~19))"], data_dir: Annotated[str, "The directory of all videos"] = "/home/data2/sltian/code/Ego-R1_dev/EgoLife") -> dict:
 4 |     """
 5 |     Analyze a single image frame at the specified timestamp using a vision language model.
 6 |     Answers questions about visual scenes, events, and objects.
 7 |     Returns both the answer and image file metadata.
 8 |     
 9 |     FREQUENCY: 2/10    
10 |     COST: 2/5
11 |     TEMPORAL CAPABILITY: 1/5
12 |     VISUAL INPUT: True
13 |     
14 |     ## HINT
15 |     1. Ask targeted questions that align with your observation and reasoning process rather than repeating the user's original question.
16 |     """
17 |     
18 |     # Use OpenAI API to answer the question
19 |     os.makedirs("./cache", exist_ok=True)
20 |     frame_path, exact_match = locate_image_url(timestamp,data_dir)
21 |     print(f"Frame path: {frame_path}")
22 |     image_client = GPT()
23 |     answer = image_client.chat(question, frame_path)
24 |     
25 |     response = {
26 |         "query_time": timestamp,
27 |         "question": question,
28 |         "answer": answer,
29 |         "exact_match": exact_match
30 |     }
31 |     return response


--------------------------------------------------------------------------------
/api/visual_tools/videomme_vlm/vlm.py:
--------------------------------------------------------------------------------
 1 | from utils import *
 2 | 
 3 | def vlm(question: Annotated[str, "The question you want to use the vision language model to answer. Note: The question does not necessarily need to be the same as the question given by the user. You should propose a question based on the available observations."], timestamp: Annotated[str, "The timestamp of the video to answer the question. The format should be DAYX_HHMMSSFF (X is the day number, HHMMSS is the hour, minute, second, and FF is the frame number(00~19))"], data_dir: Annotated[str, "The directory of all videos"] = "/home/data2/sltian/code/Ego-R1_dev/EgoLife") -> dict:
 4 |     """
 5 |     Analyze a single image frame at the specified timestamp using a vision language model.
 6 |     Answers questions about visual scenes, events, and objects.
 7 |     Returns both the answer and image file metadata.
 8 |     
 9 |     FREQUENCY: 2/10    
10 |     COST: 2/5
11 |     TEMPORAL CAPABILITY: 1/5
12 |     VISUAL INPUT: True
13 |     
14 |     ## HINT
15 |     1. Ask targeted questions that align with your observation and reasoning process rather than repeating the user's original question.
16 |     """
17 |     
18 |     # Use OpenAI API to answer the question
19 |     os.makedirs("./cache", exist_ok=True)
20 |     frame_path, exact_match = locate_image_url(timestamp,data_dir)
21 |     print(f"Frame path: {frame_path}")
22 |     image_client = GPT()
23 |     answer = image_client.chat(question, frame_path)
24 |     
25 |     response = {
26 |         "query_time": timestamp,
27 |         "question": question,
28 |         "answer": answer,
29 |         "exact_match": exact_match
30 |     }
31 |     return response


--------------------------------------------------------------------------------
/Ego-R1-Agent/README.md:
--------------------------------------------------------------------------------
 1 | # Ego-R1-Agent
 2 | 
 3 | A reinforcement learning framework for training reasoning-and-searching interleaved language models for egocentric video understanding. Built on [veRL](https://github.com/volcengine/verl) and [Search-R1](https://github.com/PeterGriffinJin/Search-R1?tab=readme-ov-file).
 4 | 
 5 | ## 📁 Directory Structure
 6 | 
 7 | ```
 8 | Ego-R1-Agent/
 9 | ├── eval/                    # Evaluation scripts
10 | │   ├── infer.py            # Main inference script
11 | │   ├── infer_bench_summ.py # Benchmark evaluation
12 | │   ├── infer_summ.py       # Summary evaluation
13 | │   └── infer_bench_summ.sh # Benchmark evaluation script
14 | ├── utils/                   # Utility functions
15 | │   ├── constants.py        # System prompts and API endpoints
16 | │   ├── process.py          # Tool calling and response processing
17 | │   └── serve.sh            # Model serving script
18 | ├── verl/                    # veRL framework components
19 | ├── ego_r1/                 # Core implementation
20 | ├── train_grpo.sh           # GRPO training script
21 | ├── train_grpo_base.sh      # Base GRPO training configuration
22 | ├── environment.yml         # Conda environment specification
23 | ├── setup.py               # Package setup
24 | ├── pyproject.toml         # Project metadata
25 | └── VERL_README.md         # veRL framework documentation
26 | ```
27 | 
28 | ## 🔧 Quick Setup
29 | 
30 | ```bash
31 | # Environment
32 | conda create -n egor1 python=3.9
33 | conda activate egor1
34 | pip install -e .
35 | 
36 | # Training
37 | bash train_grpo.sh
38 | 
39 | # Inference
40 | bash utils/serve.sh
41 | python eval/infer.py --model_name_or_path Ego-R1/Ego-R1-Agent-3B
42 | ```
43 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/megatron/memory.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import torch
16 | 
17 | 
18 | class MemoryBuffer:
19 | 
20 |     def __init__(self, numel, numel_padded, dtype):
21 |         self.numel = numel
22 |         self.numel_padded = numel_padded
23 |         self.dtype = dtype
24 |         self.data = torch.zeros(self.numel_padded,
25 |                                 dtype=self.dtype,
26 |                                 device=torch.cuda.current_device(),
27 |                                 requires_grad=False)
28 | 
29 |     def zero(self):
30 |         """Reset the buffer to zero."""
31 |         self.data.zero_()
32 | 
33 |     def get(self, shape, start_index):
34 |         """Return a tensor with the input `shape` as a view into the
35 |         1-D data starting at `start_index`."""
36 |         end_index = start_index + shape.numel()
37 |         assert end_index <= self.numel, \
38 |             'requested tensor is out of the buffer range.'
39 |         buffer_tensor = self.data[start_index:end_index]
40 |         buffer_tensor = buffer_tensor.view(shape)
41 |         return buffer_tensor
42 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/model/test_base.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import pytest
18 | 
19 | from llamafactory.train.test_utils import compare_model, load_infer_model, load_reference_model, patch_valuehead_model
20 | 
21 | 
22 | TINY_LLAMA3 = os.getenv("TINY_LLAMA3", "llamafactory/tiny-random-Llama-3")
23 | 
24 | TINY_LLAMA_VALUEHEAD = os.getenv("TINY_LLAMA_VALUEHEAD", "llamafactory/tiny-random-Llama-3-valuehead")
25 | 
26 | INFER_ARGS = {
27 |     "model_name_or_path": TINY_LLAMA3,
28 |     "template": "llama3",
29 |     "infer_dtype": "float16",
30 | }
31 | 
32 | 
33 | @pytest.fixture
34 | def fix_valuehead_cpu_loading():  # function-scoped (pytest default): runs for each test that requests it
35 |     patch_valuehead_model()  # NOTE(review): presumably patches value-head loading for CPU runs — confirm in test_utils
36 | 
37 | 
38 | def test_base():
39 |     model = load_infer_model(**INFER_ARGS)
40 |     ref_model = load_reference_model(TINY_LLAMA3)
41 |     compare_model(model, ref_model)
42 | 
43 | 
44 | @pytest.mark.usefixtures("fix_valuehead_cpu_loading")
45 | def test_valuehead():
46 |     model = load_infer_model(add_valuehead=True, **INFER_ARGS)
47 |     ref_model = load_reference_model(TINY_LLAMA_VALUEHEAD, add_valuehead=True)
48 |     compare_model(model, ref_model)
49 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/model/model_utils/test_misc.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import pytest
18 | import torch
19 | from transformers import AutoConfig, AutoModelForCausalLM
20 | 
21 | from llamafactory.model.model_utils.misc import find_expanded_modules
22 | 
23 | 
24 | HF_TOKEN = os.getenv("HF_TOKEN")
25 | 
26 | 
27 | @pytest.mark.skipif(not HF_TOKEN, reason="Gated model.")
28 | def test_expanded_modules():  # skipped unless HF_TOKEN is set in the environment
29 |     config = AutoConfig.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
30 |     with torch.device("meta"):  # instantiate on the meta device, i.e. without materialising weights
31 |         model = AutoModelForCausalLM.from_config(config)
32 |     # Asking for 4 trainable layers and two projections must yield exactly these 8 names, in order.
33 |     expanded_modules = find_expanded_modules(model, ["q_proj", "v_proj"], num_layer_trainable=4)
34 |     assert expanded_modules == [
35 |         "model.layers.7.self_attn.q_proj",
36 |         "model.layers.7.self_attn.v_proj",
37 |         "model.layers.15.self_attn.q_proj",
38 |         "model.layers.15.self_attn.v_proj",
39 |         "model.layers.23.self_attn.q_proj",
40 |         "model.layers.23.self_attn.v_proj",
41 |         "model.layers.31.self_attn.q_proj",
42 |         "model.layers.31.self_attn.v_proj",
43 |     ]
44 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/model/model_utils/kv_cache.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from typing import TYPE_CHECKING
16 | 
17 | from ...extras import logging
18 | 
19 | 
20 | logger = logging.get_logger(__name__)
21 | 
22 | 
23 | if TYPE_CHECKING:
24 |     from transformers import PretrainedConfig
25 | 
26 |     from ...hparams import ModelArguments
27 | 
28 | 
29 | def configure_kv_cache(config: "PretrainedConfig", model_args: "ModelArguments", is_trainable: bool) -> None:
30 |     if not is_trainable:
31 |         setattr(config, "use_cache", model_args.use_cache)
32 |         if hasattr(config, "text_config"):
33 |             setattr(config.text_config, "use_cache", model_args.use_cache)
34 | 
35 |         if model_args.use_cache:
36 |             logger.info_rank0("KV cache is enabled for faster generation.")
37 |         else:
38 |             logger.info_rank0("KV cache is disabled.")
39 |     else:
40 |         setattr(config, "use_cache", False)
41 |         if hasattr(config, "text_config"):
42 |             setattr(config.text_config, "use_cache", False)
43 | 
44 |         logger.info_rank0("KV cache is disabled during training.")
45 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/model/model_utils/test_add_tokens.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import pytest
18 | 
19 | from llamafactory.hparams import ModelArguments
20 | from llamafactory.model import load_tokenizer
21 | 
22 | 
23 | TINY_LLAMA3 = os.getenv("TINY_LLAMA3", "llamafactory/tiny-random-Llama-3")
24 | 
25 | UNUSED_TOKEN = "<|UNUSED_TOKEN|>"
26 | 
27 | 
28 | @pytest.mark.parametrize("special_tokens", [False, True])
29 | def test_add_tokens(special_tokens: bool):
30 |     if special_tokens:
31 |         model_args = ModelArguments(model_name_or_path=TINY_LLAMA3, add_special_tokens=UNUSED_TOKEN)
32 |     else:
33 |         model_args = ModelArguments(model_name_or_path=TINY_LLAMA3, add_tokens=UNUSED_TOKEN)
34 | 
35 |     tokenizer = load_tokenizer(model_args)["tokenizer"]
36 |     encoded_ids = tokenizer.encode(UNUSED_TOKEN, add_special_tokens=False)
37 |     assert len(encoded_ids) == 1
38 |     decoded_str = tokenizer.decode(encoded_ids, skip_special_tokens=True)
39 |     if special_tokens:
40 |         assert decoded_str == ""
41 |     else:
42 |         assert decoded_str == UNUSED_TOKEN
43 | 
44 | 
45 | if __name__ == "__main__":  # lets this test file be executed directly as a script
46 |     pytest.main([__file__])  # run pytest on this file only
47 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/single_controller/base/megatron/worker.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | from dataclasses import dataclass
17 | from verl.single_controller.base.worker import Worker, DistRankInfo, DistGlobalInfo
18 | 
19 | 
20 | class MegatronWorker(Worker):
21 | 
22 |     def __init__(self, cuda_visible_devices=None) -> None:
23 |         super().__init__(cuda_visible_devices)
24 | 
25 |     def get_megatron_global_info(self):
26 |         from megatron.core import parallel_state as mpu
27 |         tp_size = mpu.get_tensor_model_parallel_world_size()
28 |         dp_size = mpu.get_data_parallel_world_size()
29 |         pp_size = mpu.get_pipeline_model_parallel_world_size()
30 |         info = DistGlobalInfo(tp_size=tp_size, dp_size=dp_size, pp_size=pp_size)
31 |         return info
32 | 
33 |     def get_megatron_rank_info(self):
34 |         from megatron.core import parallel_state as mpu
35 |         tp_rank = mpu.get_tensor_model_parallel_rank()
36 |         dp_rank = mpu.get_data_parallel_rank()
37 |         pp_rank = mpu.get_pipeline_model_parallel_rank()
38 |         info = DistRankInfo(tp_rank=tp_rank, dp_rank=dp_rank, pp_rank=pp_rank)
39 |         return info


--------------------------------------------------------------------------------
/api/visual_tools/egor1_vlm/vlm.py:
--------------------------------------------------------------------------------
 1 | from utils import *
 2 | 
 3 | def vlm(question: Annotated[str, "The question you want to use the vision language model to answer. Note: The question does not necessarily need to be the same as the question given by the user. You should propose a question based on the available observations."], timestamp: Annotated[str, "The timestamp of the video to answer the question. The format should be DAYX_HHMMSSFF (X is the day number, HHMMSS is the hour, minute, second, and FF is the frame number(00~19))"], identity: Annotated[str, "The identity of the person to answer the question. Identity comes from: A1_JAKE|A2_ALICE|A3_TASHA|A4_LUCIA|A5_KATRINA|A6_SHURE"],data_dir: Annotated[str, "The directory of all videos"] = "./EgoLife") -> dict:
 4 |     """
 5 |     Analyze a single image frame at the specified timestamp using a vision language model.
 6 |     Answers questions about visual scenes, events, and objects.
 7 |     Returns both the answer and image file metadata.
 8 |     
 9 |     FREQUENCY: 2/10    
10 |     COST: 2/5
11 |     TEMPORAL CAPABILITY: 1/5
12 |     VISUAL INPUT: True
13 |     
14 |     ## HINT
15 |     1. Ask targeted questions that align with your observation and reasoning process rather than repeating the user's original question.
16 |     """
17 |     
18 |     # Use OpenAI API to answer the question
19 |     os.makedirs("./cache", exist_ok=True)
20 |     frame_path, exact_match = locate_image_url(timestamp, identity=identity,data_dir=data_dir)
21 |     print(f"Frame path: {frame_path}")
22 |     image_client = GPT()
23 |     answer = image_client.chat(question, frame_path)
24 |     
25 |     response = {
26 |         "query_time": timestamp,
27 |         "question": question,
28 |         "answer": answer,
29 |         "exact_match": exact_match
30 |     }
31 |     return response


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/vllm/vllm_v_0_6_3/tokenizer.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | # Copyright 2023 The vLLM team.
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | # Adapted from https://github.com/vllm-project/vllm/blob/main/vllm/transformers_utils/tokenizer_group/tokenizer_group.py
15 | 
16 | from typing import Optional
17 | 
18 | from transformers import PreTrainedTokenizer
19 | from vllm.transformers_utils.tokenizer_group import TokenizerGroup
20 | from vllm.utils import LRUCache
21 | 
22 | 
23 | class TokenizerGroup(TokenizerGroup):
24 |     """A group of tokenizers that can be used for LoRA adapters."""
25 |     # NOTE: the imported vLLM base class shares this name; its __init__ is not called below.
26 |     def __init__(self, tokenizer: PreTrainedTokenizer, enable_lora: bool, max_num_seqs: int,
27 |                  max_input_length: Optional[int]):
28 |         self.enable_lora = enable_lora
29 |         self.max_input_length = max_input_length
30 |         self.tokenizer = tokenizer  # the tokenizer object passed in is stored as-is
31 |         self.lora_tokenizers = LRUCache[PreTrainedTokenizer](capacity=max_num_seqs) if enable_lora else None
32 |     # The LoRA tokenizer cache above exists only when enable_lora is true; otherwise it is None.
33 |     # FIXME(sgm): for simplicity, we assign the special token here
34 |     @property
35 |     def pad_token_id(self):
36 |         return self.tokenizer.pad_token_id  # delegated to the wrapped tokenizer
37 | 
38 |     @property
39 |     def eos_token_id(self):
40 |         return self.tokenizer.eos_token_id  # delegated to the wrapped tokenizer
41 | 


--------------------------------------------------------------------------------
/api/visual_tools/egor1_vlm/api.py:
--------------------------------------------------------------------------------
 1 | from fastapi import FastAPI, HTTPException
 2 | from pydantic import BaseModel
 3 | from typing import Optional
 4 | from vlm import vlm
 5 | import os
 6 | import yaml
 7 | 
 8 | def load_config():
 9 |     config_path = os.path.join(os.path.dirname(os.path.dirname(__file__)), 'configs.yaml')
10 |     with open(config_path, 'r') as f:
11 |         return yaml.safe_load(f)
12 | 
13 | # Load configuration once, at import time; a missing file or key makes the import fail.
14 | config = load_config()
15 | DATA_DIR = config['egolife']['vlm']['data_dir']  # passed to vlm() as data_dir
16 | VLM_PORT = config['egolife']['vlm']['vlm_port']  # port uvicorn binds when run as a script
17 | app = FastAPI(title="Vision Language Model API")
18 | 
19 | class VLMRequest(BaseModel):  # request body accepted by POST /vlm
20 |     question: str  # forwarded to vlm() as `question`
21 |     timestamp: str  # forwarded to vlm() as `timestamp`
22 |     identity: str  # forwarded to vlm() as `identity`
23 | 
24 | class VLMResponse(BaseModel):  # declared as response_model of POST /vlm
25 |     query_time: str  # filled from the dict returned by vlm()
26 |     question: str  # filled from the dict returned by vlm()
27 |     answer: str  # filled from the dict returned by vlm()
28 |     exact_match: bool  # filled from the dict returned by vlm()
29 | 
30 | @app.post("/vlm", response_model=VLMResponse)
31 | async def vlm_endpoint(request: VLMRequest):
32 |     """
33 |     Analyze a single image frame at the specified timestamp using a vision language model.
34 |     
35 |     Parameters:
36 |     - question: The question to ask about the image
37 |     - timestamp: The timestamp in format DAYX_HHMMSSFF (X is day number, HHMMSS is hour:minute:second, FF is frame number 00-19)
38 |     
39 |     Returns:
40 |     - query_time: The timestamp used
41 |     - question: The question asked
42 |     - answer: The model's response
43 |     - exact_match: Whether the image was found exactly
44 |     """
45 |     try:
46 |         result = vlm(question=request.question, timestamp=request.timestamp, identity=request.identity,data_dir=DATA_DIR)
47 |         return result
48 |     except Exception as e:
49 |         print(e)
50 |         raise HTTPException(status_code=500, detail=str(e))
51 | 
52 | if __name__ == "__main__":  # serve the app directly when this file is executed as a script
53 |     import uvicorn
54 |     uvicorn.run(app, host="0.0.0.0", port=VLM_PORT)  # 0.0.0.0 listens on all interfaces
55 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/README.md:
--------------------------------------------------------------------------------
 1 | # Models
 2 | Common model zoos such as huggingface/transformers struggle when using PyTorch-native model parallelism. Following the design principle of vLLM, we keep a simple, parallelizable, highly-optimized model implementation with packed inputs in verl. 
 3 | ## Adding a New Huggingface Model
 4 | ### Step 1: Copy the model file from HF to verl
 5 | - Add a new file under verl/models/hf
 6 | - Copy ONLY the model file from huggingface/transformers/models to verl/models/hf
 7 | 
 8 | ### Step 2: Modify the model file to use packed inputs
 9 | - Remove all the code related to inference (kv cache)
10 | - Modify the inputs to include only
11 |     - input_ids (total_nnz,)
12 |     - cu_seqlens (batch_size + 1,)
13 |     - max_seqlen_in_batch: int
14 | - Note that this requires using flash attention with causal mask.
15 | 
16 | ### Step 2.5: Add tests
17 | - Add a test to compare this version and the huggingface version
18 | - Follow the existing test infrastructure and add the tests to tests/models/hf
19 | 
20 | ### Step 3: Add a function to apply tensor parallelism
21 | - Please follow
22 |     - https://pytorch.org/docs/stable/distributed.tensor.parallel.html
23 |     - https://pytorch.org/tutorials/intermediate/TP_tutorial.html
24 | - General comments
25 |     - Tensor Parallelism in native Pytorch is NOT auto-parallelism. It works by using configs to specify how model parameters and inputs/outputs are resharded. These configs are then registered as hooks to perform input/output resharding before/after model forward.
26 | 
27 | ### Step 4: Add a function to apply data parallelism
28 | - Please use FSDP2 APIs
29 | - See demo here https://github.com/pytorch/torchtitan/blob/main/torchtitan/parallelisms/parallelize_llama.py#L413
30 | 
31 | ### Step 5: Add a function to apply pipeline parallelism
32 | - Comes in Pytorch 2.4
33 | - Currently only in alpha in nightly version
34 | - Check torchtitan for more details
35 | 
36 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/model/test_full.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import torch
18 | 
19 | from llamafactory.train.test_utils import load_infer_model, load_train_model
20 | 
21 | 
22 | TINY_LLAMA3 = os.getenv("TINY_LLAMA3", "llamafactory/tiny-random-Llama-3")
23 | 
24 | TRAIN_ARGS = {
25 |     "model_name_or_path": TINY_LLAMA3,
26 |     "stage": "sft",
27 |     "do_train": True,
28 |     "finetuning_type": "full",
29 |     "dataset": "llamafactory/tiny-supervised-dataset",
30 |     "dataset_dir": "ONLINE",
31 |     "template": "llama3",
32 |     "cutoff_len": 1024,
33 |     "output_dir": "dummy_dir",
34 |     "overwrite_output_dir": True,
35 |     "fp16": True,
36 | }
37 | 
38 | INFER_ARGS = {
39 |     "model_name_or_path": TINY_LLAMA3,
40 |     "finetuning_type": "full",
41 |     "template": "llama3",
42 |     "infer_dtype": "float16",
43 | }
44 | 
45 | 
46 | def test_full_train():
47 |     model = load_train_model(**TRAIN_ARGS)
48 |     for param in model.parameters():
49 |         assert param.requires_grad is True
50 |         assert param.dtype == torch.float32
51 | 
52 | 
53 | def test_full_inference():
54 |     model = load_infer_model(**INFER_ARGS)
55 |     for param in model.parameters():
56 |         assert param.requires_grad is False
57 |         assert param.dtype == torch.float16
58 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/py_functional.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | """
15 | Contain small python utility functions
16 | """
17 | 
18 | from typing import Dict
19 | from types import SimpleNamespace
20 | 
21 | 
22 | def union_two_dict(dict1: Dict, dict2: Dict):
23 |     """Union two dict. Will throw an error if there is an item not the same object with the same key.
24 | 
25 |     Args:
26 |         dict1:
27 |         dict2:
28 | 
29 |     Returns:
30 | 
31 |     """
32 |     for key, val in dict2.items():
33 |         if key in dict1:
34 |             assert dict2[key] == dict1[key], \
35 |                 f'{key} in meta_dict1 and meta_dict2 are not the same object'
36 |         dict1[key] = val
37 | 
38 |     return dict1
39 | 
40 | 
41 | def append_to_dict(data: Dict, new_data: Dict):
42 |     for key, val in new_data.items():
43 |         if key not in data:
44 |             data[key] = []
45 |         data[key].append(val)
46 | 
47 | 
48 | class NestedNamespace(SimpleNamespace):
49 | 
50 |     def __init__(self, dictionary, **kwargs):
51 |         super().__init__(**kwargs)
52 |         for key, value in dictionary.items():
53 |             if isinstance(value, dict):
54 |                 self.__setattr__(key, NestedNamespace(value))
55 |             else:
56 |                 self.__setattr__(key, value)
57 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/workers/reward_model/base.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | """
15 | The base class for reward model
16 | """
17 | 
18 | from abc import ABC, abstractmethod
19 | 
20 | from verl import DataProto
21 | 
22 | 
23 | class BasePPORewardModel(ABC):
24 |     """Abstract interface for PPO reward models; subclasses implement `compute_reward`."""
25 |     def __init__(self, config):
26 |         self.config = config
27 | 
28 |     @abstractmethod
29 |     def compute_reward(self, data: DataProto) -> DataProto:
30 |         """Compute rewards given input_ids. The transformer should output a tensor with shape
31 |            [batch_size, sequence_length], and the value at the [EOS] mask should be gathered.
32 | 
33 |         Args:
34 |             data: must contain keys "input_ids", "attention_mask" and "position_ids".
35 |                 - input_ids: [batch_size, sequence_length]
36 |                 - attention_mask: [batch_size, sequence_length]
37 |                 - position_ids: [batch_size, sequence_length]
38 | 
39 |         Returns: a data pass protocol containing "reward". Only the [EOS] position contains the reward.
40 |             Other positions should have zero reward. Note that this may change in the future if we use
41 |             dense reward, so the interface is left general.
42 |             - reward: [batch_size, sequence_length].
43 | 
44 |         """
45 |         pass
46 | 


--------------------------------------------------------------------------------
/api/visual_tools/videomme_vlm/api.py:
--------------------------------------------------------------------------------
 1 | from fastapi import FastAPI, HTTPException
 2 | from pydantic import BaseModel
 3 | from typing import Optional
 4 | from vlm import vlm
 5 | import os
 6 | import yaml
 7 | def load_config():
 8 |     config_path = os.path.join(os.path.dirname(os.path.dirname(__file__)), 'configs.yaml')
 9 |     with open(config_path, 'r') as f:
10 |         return yaml.safe_load(f)
11 | 
12 | # Load configuration once, at import time; a missing file or key makes the import fail.
13 | config = load_config()
14 | DATA_DIR = config['videomme']['vlm']['data_dir']  # root that each request's vid_id is appended to
15 | VLM_PORT = config['videomme']['vlm']['vlm_port']  # port uvicorn binds when run as a script
16 | app = FastAPI(title="Vision Language Model API")
17 | 
18 | class VLMRequest(BaseModel):  # request body accepted by POST /vlm
19 |     question: str  # forwarded to vlm() as `question`
20 |     timestamp: str  # forwarded to vlm() as `timestamp`
21 |     vid_id:str  # appended to DATA_DIR to form the data_dir passed to vlm()
22 | 
23 | class VLMResponse(BaseModel):  # declared as response_model of POST /vlm
24 |     query_time: str  # filled from the dict returned by vlm()
25 |     question: str  # filled from the dict returned by vlm()
26 |     answer: str  # filled from the dict returned by vlm()
27 |     exact_match: bool  # filled from the dict returned by vlm()
28 | 
29 | @app.post("/vlm", response_model=VLMResponse)
30 | async def vlm_endpoint(request: VLMRequest):
31 |     """
32 |     Analyze a single image frame at the specified timestamp using a vision language model.
33 |     
34 |     Parameters:
35 |     - question: The question to ask about the image
36 |     - timestamp: The timestamp in format DAYX_HHMMSSFF (X is day number, HHMMSS is hour:minute:second, FF is frame number 00-19)
37 |     
38 |     Returns:
39 |     - query_time: The timestamp used
40 |     - question: The question asked
41 |     - answer: The model's response
42 |     - exact_match: Whether the image was found exactly
43 |     
44 |     """
45 |     print(request)
46 |     try:
47 |         data_dir = f"{DATA_DIR}/{request.vid_id}"
48 |         result = vlm(question=request.question, timestamp=request.timestamp, data_dir=data_dir)
49 |         return result
50 |     except Exception as e:
51 |         print(e)
52 |         raise HTTPException(status_code=500, detail=str(e))
53 | 
54 | if __name__ == "__main__":  # serve the app directly when this file is executed as a script
55 |     import uvicorn
56 |     uvicorn.run(app, host="0.0.0.0", port=VLM_PORT)  # 0.0.0.0 listens on all interfaces
57 | 


--------------------------------------------------------------------------------
/api/visual_tools/egoschema_vlm/api.py:
--------------------------------------------------------------------------------
 1 | from fastapi import FastAPI, HTTPException
 2 | from pydantic import BaseModel
 3 | from typing import Optional
 4 | from vlm import vlm
 5 | import os
 6 | import yaml
 7 | def load_config():
 8 |     config_path = os.path.join(os.path.dirname(os.path.dirname(__file__)), 'configs.yaml')
 9 |     with open(config_path, 'r') as f:
10 |         return yaml.safe_load(f)
11 | 
12 | # Load configuration once, at import time; a missing file or key makes the import fail.
13 | config = load_config()
14 | DATA_DIR = config['egoschema']['vlm']['data_dir']  # root that each request's vid_id is appended to
15 | VLM_PORT = config['egoschema']['vlm']['vlm_port']  # port uvicorn binds when run as a script
16 | app = FastAPI(title="Vision Language Model API")
17 | 
18 | class VLMRequest(BaseModel):  # request body accepted by POST /vlm
19 |     question: str  # forwarded to vlm() as `question`
20 |     timestamp: str  # forwarded to vlm() as `timestamp`
21 |     vid_id:str  # appended to DATA_DIR to form the data_dir passed to vlm()
22 | 
23 | class VLMResponse(BaseModel):  # declared as response_model of POST /vlm
24 |     query_time: str  # filled from the dict returned by vlm()
25 |     question: str  # filled from the dict returned by vlm()
26 |     answer: str  # filled from the dict returned by vlm()
27 |     exact_match: bool  # filled from the dict returned by vlm()
28 | 
@app.post("/vlm", response_model=VLMResponse)
async def vlm_endpoint(request: VLMRequest):
    """
    Answer a question about the single image frame found at a timestamp.

    Request fields:
    - question: The question to ask about the image
    - timestamp: The timestamp in format DAYX_HHMMSSFF (X is day number, HHMMSS is hour:minute:second, FF is frame number 00-19)
    - vid_id: Name appended to the configured data directory to select the data to search

    Response fields:
    - query_time: The timestamp used
    - question: The question asked
    - answer: The model's response
    - exact_match: Whether the image was found exactly

    Any exception raised while answering is printed and reported as HTTP 500
    with the exception text as the detail.
    """
    print(request)
    try:
        video_dir = f"{DATA_DIR}/{request.vid_id}"
        return vlm(
            question=request.question,
            timestamp=request.timestamp,
            data_dir=video_dir,
        )
    except Exception as exc:
        print(exc)
        raise HTTPException(status_code=500, detail=str(exc))
53 | 
# Script entry point: serve the FastAPI `app` with uvicorn when this file is run directly.
if __name__ == "__main__":
    # Imported lazily so uvicorn is only required when running as a script.
    import uvicorn
    # host "0.0.0.0" listens on every network interface; the port comes from configs.yaml.
    uvicorn.run(app, host="0.0.0.0", port=VLM_PORT)
57 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/eval/infer_bench_summ.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | export VIDEO_LLM_URL=http://127.0.0.1:7060/video_llm
 4 | export VLM_URL=http://127.0.0.1:7090/vlm
 5 | 
 6 | datetime=$(date +%Y%m%d_%H%M%S)
 7 | max_turns=7
 8 | # Create log directory if it doesn't exist
 9 | mkdir -p infer_logs
10 | 
11 | model_name_or_path=sieufgsb9dv77w-94r/qwen25-3b-it-sft4500-len8192-rl-bs4-gs145
12 | # sieufgsb9dv77w-94r/qwen25-3b-it-sft4500-len8192-rl-bs4-gs145
13 | # 184 have some issues
14 | CUDA_VISIBLE_DEVICES=0 PYTHONPATH=. python eval/infer_bench_summ.py \
15 |     --bench_name video-mme-long \
16 |     --max_turns ${max_turns} \
17 |     --data_start 620 \
18 |     --data_end -1 \
19 |     --model_name_or_path ${model_name_or_path} \
20 |     --dataset ./benchmarks/video-mme-long.parquet \
21 |     | tee infer_logs/log_video-mme-long_summ_mt${max_turns}-${datetime}_s620-e-1.log 2>&1
22 | 
23 | # CUDA_VISIBLE_DEVICES=1 PYTHONPATH=. python eval/infer_bench_summ.py \
24 | #     --bench_name video-mme-long \
25 | #     --max_turns ${max_turns} \
26 | #     --data_start 765 \
27 | #     --data_end 810 \
28 | #     --dataset ./benchmarks/video-mme-long.parquet \
29 | #     | tee infer_logs/log_video-mme-long_summ_mt${max_turns}-${datetime}_s765-e810.log 2>&1 &
30 | 
31 | # CUDA_VISIBLE_DEVICES=2 PYTHONPATH=. python eval/infer_bench_summ.py \
32 | #     --bench_name video-mme-long \
33 | #     --max_turns ${max_turns} \
34 | #     --data_start 810 \
35 | #     --data_end 855 \
36 | #     --dataset ./benchmarks/video-mme-long.parquet \
37 | #     | tee infer_logs/log_video-mme-long_summ_mt${max_turns}-${datetime}_s810-e855.log 2>&1 &
38 | 
39 | # CUDA_VISIBLE_DEVICES=3 PYTHONPATH=. python eval/infer_bench_summ.py \
40 | #     --bench_name video-mme-long \
41 | #     --max_turns ${max_turns} \
42 | #     --data_start 855 \
43 | #     --data_end 900 \
44 | #     --dataset ./benchmarks/video-mme-long.parquet \
45 | #     | tee infer_logs/log_video-mme-long_summ_mt${max_turns}-${datetime}_s855-e900.log 2>&1 &
46 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/webui/css.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
# Stylesheet kept as a raw string. This module lives under webui/, so it is
# presumably handed to the web UI at construction time (verify at the call site).
# NOTE(review): for .modal-box, `top/left: 50%` combined with
# `translate(-50%, -50%)` centers the box on both axes, not only horizontally
# as the inline CSS comment says.
CSS = r"""
.duplicate-button {
  margin: auto !important;
  color: white !important;
  background: black !important;
  border-radius: 100vh !important;
}

.thinking-summary {
  padding: 8px !important;
}

.thinking-summary span {
  border-radius: 4px !important;
  padding: 4px !important;
  cursor: pointer !important;
  font-size: 14px !important;
  background: rgb(245, 245, 245) !important;
}

.dark .thinking-summary span {
  background: rgb(73, 73, 73) !important;
}

.thinking-container {
  border-left: 2px solid #a6a6a6 !important;
  padding-left: 10px !important;
  margin: 4px 0 !important;
}

.thinking-container p {
  color: #a6a6a6 !important;
}

.modal-box {
  position: fixed !important;
  top: 50%;
  left: 50%;
  transform: translate(-50%, -50%); /* center horizontally */
  max-width: 1000px;
  max-height: 750px;
  overflow-y: auto;
  background-color: var(--input-background-fill);
  flex-wrap: nowrap !important;
  border: 2px solid black !important;
  z-index: 1000;
  padding: 10px;
}

.dark .modal-box {
  border: 2px solid white !important;
}
"""
68 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/vllm/__init__.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from importlib.metadata import version, PackageNotFoundError
16 | 
17 | 
def get_version(pkg):
    """Return the installed version string of distribution ``pkg``.

    Returns ``None`` instead of raising when the distribution is not installed.
    """
    try:
        installed = version(pkg)
    except PackageNotFoundError:
        installed = None
    return installed
23 | 
24 | 
# Distribution whose installed version selects the vendored adapter below.
package_name = 'vllm'
package_version = get_version(package_name)

# Pick the adapter sub-package that matches the installed vllm release exactly.
# Every branch binds the same names: vllm_version, LLM, LLMEngine, parallel_state.
if package_version == '0.3.1':
    vllm_version = '0.3.1'
    from .vllm_v_0_3_1.llm import LLM
    from .vllm_v_0_3_1.llm import LLMEngine
    from .vllm_v_0_3_1 import parallel_state
elif package_version == '0.4.2':
    vllm_version = '0.4.2'
    from .vllm_v_0_4_2.llm import LLM
    from .vllm_v_0_4_2.llm import LLMEngine
    from .vllm_v_0_4_2 import parallel_state
elif package_version == '0.5.4':
    vllm_version = '0.5.4'
    from .vllm_v_0_5_4.llm import LLM
    from .vllm_v_0_5_4.llm import LLMEngine
    from .vllm_v_0_5_4 import parallel_state
elif package_version == '0.6.3':
    vllm_version = '0.6.3'
    from .vllm_v_0_6_3.llm import LLM
    from .vllm_v_0_6_3.llm import LLMEngine
    from .vllm_v_0_6_3 import parallel_state
else:
    # Also reached when vllm is not installed: get_version() returns None then,
    # so the message reads "vllm version None not supported".
    raise ValueError(
        f'vllm version {package_version} not supported. Currently supported versions are 0.3.1, 0.4.2, 0.5.4 and 0.6.3.'
    )
52 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/vllm/vllm_v_0_6_3/hf_weight_loader.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | # Copyright 2023 The vLLM team.
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | # Adapted from https://github.com/vllm-project/vllm/tree/main/vllm/model_executor/model_loader
15 | 
16 | from typing import Dict
17 | 
18 | import torch.nn as nn
19 | from vllm.model_executor.model_loader.utils import set_default_torch_dtype
20 | 
21 | 
def update_hf_weight_loader():
    """No-op hook: only prints that there is nothing to update."""
    print("no hf weight loader need to be updated")
25 | 
26 | 
def load_hf_weights(actor_weights: Dict, vllm_model: nn.Module):
    """Load a name -> tensor mapping into ``vllm_model`` and move the model to CUDA.

    Args:
        actor_weights: Weights to load. Mutated in place: ``"lm_head.weight"``
            is deleted when the model config ties word embeddings.
        vllm_model: Model exposing ``load_weights`` and ``config``.
    """
    assert isinstance(actor_weights, Dict)
    model_dtype = next(vllm_model.parameters()).dtype
    with set_default_torch_dtype(model_dtype):  # TODO
        tied_embeddings = vllm_model.config.tie_word_embeddings
        if tied_embeddings and "lm_head.weight" in actor_weights:
            del actor_weights["lm_head.weight"]
        vllm_model.load_weights(actor_weights.items())

    # Run the post-load hooks of every sub-module.
    for _name, submodule in vllm_model.named_modules():
        method = getattr(submodule, "quant_method", None)
        if method is not None:
            method.process_weights_after_loading(submodule)
        # FIXME: Remove this after Mixtral is updated
        # to use quant_method.
        if hasattr(submodule, "process_weights_after_loading"):
            submodule.process_weights_after_loading()

    vllm_model.cuda()
42 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/src/llamafactory/train/rm/metric.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | from dataclasses import dataclass
16 | from typing import TYPE_CHECKING, Optional
17 | 
18 | import numpy as np
19 | 
20 | from ...extras.misc import numpify
21 | 
22 | 
23 | if TYPE_CHECKING:
24 |     from transformers import EvalPrediction
25 | 
26 | 
@dataclass
class ComputeAccuracy:
    r"""Accumulate pairwise reward accuracy across calls; supports `batch_eval_metrics`."""

    def _dump(self) -> Optional[dict[str, float]]:
        r"""Return the mean of each accumulated metric (None on first use) and reset the buffers."""
        averaged = None
        if hasattr(self, "score_dict"):
            averaged = {name: float(np.mean(values)) for name, values in self.score_dict.items()}

        self.score_dict = {"accuracy": []}
        return averaged

    def __post_init__(self):
        # The first dump only creates the empty buffers.
        self._dump()

    def __call__(self, eval_preds: "EvalPrediction", compute_result: bool = True) -> Optional[dict[str, float]]:
        r"""Record `chosen > rejected` for one batch; return the averages when `compute_result` is set."""
        chosen_scores = numpify(eval_preds.predictions[0])
        rejected_scores = numpify(eval_preds.predictions[1])
        hits = self.score_dict["accuracy"]
        if chosen_scores.shape:
            for idx in range(len(chosen_scores)):
                hits.append(chosen_scores[idx] > rejected_scores[idx])
        else:
            # An empty shape means a single score pair rather than a batch.
            hits.append(chosen_scores > rejected_scores)

        if not compute_result:
            return None

        return self._dump()
52 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/model/model_utils/test_attention.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | import pytest
18 | from transformers.utils import is_flash_attn_2_available, is_torch_sdpa_available
19 | 
20 | from llamafactory.extras.packages import is_transformers_version_greater_than
21 | from llamafactory.train.test_utils import load_infer_model
22 | 
23 | 
# Model id used by the test; can be overridden through the TINY_LLAMA3 environment variable.
TINY_LLAMA3 = os.getenv("TINY_LLAMA3", "llamafactory/tiny-random-Llama-3")

# Keyword arguments forwarded to load_infer_model() by test_attention().
INFER_ARGS = {
    "model_name_or_path": TINY_LLAMA3,
    "template": "llama3",
}
30 | 
31 | 
@pytest.mark.xfail(is_transformers_version_greater_than("4.48"), reason="Attention refactor.")
def test_attention():
    """Check that each available `flash_attn` setting yields the expected Llama attention class."""
    expected_class = {
        "disabled": "LlamaAttention",
        "sdpa": "LlamaSdpaAttention",
        "fa2": "LlamaFlashAttention2",
    }

    # "disabled" is always exercised; the other backends only when available.
    backends = ["disabled"]
    if is_torch_sdpa_available():
        backends.append("sdpa")

    if is_flash_attn_2_available():
        backends.append("fa2")

    for backend in backends:
        model = load_infer_model(flash_attn=backend, **INFER_ARGS)
        for module in model.modules():
            class_name = module.__class__.__name__
            if "Attention" in class_name:
                assert class_name == expected_class[backend]
51 | 


--------------------------------------------------------------------------------
/api/visual_tools/egor1_videollm_llava/video_llm.py:
--------------------------------------------------------------------------------
 1 | # videollm.py
 2 | from google import genai
 3 | from typing_extensions import Annotated
 4 | import time
 5 | import os
 6 | import ffmpeg
 7 | from utils import locate_videos, config_videos
 8 | import contextlib
 9 | import requests
10 | 
11 | 
12 | 
@contextlib.contextmanager
def override_cache_dir(new_cache_dir: str):
    """Temporarily override the CACHE_DIR environment variable.

    On exit the previous state is restored exactly: the old value is put back,
    or the variable is removed again if it was not set before entry.

    Args:
        new_cache_dir: Value assigned to ``CACHE_DIR`` inside the ``with`` body.
    """
    old_cache_dir = os.environ.get("CACHE_DIR")
    os.environ["CACHE_DIR"] = new_cache_dir
    try:
        yield
    finally:
        if old_cache_dir is not None:
            os.environ["CACHE_DIR"] = old_cache_dir
        else:
            # The variable did not exist before: drop it so the override does
            # not leak past the context.
            os.environ.pop("CACHE_DIR", None)
23 | 
def video_llm_with_client(question: str, range_: str, identity: str, cache_dir: str, gemini_api_key: str, data_dir: str) -> dict:
    """Forward to ``video_llm``, passing ``range_`` as its ``range`` argument.

    ``gemini_api_key`` is accepted but not used by this function.
    """
    forwarded = {
        "question": question,
        "range": range_,
        "identity": identity,
        "cache_dir": cache_dir,
        "data_dir": data_dir,
    }
    return video_llm(**forwarded)
26 | 
def video_llm(question: str, range: str, identity: str, cache_dir: str, data_dir: str) -> dict:
    """Ask the local video inference service a question about a time range.

    The range is split into start and end, the matching videos are located and
    combined through ``locate_videos`` / ``config_videos``, and the combined
    video path is posted together with the question to the inference server.

    Args:
        question: Prompt sent to the inference service.
        range: Time range as ``START-END`` (``DAYX_HHMMSSFF-DAYX_HHMMSSFF``).
        identity: Forwarded to ``locate_videos``.
        cache_dir: Forwarded to ``locate_videos`` and ``config_videos``.
        data_dir: Forwarded to ``locate_videos``.

    Returns:
        Dict with ``query_time``, ``question``, ``answer``, ``exact_match`` and
        ``length``.

    Raises:
        ValueError: If ``range`` is not exactly two parts separated by ``-``.
        requests.HTTPError: If the inference service answers with an error status.
    """
    try:
        start_time, end_time = range.split("-")
    except (ValueError, AttributeError) as exc:
        # Only malformed input is translated. A bare ``except`` would also
        # swallow KeyboardInterrupt/SystemExit.
        raise ValueError("Invalid range format. Use DAYX_HHMMSSFF-DAYX_HHMMSSFF.") from exc

    file_paths, exact_match = locate_videos(start_time, end_time, identity=identity, cache_dir=cache_dir, data_dir=data_dir)
    combined_video, length = config_videos(file_paths, start_time, end_time, cache_dir=cache_dir)

    url = "http://localhost:8000/video/infer"
    pay_load = {
        "video_path": combined_video,
        "prompt": question,
        "max_frames": 64,
        "frame_step": 1
    }

    response = requests.post(url, json=pay_load)
    # Surface HTTP failures directly instead of a confusing KeyError or JSON
    # decoding error further down.
    response.raise_for_status()
    # Decode the body once and reuse it for both the log line and the result.
    answer = response.json()['response']

    print(answer)

    return {
        "query_time": range,
        "question": question,
        "answer": answer,
        "exact_match": exact_match,
        "length": length
    }
58 | 
59 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/.gitignore:
--------------------------------------------------------------------------------
  1 | **/*.pt
  2 | **/checkpoints
  3 | verl_checkpoints
  4 | **/wget-log
  5 | **/_build/
  6 | **/*.ckpt
  7 | **/outputs
  8 | **/*.tar.gz
  9 | **/playground
 10 | **/wandb
 11 | 
 12 | # Byte-compiled / optimized / DLL files
 13 | __pycache__/
 14 | *.py[cod]
 15 | *$py.class
 16 | dataset/*
 17 | tensorflow/my_graph/*
 18 | .idea/
 19 | # C extensions
 20 | *.so
 21 | data
 22 | sft/output/*
 23 | sft/data/*
 24 | 
 25 | # Distribution / packaging
 26 | .Python
 27 | build/
 28 | develop-eggs/
 29 | dist/
 30 | downloads/
 31 | eggs/
 32 | .eggs/
 33 | lib/
 34 | lib64/
 35 | parts/
 36 | sdist/
 37 | var/
 38 | *.egg-info/
 39 | .installed.cfg
 40 | *.egg
 41 | 
 42 | # PyInstaller
 43 | #  Usually these files are written by a python script from a template
 44 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 45 | *.manifest
 46 | *.spec
 47 | 
 48 | # Installer logs
 49 | pip-log.txt
 50 | pip-delete-this-directory.txt
 51 | 
 52 | # Unit test / coverage reports
 53 | htmlcov/
 54 | .tox/
 55 | .coverage
 56 | .coverage.*
 57 | .cache
 58 | nosetests.xml
 59 | coverage.xml
 60 | *,cover
 61 | .hypothesis/
 62 | 
 63 | # Translations
 64 | *.mo
 65 | *.pot
 66 | 
 67 | # Django stuff:
 68 | *.log
 69 | local_settings.py
 70 | 
 71 | image_outputs
 72 | 
 73 | checkpoints
 74 | 
 75 | # Flask stuff:
 76 | instance/
 77 | .webassets-cache
 78 | 
 79 | # Scrapy stuff:
 80 | .scrapy
 81 | 
 82 | # Sphinx documentation
 83 | docs/_build/
 84 | 
 85 | # PyBuilder
 86 | target/
 87 | 
 88 | # IPython Notebook
 89 | .ipynb_checkpoints
 90 | 
 91 | # pyenv
 92 | .python-version
 93 | 
 94 | # celery beat schedule file
 95 | celerybeat-schedule
 96 | 
 97 | 
 98 | # virtualenv
 99 | venv/
100 | ENV/
101 | 
102 | # Spyder project settings
103 | .spyderproject
104 | 
105 | # Rope project settings
106 | .ropeproject
107 | 
108 | # vscode
109 | .vscode
110 | 
111 | # Mac
112 | .DS_Store
113 | 
114 | # output logs
115 | tests/e2e/toy_examples/deepspeed/synchronous/output.txt
116 | 
117 | # vim
118 | *.swp
119 | 
120 | # log*
121 | log/
122 | 
123 | **logs


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/utils/megatron/sequence_parallel.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | # Copyright (c) 2024, NVIDIA CORPORATION. All rights reserved.
 3 | #
 4 | # Licensed under the Apache License, Version 2.0 (the "License");
 5 | # you may not use this file except in compliance with the License.
 6 | # You may obtain a copy of the License at
 7 | #
 8 | #     http://www.apache.org/licenses/LICENSE-2.0
 9 | #
10 | # Unless required by applicable law or agreed to in writing, software
11 | # distributed under the License is distributed on an "AS IS" BASIS,
12 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 | # See the License for the specific language governing permissions and
14 | # limitations under the License.
15 | 
16 | import torch
17 | import torch.nn.functional as F
18 | from megatron.core import parallel_state as mpu
19 | 
20 | 
def mark_parameter_as_sequence_parallel(parameter):
    """Tag ``parameter`` by setting its ``sequence_parallel`` attribute to ``True``."""
    parameter.sequence_parallel = True
23 | 
24 | 
def is_sequence_parallel_param(param):
    """Return the ``sequence_parallel`` attribute of ``param``, or ``False`` when it has none."""
    return getattr(param, 'sequence_parallel', False)
27 | 
28 | 
def pad_to_sequence_parallel(unpad_tokens: torch.Tensor):
    """pad the tokens such that the total length is a multiple of sp world size

    Padding is appended at the end of the first dimension. The sequence-parallel
    world size is taken from the tensor-model-parallel world size.

    Args:
        unpad_tokens: (total_nnz, ...). Tokens after removing padding

    Returns:
        The input unchanged when ``total_nnz`` is already a multiple of the
        world size, otherwise a padded tensor whose first dimension is the next
        multiple.

    Raises:
        NotImplementedError: If padding is required and the tensor is neither
            1-D nor 2-D.
    """
    total_nnz = unpad_tokens.shape[0]
    sp_world_size = mpu.get_tensor_model_parallel_world_size()

    # Distance to the next multiple of sp_world_size; 0 when already aligned.
    pad_size = (-total_nnz) % sp_world_size

    if pad_size > 0:
        if unpad_tokens.ndim == 1:
            unpad_tokens = F.pad(unpad_tokens, (0, pad_size))
        elif unpad_tokens.ndim == 2:
            # F.pad lists pads from the last dimension backwards: leave the last
            # dimension alone and extend only the end of dimension 0.
            unpad_tokens = F.pad(unpad_tokens, (0, 0, 0, pad_size))
        else:
            # ``ndim`` is an int attribute. Calling it raised TypeError and hid
            # the intended NotImplementedError.
            raise NotImplementedError(f'Padding dim {unpad_tokens.ndim} is not supported')

    return unpad_tokens
55 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/models/llama/megatron/layers/parallel_rmsnorm.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import numbers
16 | import torch
17 | from megatron.core import ModelParallelConfig
18 | from torch import nn
19 | from transformers import LlamaConfig
20 | 
21 | from apex.normalization.fused_layer_norm import fused_rms_norm_affine
22 | from verl.utils.megatron import sequence_parallel as sp_utils
23 | 
24 | 
class ParallelLlamaRMSNorm(nn.Module):
    """RMS normalisation layer that delegates to apex's ``fused_rms_norm_affine``."""

    def __init__(self, config: LlamaConfig, megatron_config: ModelParallelConfig):
        """
        LlamaRMSNorm is equivalent to T5LayerNorm

        Args:
            config: Supplies ``hidden_size`` (normalised shape) and
                ``rms_norm_eps`` (epsilon).
            megatron_config: When ``sequence_parallel`` is set, the weight is
                marked as a sequence-parallel parameter.
        """
        super().__init__()
        if isinstance(config.hidden_size, numbers.Integral):
            normalized_shape = (config.hidden_size,)
        else:
            # A non-integer hidden_size used to leave normalized_shape unbound
            # (UnboundLocalError). Pass it through and let torch.Size validate it.
            normalized_shape = config.hidden_size
        self.normalized_shape = torch.Size(normalized_shape)
        self.weight = nn.Parameter(torch.ones(self.normalized_shape))
        self.variance_epsilon = config.rms_norm_eps

        if megatron_config.sequence_parallel:
            sp_utils.mark_parameter_as_sequence_parallel(self.weight)

    def forward(self, hidden_states):
        """Apply the fused affine RMS norm to ``hidden_states`` using this layer's weight and epsilon."""
        return fused_rms_norm_affine(input=hidden_states,
                                     weight=self.weight,
                                     normalized_shape=self.normalized_shape,
                                     eps=self.variance_epsilon,
                                     memory_efficient=True)


--------------------------------------------------------------------------------
/LLaMA-Factory/tests/data/test_loader.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 the LlamaFactory team.
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | import os
16 | 
17 | from llamafactory.train.test_utils import load_dataset_module
18 | 
19 | 
# Identifiers used by the tests; each can be overridden through the environment
# variable of the same name.
DEMO_DATA = os.getenv("DEMO_DATA", "llamafactory/demo_data")

TINY_LLAMA3 = os.getenv("TINY_LLAMA3", "llamafactory/tiny-random-Llama-3")

TINY_DATA = os.getenv("TINY_DATA", "llamafactory/tiny-supervised-dataset")

# Baseline keyword arguments passed to load_dataset_module() by every test below;
# individual tests add val_size / eval_dataset on top.
TRAIN_ARGS = {
    "model_name_or_path": TINY_LLAMA3,
    "stage": "sft",
    "do_train": True,
    "finetuning_type": "full",
    "template": "llama3",
    "dataset": TINY_DATA,
    "dataset_dir": "ONLINE",
    "cutoff_len": 8192,
    "output_dir": "dummy_dir",
    "overwrite_output_dir": True,
    "fp16": True,
}
39 | 
40 | 
def test_load_train_only():
    """With the baseline arguments only a train split is produced."""
    module = load_dataset_module(**TRAIN_ARGS)
    train_split = module.get("train_dataset")
    eval_split = module.get("eval_dataset")
    assert train_split is not None
    assert eval_split is None
45 | 
46 | 
def test_load_val_size():
    """Passing ``val_size`` yields both a train and an eval split."""
    module = load_dataset_module(val_size=0.1, **TRAIN_ARGS)
    train_split = module.get("train_dataset")
    eval_split = module.get("eval_dataset")
    assert train_split is not None
    assert eval_split is not None
51 | 
52 | 
def test_load_eval_data():
    """Passing an explicit ``eval_dataset`` yields both a train and an eval split."""
    module = load_dataset_module(eval_dataset=TINY_DATA, **TRAIN_ARGS)
    train_split = module.get("train_dataset")
    eval_split = module.get("eval_dataset")
    assert train_split is not None
    assert eval_split is not None
57 | 


--------------------------------------------------------------------------------
/LLaMA-Factory/scripts/stat_utils/cal_flops.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2025 Microsoft Corporation and the LlamaFactory team.
 2 | #
 3 | # This code is inspired by the Microsoft's DeepSpeed library.
 4 | # https://www.deepspeed.ai/tutorials/flops-profiler/
 5 | #
 6 | # Licensed under the Apache License, Version 2.0 (the "License");
 7 | # you may not use this file except in compliance with the License.
 8 | # You may obtain a copy of the License at
 9 | #
10 | #     http://www.apache.org/licenses/LICENSE-2.0
11 | #
12 | # Unless required by applicable law or agreed to in writing, software
13 | # distributed under the License is distributed on an "AS IS" BASIS,
14 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15 | # See the License for the specific language governing permissions and
16 | # limitations under the License.
17 | 
18 | import fire
19 | import torch
20 | from deepspeed.accelerator import get_accelerator  # type: ignore
21 | from deepspeed.profiling.flops_profiler import get_model_profile  # type: ignore
22 | 
23 | from llamafactory.chat import ChatModel
24 | 
25 | 
def calculate_flops(
    model_name_or_path: str,
    batch_size: int = 1,
    seq_length: int = 512,
    flash_attn: str = "auto",
):
    r"""Calculate the flops of pre-trained models.

    Usage: python cal_flops.py --model_name_or_path path_to_model --batch_size 1 --seq_length 512
    """
    model_args = {
        "model_name_or_path": model_name_or_path,
        "template": "empty",
        "flash_attn": flash_attn,
    }
    with get_accelerator().device(0):
        chat_model = ChatModel(model_args)
        model = chat_model.engine.model
        # All-ones token ids act as a dummy batch; the same ids are used as labels.
        fake_input = torch.ones((batch_size, seq_length), dtype=torch.long, device=model.device)
        profile_kwargs = {"input_ids": fake_input, "labels": fake_input.clone()}
        flops, macs, params = get_model_profile(model, kwargs=profile_kwargs, print_profile=True, detailed=True)
        print("FLOPs:", flops)
        print("MACs:", macs)
        print("Params:", params)
46 | 
47 | 
# Script entry point: expose calculate_flops() as a command-line interface via python-fire.
if __name__ == "__main__":
    fire.Fire(calculate_flops)
50 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/verl/third_party/vllm/vllm_v_0_5_4/hf_weight_loader.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | # Copyright 2023 The vLLM team.
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | # Adapted from https://github.com/vllm-project/vllm/tree/main/vllm/model_executor/models
15 | 
16 | from typing import Dict, Union, Optional, Iterable, Tuple
17 | 
18 | import torch
19 | import torch.nn as nn
20 | 
21 | from vllm.model_executor.model_loader.utils import set_default_torch_dtype
22 | from vllm.model_executor.model_loader.weight_utils import default_weight_loader
23 | 
24 | 
def update_hf_weight_loader():
    """No-op hook: only prints that there is nothing to update."""
    print('no hf weight loader need to be updated')
28 | 
29 | 
def load_hf_weights(actor_weights: Dict, vllm_model: nn.Module):
    """Load a name -> tensor mapping into ``vllm_model`` and move the model to CUDA.

    Args:
        actor_weights: Weights to load. Mutated in place: ``"lm_head.weight"``
            is deleted when the model config ties word embeddings.
        vllm_model: Model exposing ``load_weights`` and ``config``.
    """
    assert isinstance(actor_weights, Dict)
    model_dtype = next(vllm_model.parameters()).dtype
    with set_default_torch_dtype(model_dtype):  # TODO
        tied_embeddings = vllm_model.config.tie_word_embeddings
        if tied_embeddings and "lm_head.weight" in actor_weights:
            del actor_weights["lm_head.weight"]
        vllm_model.load_weights(actor_weights.items())

    # Run the post-load hooks of every sub-module.
    for _name, submodule in vllm_model.named_modules():
        method = getattr(submodule, "quant_method", None)
        if method is not None:
            method.process_weights_after_loading(submodule)
        # FIXME: Remove this after Mixtral is updated
        # to use quant_method.
        if hasattr(submodule, "process_weights_after_loading"):
            submodule.process_weights_after_loading()

    vllm_model.cuda()
45 | 


--------------------------------------------------------------------------------
/Ego-R1-Agent/setup.py:
--------------------------------------------------------------------------------
 1 | # Copyright 2024 Bytedance Ltd. and/or its affiliates
 2 | #
 3 | # Licensed under the Apache License, Version 2.0 (the "License");
 4 | # you may not use this file except in compliance with the License.
 5 | # You may obtain a copy of the License at
 6 | #
 7 | #     http://www.apache.org/licenses/LICENSE-2.0
 8 | #
 9 | # Unless required by applicable law or agreed to in writing, software
10 | # distributed under the License is distributed on an "AS IS" BASIS,
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 | # See the License for the specific language governing permissions and
13 | # limitations under the License.
14 | 
15 | # setup.py is the fallback installation script when pyproject.toml does not work
16 | from setuptools import setup, find_packages
17 | import os
18 | 
# Directory containing this setup.py. Every auxiliary file is resolved against
# it, so the build works regardless of the current working directory.
version_folder = os.path.dirname(os.path.abspath(__file__))

with open(os.path.join(version_folder, 'verl/version/version')) as f:
    __version__ = f.read().strip()


# Keep every requirement line except blanks and comments. Blank lines used to
# crash with IndexError because of the unconditional ``[0]`` lookup.
with open(os.path.join(version_folder, 'requirements.txt')) as f:
    required = f.read().splitlines()
    install_requires = [
        item.strip() for item in required
        if item.strip() and not item.strip().startswith('#')
    ]

extras_require = {
    'test': ['pytest', 'yapf']
}

from pathlib import Path
this_directory = Path(__file__).parent
# Explicit encoding: the platform default may not be UTF-8.
long_description = (this_directory / "README.md").read_text(encoding='utf-8')

setup(
    name='verl',
    version=__version__,
    package_dir={'': '.'},
    packages=find_packages(where='.'),
    url='https://github.com/volcengine/verl',
    license='Apache 2.0',
    author='Bytedance - Seed - MLSys',
    author_email='zhangchi.usc1992@bytedance.com, gmsheng@connect.hku.hk',
    description='veRL: Volcano Engine Reinforcement Learning for LLM',
    install_requires=install_requires,
    extras_require=extras_require,
    package_data={'': ['version/*'],
                  'verl': ['trainer/config/*.yaml'],},
    include_package_data=True,
    long_description=long_description,
    long_description_content_type='text/markdown'
)


--------------------------------------------------------------------------------