├── .gitignore ├── .pre-commit-config.yaml ├── ADORA ├── ADORA.sh ├── Notice.txt ├── README.md ├── data │ └── kk │ │ └── instruct │ │ ├── 3ppl │ │ ├── test.parquet │ │ └── train.parquet │ │ ├── 4ppl │ │ ├── test.parquet │ │ └── train.parquet │ │ ├── 5ppl │ │ ├── test.parquet │ │ └── train.parquet │ │ ├── 6ppl │ │ ├── test.parquet │ │ └── train.parquet │ │ └── 7ppl │ │ ├── test.parquet │ │ └── train.parquet ├── docker │ ├── Dockerfile.ngc.vllm │ └── Dockerfile.vemlp.vllm.te ├── docs │ ├── Makefile │ ├── README.md │ ├── _static │ │ └── logo.png │ ├── advance │ │ ├── dpo_extension.rst │ │ ├── fsdp_extension.rst │ │ ├── megatron_extension.rst │ │ └── placement.rst │ ├── conf.py │ ├── examples │ │ ├── config.rst │ │ ├── gsm8k_example.rst │ │ └── ppo_code_architecture.rst │ ├── experiment │ │ └── ppo.rst │ ├── faq │ │ └── faq.rst │ ├── index.rst │ ├── preparation │ │ ├── prepare_data.rst │ │ └── reward_function.rst │ ├── requirements-docs.txt │ ├── start │ │ ├── install.rst │ │ └── quickstart.rst │ └── workers │ │ ├── fsdp_workers.rst │ │ ├── megatron_workers.rst │ │ └── ray_trainer.rst ├── eval_kk │ ├── compute_score.py │ ├── eval.sh │ ├── kk_processor.py │ ├── kk_prompt.py │ └── main_eval_instruct.py ├── examples │ ├── data_preprocess │ │ ├── arth.py │ │ ├── countdown.py │ │ ├── full_hh_rlhf.py │ │ ├── gsm8k.py │ │ ├── hellaswag.py │ │ ├── kk.py │ │ ├── math_dataset.py │ │ └── multiply.py │ ├── generation │ │ └── run_deepseek_v2_lite_math.sh │ ├── grpo_trainer │ │ ├── run_deepseek7b_llm.sh │ │ ├── run_deepseek7b_llm_seq_balance.sh │ │ ├── run_qwen2-7b.sh │ │ └── run_qwen2-7b_seq_balance.sh │ ├── ppo_trainer │ │ ├── run_deepseek7b_llm.sh │ │ ├── run_deepseek7b_llm_sp2.sh │ │ ├── run_deepseek_full_hh_rlhf.sh │ │ ├── run_deepseek_math_gsm8k_megatron.sh │ │ ├── run_deepseek_megatron.sh │ │ ├── run_gemma.sh │ │ ├── run_qwen2-7b.sh │ │ ├── run_qwen2-7b_rm.sh │ │ ├── run_qwen2-7b_rm_seq_balance.sh │ │ ├── run_qwen2-7b_seq_balance.sh │ │ ├── run_qwen2.5-32b.sh │ │ └── verl_getting_started.ipynb │ ├── ray │ │ └── tutorial.ipynb │ ├── sft │ │ └── gsm8k │ │ │ ├── run_deepseek_6b7.sh │ │ │ ├── run_gemma_2b.sh │ │ │ └── run_gemma_7b.sh │ └── split_placement │ │ ├── README.md │ │ ├── config │ │ └── ppo_trainer_split.yaml │ │ ├── main_ppo_split.py │ │ ├── run_deepseek7b_llm.sh │ │ └── split_monkey_patch.py ├── math_eval │ ├── aime_2021_2024.jsonl │ ├── amc.jsonl │ ├── auto_test_aime.sh │ ├── test_aime.py │ ├── test_aime.sh │ ├── test_amc.py │ └── test_amc.sh ├── patches │ └── megatron_v4.patch ├── pyproject.toml ├── requirements.txt ├── scripts │ ├── curriculum.sh │ ├── format.sh │ ├── train_grpo_4gpu_7Binstruct.sh │ ├── train_ppo_3B_4gpu.sh │ ├── train_ppo_7B_4gpu.sh │ └── train_reinforce_plus_4gpu_7Binstruct.sh ├── setup.py ├── tests │ ├── __init__.py │ ├── e2e │ │ ├── __init__.py │ │ ├── arithmetic_sequence │ │ │ ├── data │ │ │ │ ├── create_dataset.py │ │ │ │ ├── test.parquet │ │ │ │ └── train.parquet │ │ │ ├── model │ │ │ │ ├── config.json │ │ │ │ ├── create_model_tokenizer.py │ │ │ │ ├── generation_config.json │ │ │ │ ├── model.safetensors │ │ │ │ └── tokenizer_config.json │ │ │ └── rl │ │ │ │ ├── README.md │ │ │ │ ├── config │ │ │ │ └── ray_trainer.yaml │ │ │ │ └── main_trainer.py │ │ ├── check_results.py │ │ ├── envs │ │ │ ├── __init__.py │ │ │ └── digit_completion │ │ │ │ ├── __init__.py │ │ │ │ ├── task.py │ │ │ │ └── tokenizer.py │ │ ├── run_qwen_gsm8k_function_rm.sh │ │ ├── run_qwen_gsm8k_function_rm_no_rmpad.sh │ │ ├── run_qwen_gsm8k_model_rm.sh │ │ ├── run_qwen_gsm8k_model_rm_no_rmpad.sh │ │ ├── run_qwen_gsm8k_model_rm_seq_balance.sh │ │ ├── run_qwen_gsm8k_model_rm_ulysses.sh │ │ ├── run_ray_trainer.sh │ │ └── run_ray_trainer_rmpad.sh │ ├── gpu_utility │ │ ├── test_memory_buffers.py │ │ ├── test_ops.py │ │ └── test_torch_functional.py │ ├── model │ │ ├── test_transformer.py │ │ └── test_transformers_ulysses.py │ ├── ray │ │ ├── check_worker_alive │ │ │ └── main.py │ │ ├── detached_worker │ │ │ ├── README.md │ │ │ ├── client.py │ │ │ ├── run.sh │ │ │ └── server.py │ │ ├── test_check_worker_alive.py │ │ ├── test_colocated_workers.py │ │ ├── test_data_transfer.py │ │ ├── test_driverfunc_to_worker.py │ │ ├── test_high_level_scheduling_api.py │ │ ├── test_ray_local_envs.py │ │ ├── test_rvdz.py │ │ ├── test_worker_group_basics.py │ │ └── test_worker_group_torch.py │ ├── rollout │ │ ├── run_fsdp_vllm.py │ │ └── test_vllm_hf_loader.py │ ├── sanity │ │ ├── check_license.py │ │ └── test_import.py │ ├── utility │ │ └── test_tensor_dict_utilities.py │ └── verl │ │ └── utils │ │ └── dataset │ │ ├── test_rl_dataset.py │ │ ├── test_rm_dataset.py │ │ └── test_sft_dataset.py └── verl │ ├── __init__.py │ ├── models │ ├── README.md │ ├── __init__.py │ ├── llama │ │ ├── __init__.py │ │ └── megatron │ │ │ ├── __init__.py │ │ │ ├── checkpoint_utils │ │ │ ├── __init__.py │ │ │ ├── llama_loader.py │ │ │ └── llama_saver.py │ │ │ ├── layers │ │ │ ├── __init__.py │ │ │ ├── parallel_attention.py │ │ │ ├── parallel_decoder.py │ │ │ ├── parallel_linear.py │ │ │ ├── parallel_mlp.py │ │ │ └── parallel_rmsnorm.py │ │ │ └── modeling_llama_megatron.py │ ├── registry.py │ ├── transformers │ │ ├── __init__.py │ │ ├── llama.py │ │ ├── monkey_patch.py │ │ └── qwen2.py │ └── weight_loader_registry.py │ ├── protocol.py │ ├── single_controller │ ├── __init__.py │ ├── base │ │ ├── __init__.py │ │ ├── decorator.py │ │ ├── megatron │ │ │ ├── __init__.py │ │ │ ├── worker.py │ │ │ └── worker_group.py │ │ ├── register_center │ │ │ ├── __init__.py │ │ │ └── ray.py │ │ ├── worker.py │ │ └── worker_group.py │ ├── ray │ │ ├── __init__.py │ │ ├── base.py │ │ └── megatron.py │ └── version │ │ └── version │ ├── third_party │ ├── __init__.py │ └── vllm │ │ ├── __init__.py │ │ ├── vllm_v_0_3_1 │ │ ├── __init__.py │ │ ├── arg_utils.py │ │ ├── config.py │ │ ├── llm.py │ │ ├── llm_engine_sp.py │ │ ├── model_loader.py │ │ ├── model_runner.py │ │ ├── parallel_state.py │ │ ├── tokenizer.py │ │ ├── weight_loaders.py │ │ └── worker.py │ │ ├── vllm_v_0_4_2 │ │ ├── __init__.py │ │ ├── arg_utils.py │ │ ├── config.py │ │ ├── dtensor_weight_loaders.py │ │ ├── hf_weight_loader.py │ │ ├── llm.py │ │ ├── llm_engine_sp.py │ │ ├── megatron_weight_loaders.py │ │ ├── model_loader.py │ │ ├── model_runner.py │ │ ├── parallel_state.py │ │ ├── spmd_gpu_executor.py │ │ ├── tokenizer.py │ │ └── worker.py │ │ ├── vllm_v_0_5_4 │ │ ├── __init__.py │ │ ├── arg_utils.py │ │ ├── config.py │ │ ├── dtensor_weight_loaders.py │ │ ├── hf_weight_loader.py │ │ ├── llm.py │ │ ├── llm_engine_sp.py │ │ ├── megatron_weight_loaders.py │ │ ├── model_loader.py │ │ ├── model_runner.py │ │ ├── parallel_state.py │ │ ├── spmd_gpu_executor.py │ │ ├── tokenizer.py │ │ └── worker.py │ │ └── vllm_v_0_6_3 │ │ ├── __init__.py │ │ ├── arg_utils.py │ │ ├── config.py │ │ ├── dtensor_weight_loaders.py │ │ ├── hf_weight_loader.py │ │ ├── llm.py │ │ ├── llm_engine_sp.py │ │ ├── megatron_weight_loaders.py │ │ ├── model_loader.py │ │ ├── model_runner.py │ │ ├── parallel_state.py │ │ ├── spmd_gpu_executor.py │ │ ├── tokenizer.py │ │ └── worker.py │ ├── trainer │ ├── __init__.py │ ├── config │ │ ├── evaluation.yaml │ │ ├── generation.yaml │ │ ├── ppo_megatron_trainer.yaml │ │ ├── ppo_trainer.yaml │ │ └── sft_trainer.yaml │ ├── fsdp_sft_trainer.py │ ├── main_eval.py │ ├── main_generation.py │ ├── main_ppo.py │ ├── ppo │ │ ├── __init__.py │ │ ├── core_algos.py │ │ └── ray_trainer.py │ └── runtime_env.yaml │ ├── utils │ ├── __init__.py │ ├── config.py │ ├── dataset │ │ ├── README.md │ │ ├── __init__.py │ │ ├── rl_dataset.py │ │ ├── rm_dataset.py │ │ └── sft_dataset.py │ ├── debug │ │ ├── __init__.py │ │ ├── performance.py │ │ └── trajectory_tracker.py │ ├── distributed.py │ ├── flops_counter.py │ ├── fs.py │ ├── fsdp_utils.py │ ├── hdfs_io.py │ ├── import_utils.py │ ├── logger │ │ ├── __init__.py │ │ └── aggregate_logger.py │ ├── logging_utils.py │ ├── megatron │ │ ├── __init__.py │ │ ├── memory.py │ │ ├── optimizer.py │ │ ├── optimizer_config.py │ │ ├── pipeline_parallel.py │ │ ├── sequence_parallel.py │ │ └── tensor_parallel.py │ ├── megatron_utils.py │ ├── memory_buffer.py │ ├── model.py │ ├── py_functional.py │ ├── ray_utils.py │ ├── rendezvous │ │ ├── __init__.py │ │ └── ray_backend.py │ ├── reward_score │ │ ├── __init__.py │ │ ├── countdown.py │ │ ├── gsm8k.py │ │ ├── kk.py │ │ ├── math.py │ │ └── multiply.py │ ├── seqlen_balancing.py │ ├── tokenizer.py │ ├── torch_dtypes.py │ ├── torch_functional.py │ ├── tracking.py │ └── ulysses.py │ ├── version │ └── version │ └── workers │ ├── __init__.py │ ├── actor │ ├── __init__.py │ ├── base.py │ ├── dp_actor.py │ └── megatron_actor.py │ ├── critic │ ├── __init__.py │ ├── base.py │ ├── dp_critic.py │ └── megatron_critic.py │ ├── fsdp_workers.py │ ├── megatron_workers.py │ ├── reward_model │ ├── __init__.py │ ├── base.py │ └── megatron │ │ ├── __init__.py │ │ └── reward_model.py │ ├── rollout │ ├── __init__.py │ ├── base.py │ ├── hf_rollout.py │ ├── naive │ │ ├── __init__.py │ │ └── naive_rollout.py │ ├── tokenizer.py │ └── vllm_rollout │ │ ├── __init__.py │ │ └── vllm_rollout.py │ └── sharding_manager │ ├── __init__.py │ ├── base.py │ ├── fsdp_ulysses.py │ ├── fsdp_vllm.py │ └── megatron_vllm.py ├── ADORA_VL ├── README.md ├── dockerfile │ ├── Dockerfile │ └── docker-entrypoint.sh ├── docs │ ├── logo.png │ ├── math_results.xlsx │ ├── ppo_examples.md │ └── ray_architecture.png ├── examples │ └── scripts │ │ ├── docker_run.sh │ │ ├── nvidia_docker_install.sh │ │ ├── qwen25vl_7b_geo3k_adora.sh │ │ ├── reward_func.py │ │ ├── reward_func_format_iou.py │ │ └── reward_func_math.py ├── openrlhf │ ├── __init__.py │ ├── cli │ │ ├── __init__.py │ │ ├── lora_combiner.py │ │ └── train_ppo_ray_vl.py │ ├── datasets │ │ ├── __init__.py │ │ ├── prompts_dataset_vl.py │ │ ├── reward_dataset_vl.py │ │ ├── sft_dataset_vl.py │ │ └── utils.py │ ├── models │ │ ├── __init__.py │ │ ├── actor_vl.py │ │ ├── loss.py │ │ ├── model_vl.py │ │ ├── ring_attn_utils.py │ │ └── utils.py │ ├── trainer │ │ ├── __init__.py │ │ ├── ppo_trainer_vl.py │ │ ├── ppo_utils │ │ │ ├── __init__.py │ │ │ ├── experience_maker_vl.py │ │ │ ├── kl_controller.py │ │ │ └── replay_buffer_vl.py │ │ └── ray │ │ │ ├── __init__.py │ │ │ ├── launcher_vl.py │ │ │ ├── ppo_actor_vl.py │ │ │ ├── ppo_critic_vl.py │ │ │ ├── utils.py │ │ │ ├── vllm_engine.py │ │ │ └── vllm_worker_wrap.py │ └── utils │ │ ├── __init__.py │ │ ├── deepspeed │ │ ├── __init__.py │ │ ├── deepspeed.py │ │ └── deepspeed_utils.py │ │ ├── distributed_sampler.py │ │ ├── distributed_util.py │ │ ├── intern_vl │ │ ├── __init__.py │ │ ├── image_processing_intern_vl.py │ │ └── processing_intern_vl.py │ │ ├── logging_utils.py │ │ ├── processor.py │ │ ├── remote_rm_utils.py │ │ ├── rl_logging_board │ │ ├── config.toml │ │ ├── rl_logging_board.py │ │ └── start.sh │ │ └── utils.py ├── pyproject.toml ├── requirements.txt ├── setup.py └── version.txt ├── CONTRIBUTING.md ├── LICENSE ├── README.md └── docs ├── adora.png └── adora_vl.png /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/.gitignore -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /ADORA/ADORA.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/ADORA.sh -------------------------------------------------------------------------------- /ADORA/Notice.txt: -------------------------------------------------------------------------------- 1 | Copyright 2023-2024 Bytedance Ltd. and/or its affiliates -------------------------------------------------------------------------------- /ADORA/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/README.md -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/3ppl/test.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/3ppl/test.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/3ppl/train.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/3ppl/train.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/4ppl/test.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/4ppl/test.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/4ppl/train.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/4ppl/train.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/5ppl/test.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/5ppl/test.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/5ppl/train.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/5ppl/train.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/6ppl/test.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/6ppl/test.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/6ppl/train.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/6ppl/train.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/7ppl/test.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/7ppl/test.parquet -------------------------------------------------------------------------------- /ADORA/data/kk/instruct/7ppl/train.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/data/kk/instruct/7ppl/train.parquet -------------------------------------------------------------------------------- /ADORA/docker/Dockerfile.ngc.vllm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docker/Dockerfile.ngc.vllm -------------------------------------------------------------------------------- /ADORA/docker/Dockerfile.vemlp.vllm.te: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docker/Dockerfile.vemlp.vllm.te -------------------------------------------------------------------------------- /ADORA/docs/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/Makefile -------------------------------------------------------------------------------- /ADORA/docs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/README.md -------------------------------------------------------------------------------- /ADORA/docs/_static/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/_static/logo.png -------------------------------------------------------------------------------- /ADORA/docs/advance/dpo_extension.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/advance/dpo_extension.rst -------------------------------------------------------------------------------- /ADORA/docs/advance/fsdp_extension.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/advance/fsdp_extension.rst -------------------------------------------------------------------------------- /ADORA/docs/advance/megatron_extension.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/advance/megatron_extension.rst -------------------------------------------------------------------------------- /ADORA/docs/advance/placement.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/advance/placement.rst -------------------------------------------------------------------------------- /ADORA/docs/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/conf.py -------------------------------------------------------------------------------- /ADORA/docs/examples/config.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/examples/config.rst -------------------------------------------------------------------------------- /ADORA/docs/examples/gsm8k_example.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/examples/gsm8k_example.rst -------------------------------------------------------------------------------- /ADORA/docs/examples/ppo_code_architecture.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/examples/ppo_code_architecture.rst -------------------------------------------------------------------------------- /ADORA/docs/experiment/ppo.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/experiment/ppo.rst -------------------------------------------------------------------------------- /ADORA/docs/faq/faq.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/faq/faq.rst -------------------------------------------------------------------------------- /ADORA/docs/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/index.rst -------------------------------------------------------------------------------- /ADORA/docs/preparation/prepare_data.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/preparation/prepare_data.rst -------------------------------------------------------------------------------- /ADORA/docs/preparation/reward_function.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/preparation/reward_function.rst -------------------------------------------------------------------------------- /ADORA/docs/requirements-docs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/requirements-docs.txt -------------------------------------------------------------------------------- /ADORA/docs/start/install.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/start/install.rst -------------------------------------------------------------------------------- /ADORA/docs/start/quickstart.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/start/quickstart.rst -------------------------------------------------------------------------------- /ADORA/docs/workers/fsdp_workers.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/workers/fsdp_workers.rst -------------------------------------------------------------------------------- /ADORA/docs/workers/megatron_workers.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/workers/megatron_workers.rst -------------------------------------------------------------------------------- /ADORA/docs/workers/ray_trainer.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/docs/workers/ray_trainer.rst -------------------------------------------------------------------------------- /ADORA/eval_kk/compute_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/eval_kk/compute_score.py -------------------------------------------------------------------------------- /ADORA/eval_kk/eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/eval_kk/eval.sh -------------------------------------------------------------------------------- /ADORA/eval_kk/kk_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/eval_kk/kk_processor.py -------------------------------------------------------------------------------- /ADORA/eval_kk/kk_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/eval_kk/kk_prompt.py -------------------------------------------------------------------------------- /ADORA/eval_kk/main_eval_instruct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/eval_kk/main_eval_instruct.py -------------------------------------------------------------------------------- /ADORA/examples/data_preprocess/arth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/data_preprocess/arth.py -------------------------------------------------------------------------------- /ADORA/examples/data_preprocess/countdown.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/data_preprocess/countdown.py -------------------------------------------------------------------------------- /ADORA/examples/data_preprocess/full_hh_rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/data_preprocess/full_hh_rlhf.py -------------------------------------------------------------------------------- /ADORA/examples/data_preprocess/gsm8k.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/data_preprocess/gsm8k.py -------------------------------------------------------------------------------- /ADORA/examples/data_preprocess/hellaswag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/data_preprocess/hellaswag.py -------------------------------------------------------------------------------- /ADORA/examples/data_preprocess/kk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/data_preprocess/kk.py -------------------------------------------------------------------------------- /ADORA/examples/data_preprocess/math_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/data_preprocess/math_dataset.py -------------------------------------------------------------------------------- /ADORA/examples/data_preprocess/multiply.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/data_preprocess/multiply.py -------------------------------------------------------------------------------- /ADORA/examples/generation/run_deepseek_v2_lite_math.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/generation/run_deepseek_v2_lite_math.sh -------------------------------------------------------------------------------- /ADORA/examples/grpo_trainer/run_deepseek7b_llm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/grpo_trainer/run_deepseek7b_llm.sh -------------------------------------------------------------------------------- /ADORA/examples/grpo_trainer/run_deepseek7b_llm_seq_balance.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/grpo_trainer/run_deepseek7b_llm_seq_balance.sh -------------------------------------------------------------------------------- /ADORA/examples/grpo_trainer/run_qwen2-7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/grpo_trainer/run_qwen2-7b.sh -------------------------------------------------------------------------------- /ADORA/examples/grpo_trainer/run_qwen2-7b_seq_balance.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/grpo_trainer/run_qwen2-7b_seq_balance.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_deepseek7b_llm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_deepseek7b_llm.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_deepseek7b_llm_sp2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_deepseek7b_llm_sp2.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_deepseek_full_hh_rlhf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_deepseek_full_hh_rlhf.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_deepseek_math_gsm8k_megatron.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_deepseek_math_gsm8k_megatron.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_deepseek_megatron.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_deepseek_megatron.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_gemma.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_gemma.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_qwen2-7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_qwen2-7b.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_qwen2-7b_rm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_qwen2-7b_rm.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_qwen2-7b_rm_seq_balance.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_qwen2-7b_rm_seq_balance.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_qwen2-7b_seq_balance.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_qwen2-7b_seq_balance.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/run_qwen2.5-32b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/run_qwen2.5-32b.sh -------------------------------------------------------------------------------- /ADORA/examples/ppo_trainer/verl_getting_started.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ppo_trainer/verl_getting_started.ipynb -------------------------------------------------------------------------------- /ADORA/examples/ray/tutorial.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/ray/tutorial.ipynb -------------------------------------------------------------------------------- /ADORA/examples/sft/gsm8k/run_deepseek_6b7.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/sft/gsm8k/run_deepseek_6b7.sh -------------------------------------------------------------------------------- /ADORA/examples/sft/gsm8k/run_gemma_2b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/sft/gsm8k/run_gemma_2b.sh -------------------------------------------------------------------------------- /ADORA/examples/sft/gsm8k/run_gemma_7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/sft/gsm8k/run_gemma_7b.sh -------------------------------------------------------------------------------- /ADORA/examples/split_placement/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/split_placement/README.md -------------------------------------------------------------------------------- /ADORA/examples/split_placement/config/ppo_trainer_split.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/split_placement/config/ppo_trainer_split.yaml -------------------------------------------------------------------------------- /ADORA/examples/split_placement/main_ppo_split.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/split_placement/main_ppo_split.py -------------------------------------------------------------------------------- /ADORA/examples/split_placement/run_deepseek7b_llm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/split_placement/run_deepseek7b_llm.sh -------------------------------------------------------------------------------- /ADORA/examples/split_placement/split_monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/examples/split_placement/split_monkey_patch.py -------------------------------------------------------------------------------- /ADORA/math_eval/aime_2021_2024.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/math_eval/aime_2021_2024.jsonl -------------------------------------------------------------------------------- /ADORA/math_eval/amc.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/math_eval/amc.jsonl -------------------------------------------------------------------------------- /ADORA/math_eval/auto_test_aime.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/math_eval/auto_test_aime.sh -------------------------------------------------------------------------------- /ADORA/math_eval/test_aime.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/math_eval/test_aime.py -------------------------------------------------------------------------------- /ADORA/math_eval/test_aime.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/math_eval/test_aime.sh -------------------------------------------------------------------------------- /ADORA/math_eval/test_amc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/math_eval/test_amc.py -------------------------------------------------------------------------------- /ADORA/math_eval/test_amc.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/math_eval/test_amc.sh -------------------------------------------------------------------------------- /ADORA/patches/megatron_v4.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/patches/megatron_v4.patch -------------------------------------------------------------------------------- /ADORA/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/pyproject.toml -------------------------------------------------------------------------------- /ADORA/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/requirements.txt -------------------------------------------------------------------------------- /ADORA/scripts/curriculum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/scripts/curriculum.sh -------------------------------------------------------------------------------- /ADORA/scripts/format.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/scripts/format.sh -------------------------------------------------------------------------------- /ADORA/scripts/train_grpo_4gpu_7Binstruct.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/scripts/train_grpo_4gpu_7Binstruct.sh -------------------------------------------------------------------------------- /ADORA/scripts/train_ppo_3B_4gpu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/scripts/train_ppo_3B_4gpu.sh -------------------------------------------------------------------------------- /ADORA/scripts/train_ppo_7B_4gpu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/scripts/train_ppo_7B_4gpu.sh -------------------------------------------------------------------------------- /ADORA/scripts/train_reinforce_plus_4gpu_7Binstruct.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/scripts/train_reinforce_plus_4gpu_7Binstruct.sh -------------------------------------------------------------------------------- /ADORA/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/setup.py -------------------------------------------------------------------------------- /ADORA/tests/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/__init__.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/__init__.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/data/create_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/data/create_dataset.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/data/test.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/data/test.parquet -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/data/train.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/data/train.parquet -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/model/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/model/config.json -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/model/create_model_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/model/create_model_tokenizer.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/model/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/model/generation_config.json -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/model/model.safetensors: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/model/model.safetensors -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/model/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/model/tokenizer_config.json -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/rl/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/rl/README.md -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/rl/config/ray_trainer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/rl/config/ray_trainer.yaml -------------------------------------------------------------------------------- /ADORA/tests/e2e/arithmetic_sequence/rl/main_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/arithmetic_sequence/rl/main_trainer.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/check_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/check_results.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/envs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/envs/__init__.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/envs/digit_completion/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/envs/digit_completion/__init__.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/envs/digit_completion/task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/envs/digit_completion/task.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/envs/digit_completion/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/envs/digit_completion/tokenizer.py -------------------------------------------------------------------------------- /ADORA/tests/e2e/run_qwen_gsm8k_function_rm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/run_qwen_gsm8k_function_rm.sh -------------------------------------------------------------------------------- /ADORA/tests/e2e/run_qwen_gsm8k_function_rm_no_rmpad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/run_qwen_gsm8k_function_rm_no_rmpad.sh -------------------------------------------------------------------------------- /ADORA/tests/e2e/run_qwen_gsm8k_model_rm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/run_qwen_gsm8k_model_rm.sh -------------------------------------------------------------------------------- /ADORA/tests/e2e/run_qwen_gsm8k_model_rm_no_rmpad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/run_qwen_gsm8k_model_rm_no_rmpad.sh -------------------------------------------------------------------------------- /ADORA/tests/e2e/run_qwen_gsm8k_model_rm_seq_balance.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/run_qwen_gsm8k_model_rm_seq_balance.sh -------------------------------------------------------------------------------- /ADORA/tests/e2e/run_qwen_gsm8k_model_rm_ulysses.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/run_qwen_gsm8k_model_rm_ulysses.sh -------------------------------------------------------------------------------- /ADORA/tests/e2e/run_ray_trainer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/run_ray_trainer.sh -------------------------------------------------------------------------------- /ADORA/tests/e2e/run_ray_trainer_rmpad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/e2e/run_ray_trainer_rmpad.sh -------------------------------------------------------------------------------- /ADORA/tests/gpu_utility/test_memory_buffers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/gpu_utility/test_memory_buffers.py -------------------------------------------------------------------------------- /ADORA/tests/gpu_utility/test_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/gpu_utility/test_ops.py -------------------------------------------------------------------------------- /ADORA/tests/gpu_utility/test_torch_functional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/gpu_utility/test_torch_functional.py -------------------------------------------------------------------------------- /ADORA/tests/model/test_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/model/test_transformer.py -------------------------------------------------------------------------------- /ADORA/tests/model/test_transformers_ulysses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/model/test_transformers_ulysses.py -------------------------------------------------------------------------------- /ADORA/tests/ray/check_worker_alive/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/check_worker_alive/main.py -------------------------------------------------------------------------------- /ADORA/tests/ray/detached_worker/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/detached_worker/README.md -------------------------------------------------------------------------------- /ADORA/tests/ray/detached_worker/client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/detached_worker/client.py -------------------------------------------------------------------------------- /ADORA/tests/ray/detached_worker/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/detached_worker/run.sh -------------------------------------------------------------------------------- /ADORA/tests/ray/detached_worker/server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/detached_worker/server.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_check_worker_alive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_check_worker_alive.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_colocated_workers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_colocated_workers.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_data_transfer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_data_transfer.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_driverfunc_to_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_driverfunc_to_worker.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_high_level_scheduling_api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_high_level_scheduling_api.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_ray_local_envs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_ray_local_envs.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_rvdz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_rvdz.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_worker_group_basics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_worker_group_basics.py -------------------------------------------------------------------------------- /ADORA/tests/ray/test_worker_group_torch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/ray/test_worker_group_torch.py -------------------------------------------------------------------------------- /ADORA/tests/rollout/run_fsdp_vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/rollout/run_fsdp_vllm.py -------------------------------------------------------------------------------- /ADORA/tests/rollout/test_vllm_hf_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/rollout/test_vllm_hf_loader.py -------------------------------------------------------------------------------- /ADORA/tests/sanity/check_license.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/sanity/check_license.py -------------------------------------------------------------------------------- /ADORA/tests/sanity/test_import.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/sanity/test_import.py -------------------------------------------------------------------------------- /ADORA/tests/utility/test_tensor_dict_utilities.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/utility/test_tensor_dict_utilities.py -------------------------------------------------------------------------------- /ADORA/tests/verl/utils/dataset/test_rl_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/verl/utils/dataset/test_rl_dataset.py -------------------------------------------------------------------------------- /ADORA/tests/verl/utils/dataset/test_rm_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/verl/utils/dataset/test_rm_dataset.py -------------------------------------------------------------------------------- /ADORA/tests/verl/utils/dataset/test_sft_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/tests/verl/utils/dataset/test_sft_dataset.py -------------------------------------------------------------------------------- /ADORA/verl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/models/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/README.md -------------------------------------------------------------------------------- /ADORA/verl/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/checkpoint_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/checkpoint_utils/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/checkpoint_utils/llama_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/checkpoint_utils/llama_loader.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/checkpoint_utils/llama_saver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/checkpoint_utils/llama_saver.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/layers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/layers/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/layers/parallel_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/layers/parallel_attention.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/layers/parallel_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/layers/parallel_decoder.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/layers/parallel_linear.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/layers/parallel_linear.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/layers/parallel_mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/layers/parallel_mlp.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/layers/parallel_rmsnorm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/layers/parallel_rmsnorm.py -------------------------------------------------------------------------------- /ADORA/verl/models/llama/megatron/modeling_llama_megatron.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/llama/megatron/modeling_llama_megatron.py -------------------------------------------------------------------------------- /ADORA/verl/models/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/registry.py -------------------------------------------------------------------------------- /ADORA/verl/models/transformers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/transformers/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/models/transformers/llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/transformers/llama.py -------------------------------------------------------------------------------- /ADORA/verl/models/transformers/monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/transformers/monkey_patch.py -------------------------------------------------------------------------------- /ADORA/verl/models/transformers/qwen2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/transformers/qwen2.py -------------------------------------------------------------------------------- /ADORA/verl/models/weight_loader_registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/models/weight_loader_registry.py -------------------------------------------------------------------------------- /ADORA/verl/protocol.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/protocol.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/decorator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/decorator.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/megatron/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/megatron/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/megatron/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/megatron/worker.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/megatron/worker_group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/megatron/worker_group.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/register_center/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/register_center/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/register_center/ray.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/register_center/ray.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/worker.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/base/worker_group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/base/worker_group.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/ray/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/ray/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/ray/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/ray/base.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/ray/megatron.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/single_controller/ray/megatron.py -------------------------------------------------------------------------------- /ADORA/verl/single_controller/version/version: -------------------------------------------------------------------------------- 1 | 0.0.2 -------------------------------------------------------------------------------- /ADORA/verl/third_party/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/arg_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/arg_utils.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/config.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/llm.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/llm_engine_sp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/llm_engine_sp.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/model_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/model_loader.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/model_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/model_runner.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/parallel_state.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/parallel_state.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/tokenizer.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/weight_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/weight_loaders.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_3_1/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_3_1/worker.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/arg_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/arg_utils.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/config.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/dtensor_weight_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/dtensor_weight_loaders.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/hf_weight_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/hf_weight_loader.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/llm.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/llm_engine_sp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/llm_engine_sp.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/megatron_weight_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/megatron_weight_loaders.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/model_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/model_loader.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/model_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/model_runner.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/parallel_state.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/parallel_state.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/spmd_gpu_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/spmd_gpu_executor.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/tokenizer.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_4_2/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_4_2/worker.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/arg_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/arg_utils.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/config.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/dtensor_weight_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/dtensor_weight_loaders.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/hf_weight_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/hf_weight_loader.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/llm.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/llm_engine_sp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/llm_engine_sp.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/megatron_weight_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/megatron_weight_loaders.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/model_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/model_loader.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/model_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/model_runner.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/parallel_state.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/parallel_state.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/spmd_gpu_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/spmd_gpu_executor.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/tokenizer.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_5_4/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_5_4/worker.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/arg_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/arg_utils.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/config.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/dtensor_weight_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/dtensor_weight_loaders.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/hf_weight_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/hf_weight_loader.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/llm.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/llm_engine_sp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/llm_engine_sp.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/megatron_weight_loaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/megatron_weight_loaders.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/model_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/model_loader.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/model_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/model_runner.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/parallel_state.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/parallel_state.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/spmd_gpu_executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/spmd_gpu_executor.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/tokenizer.py -------------------------------------------------------------------------------- /ADORA/verl/third_party/vllm/vllm_v_0_6_3/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/third_party/vllm/vllm_v_0_6_3/worker.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/config/evaluation.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/config/evaluation.yaml -------------------------------------------------------------------------------- /ADORA/verl/trainer/config/generation.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/config/generation.yaml -------------------------------------------------------------------------------- /ADORA/verl/trainer/config/ppo_megatron_trainer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/config/ppo_megatron_trainer.yaml -------------------------------------------------------------------------------- /ADORA/verl/trainer/config/ppo_trainer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/config/ppo_trainer.yaml -------------------------------------------------------------------------------- /ADORA/verl/trainer/config/sft_trainer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/config/sft_trainer.yaml -------------------------------------------------------------------------------- /ADORA/verl/trainer/fsdp_sft_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/fsdp_sft_trainer.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/main_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/main_eval.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/main_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/main_generation.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/main_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/main_ppo.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/ppo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/ppo/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/ppo/core_algos.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/ppo/core_algos.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/ppo/ray_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/ppo/ray_trainer.py -------------------------------------------------------------------------------- /ADORA/verl/trainer/runtime_env.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/trainer/runtime_env.yaml -------------------------------------------------------------------------------- /ADORA/verl/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/utils/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/config.py -------------------------------------------------------------------------------- /ADORA/verl/utils/dataset/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/dataset/README.md -------------------------------------------------------------------------------- /ADORA/verl/utils/dataset/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/dataset/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/utils/dataset/rl_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/dataset/rl_dataset.py -------------------------------------------------------------------------------- /ADORA/verl/utils/dataset/rm_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/dataset/rm_dataset.py -------------------------------------------------------------------------------- /ADORA/verl/utils/dataset/sft_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/dataset/sft_dataset.py -------------------------------------------------------------------------------- /ADORA/verl/utils/debug/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/debug/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/utils/debug/performance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/debug/performance.py -------------------------------------------------------------------------------- /ADORA/verl/utils/debug/trajectory_tracker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/debug/trajectory_tracker.py -------------------------------------------------------------------------------- /ADORA/verl/utils/distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/distributed.py -------------------------------------------------------------------------------- /ADORA/verl/utils/flops_counter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/flops_counter.py -------------------------------------------------------------------------------- /ADORA/verl/utils/fs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/fs.py -------------------------------------------------------------------------------- /ADORA/verl/utils/fsdp_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/fsdp_utils.py -------------------------------------------------------------------------------- /ADORA/verl/utils/hdfs_io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/hdfs_io.py -------------------------------------------------------------------------------- /ADORA/verl/utils/import_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/import_utils.py -------------------------------------------------------------------------------- /ADORA/verl/utils/logger/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/logger/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/utils/logger/aggregate_logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/logger/aggregate_logger.py -------------------------------------------------------------------------------- /ADORA/verl/utils/logging_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/logging_utils.py -------------------------------------------------------------------------------- /ADORA/verl/utils/megatron/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/megatron/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/utils/megatron/memory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/megatron/memory.py -------------------------------------------------------------------------------- /ADORA/verl/utils/megatron/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/megatron/optimizer.py -------------------------------------------------------------------------------- /ADORA/verl/utils/megatron/optimizer_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/megatron/optimizer_config.py -------------------------------------------------------------------------------- /ADORA/verl/utils/megatron/pipeline_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/megatron/pipeline_parallel.py -------------------------------------------------------------------------------- /ADORA/verl/utils/megatron/sequence_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/megatron/sequence_parallel.py -------------------------------------------------------------------------------- /ADORA/verl/utils/megatron/tensor_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/megatron/tensor_parallel.py -------------------------------------------------------------------------------- /ADORA/verl/utils/megatron_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/megatron_utils.py -------------------------------------------------------------------------------- /ADORA/verl/utils/memory_buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/memory_buffer.py -------------------------------------------------------------------------------- /ADORA/verl/utils/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/model.py -------------------------------------------------------------------------------- /ADORA/verl/utils/py_functional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/py_functional.py -------------------------------------------------------------------------------- /ADORA/verl/utils/ray_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/ray_utils.py -------------------------------------------------------------------------------- /ADORA/verl/utils/rendezvous/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/rendezvous/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/utils/rendezvous/ray_backend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/rendezvous/ray_backend.py -------------------------------------------------------------------------------- /ADORA/verl/utils/reward_score/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/reward_score/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/utils/reward_score/countdown.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/reward_score/countdown.py -------------------------------------------------------------------------------- /ADORA/verl/utils/reward_score/gsm8k.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/reward_score/gsm8k.py -------------------------------------------------------------------------------- /ADORA/verl/utils/reward_score/kk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/reward_score/kk.py -------------------------------------------------------------------------------- /ADORA/verl/utils/reward_score/math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/reward_score/math.py -------------------------------------------------------------------------------- /ADORA/verl/utils/reward_score/multiply.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/reward_score/multiply.py -------------------------------------------------------------------------------- /ADORA/verl/utils/seqlen_balancing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/seqlen_balancing.py -------------------------------------------------------------------------------- /ADORA/verl/utils/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/tokenizer.py -------------------------------------------------------------------------------- /ADORA/verl/utils/torch_dtypes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/torch_dtypes.py -------------------------------------------------------------------------------- /ADORA/verl/utils/torch_functional.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/torch_functional.py -------------------------------------------------------------------------------- /ADORA/verl/utils/tracking.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/tracking.py -------------------------------------------------------------------------------- /ADORA/verl/utils/ulysses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/utils/ulysses.py -------------------------------------------------------------------------------- /ADORA/verl/version/version: -------------------------------------------------------------------------------- 1 | 0.1 -------------------------------------------------------------------------------- /ADORA/verl/workers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/actor/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/actor/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/actor/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/actor/base.py -------------------------------------------------------------------------------- /ADORA/verl/workers/actor/dp_actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/actor/dp_actor.py -------------------------------------------------------------------------------- /ADORA/verl/workers/actor/megatron_actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/actor/megatron_actor.py -------------------------------------------------------------------------------- /ADORA/verl/workers/critic/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/critic/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/critic/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/critic/base.py -------------------------------------------------------------------------------- /ADORA/verl/workers/critic/dp_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/critic/dp_critic.py -------------------------------------------------------------------------------- /ADORA/verl/workers/critic/megatron_critic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/critic/megatron_critic.py -------------------------------------------------------------------------------- /ADORA/verl/workers/fsdp_workers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/fsdp_workers.py -------------------------------------------------------------------------------- /ADORA/verl/workers/megatron_workers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/megatron_workers.py -------------------------------------------------------------------------------- /ADORA/verl/workers/reward_model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/reward_model/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/reward_model/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/reward_model/base.py -------------------------------------------------------------------------------- /ADORA/verl/workers/reward_model/megatron/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/reward_model/megatron/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/reward_model/megatron/reward_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/reward_model/megatron/reward_model.py -------------------------------------------------------------------------------- /ADORA/verl/workers/rollout/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/rollout/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/rollout/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/rollout/base.py -------------------------------------------------------------------------------- /ADORA/verl/workers/rollout/hf_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/rollout/hf_rollout.py -------------------------------------------------------------------------------- /ADORA/verl/workers/rollout/naive/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/rollout/naive/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/rollout/naive/naive_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/rollout/naive/naive_rollout.py -------------------------------------------------------------------------------- /ADORA/verl/workers/rollout/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/rollout/tokenizer.py -------------------------------------------------------------------------------- /ADORA/verl/workers/rollout/vllm_rollout/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/rollout/vllm_rollout/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/rollout/vllm_rollout/vllm_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/rollout/vllm_rollout/vllm_rollout.py -------------------------------------------------------------------------------- /ADORA/verl/workers/sharding_manager/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/sharding_manager/__init__.py -------------------------------------------------------------------------------- /ADORA/verl/workers/sharding_manager/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/sharding_manager/base.py -------------------------------------------------------------------------------- /ADORA/verl/workers/sharding_manager/fsdp_ulysses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/sharding_manager/fsdp_ulysses.py -------------------------------------------------------------------------------- /ADORA/verl/workers/sharding_manager/fsdp_vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/sharding_manager/fsdp_vllm.py -------------------------------------------------------------------------------- /ADORA/verl/workers/sharding_manager/megatron_vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA/verl/workers/sharding_manager/megatron_vllm.py -------------------------------------------------------------------------------- /ADORA_VL/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/README.md -------------------------------------------------------------------------------- /ADORA_VL/dockerfile/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/dockerfile/Dockerfile -------------------------------------------------------------------------------- /ADORA_VL/dockerfile/docker-entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/dockerfile/docker-entrypoint.sh -------------------------------------------------------------------------------- /ADORA_VL/docs/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/docs/logo.png -------------------------------------------------------------------------------- /ADORA_VL/docs/math_results.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/docs/math_results.xlsx -------------------------------------------------------------------------------- /ADORA_VL/docs/ppo_examples.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/docs/ppo_examples.md -------------------------------------------------------------------------------- /ADORA_VL/docs/ray_architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/docs/ray_architecture.png -------------------------------------------------------------------------------- /ADORA_VL/examples/scripts/docker_run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/examples/scripts/docker_run.sh -------------------------------------------------------------------------------- /ADORA_VL/examples/scripts/nvidia_docker_install.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/examples/scripts/nvidia_docker_install.sh -------------------------------------------------------------------------------- /ADORA_VL/examples/scripts/qwen25vl_7b_geo3k_adora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/examples/scripts/qwen25vl_7b_geo3k_adora.sh -------------------------------------------------------------------------------- /ADORA_VL/examples/scripts/reward_func.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/examples/scripts/reward_func.py -------------------------------------------------------------------------------- /ADORA_VL/examples/scripts/reward_func_format_iou.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/examples/scripts/reward_func_format_iou.py -------------------------------------------------------------------------------- /ADORA_VL/examples/scripts/reward_func_math.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/examples/scripts/reward_func_math.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/cli/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/cli/lora_combiner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/cli/lora_combiner.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/cli/train_ppo_ray_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/cli/train_ppo_ray_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/datasets/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/datasets/__init__.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/datasets/prompts_dataset_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/datasets/prompts_dataset_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/datasets/reward_dataset_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/datasets/reward_dataset_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/datasets/sft_dataset_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/datasets/sft_dataset_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/datasets/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/datasets/utils.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/models/__init__.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/models/actor_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/models/actor_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/models/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/models/loss.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/models/model_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/models/model_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/models/ring_attn_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/models/ring_attn_utils.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/models/utils.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/__init__.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ppo_trainer_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ppo_trainer_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ppo_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ppo_utils/__init__.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ppo_utils/experience_maker_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ppo_utils/experience_maker_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ppo_utils/kl_controller.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ppo_utils/kl_controller.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ppo_utils/replay_buffer_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ppo_utils/replay_buffer_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ray/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ray/__init__.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ray/launcher_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ray/launcher_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ray/ppo_actor_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ray/ppo_actor_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ray/ppo_critic_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ray/ppo_critic_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ray/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ray/utils.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ray/vllm_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ray/vllm_engine.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/trainer/ray/vllm_worker_wrap.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/trainer/ray/vllm_worker_wrap.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/__init__.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/deepspeed/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/deepspeed/__init__.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/deepspeed/deepspeed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/deepspeed/deepspeed.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/deepspeed/deepspeed_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/deepspeed/deepspeed_utils.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/distributed_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/distributed_sampler.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/distributed_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/distributed_util.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/intern_vl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/intern_vl/__init__.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/intern_vl/image_processing_intern_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/intern_vl/image_processing_intern_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/intern_vl/processing_intern_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/intern_vl/processing_intern_vl.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/logging_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/logging_utils.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/processor.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/remote_rm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/remote_rm_utils.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/rl_logging_board/config.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/rl_logging_board/config.toml -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/rl_logging_board/rl_logging_board.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/rl_logging_board/rl_logging_board.py -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/rl_logging_board/start.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/rl_logging_board/start.sh -------------------------------------------------------------------------------- /ADORA_VL/openrlhf/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/openrlhf/utils/utils.py -------------------------------------------------------------------------------- /ADORA_VL/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/pyproject.toml -------------------------------------------------------------------------------- /ADORA_VL/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/requirements.txt -------------------------------------------------------------------------------- /ADORA_VL/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/ADORA_VL/setup.py -------------------------------------------------------------------------------- /ADORA_VL/version.txt: -------------------------------------------------------------------------------- 1 | 0.6.0 2 | -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/README.md -------------------------------------------------------------------------------- /docs/adora.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/docs/adora.png -------------------------------------------------------------------------------- /docs/adora_vl.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ShadeCloak/ADORA/HEAD/docs/adora_vl.png --------------------------------------------------------------------------------