├── .github └── workflows │ ├── conda-ci.yml │ ├── generate_github_workflows.py │ ├── pr-test.yml │ ├── pr-test.yml.j2 │ ├── pre-commit.yml │ └── release-docs.yaml ├── .gitignore ├── .pre-commit-config.yaml ├── LICENSE ├── README.md ├── README_zh.md ├── docker ├── Dockerfile ├── Dockerfile.rocm ├── Dockerfile_20250810_9a48ba0.rocm ├── Dockerfile_20250810_c22f55b.rocm ├── README.md ├── amd_patch │ ├── latest │ │ ├── amd_megatron_fused_kernels_init.patch │ │ ├── megatron.patch │ │ └── sglang.patch │ └── sglv0.5.0rc0 │ │ ├── amd_megatron_fused_kernels_init.patch │ │ ├── megatron.patch │ │ └── sglang.patch ├── justfile ├── patch │ ├── latest │ │ ├── megatron.patch │ │ └── sglang.patch │ ├── v0.5.0rc0-cu126 │ │ ├── megatron.patch │ │ └── sglang.patch │ └── v0.5.5.post1 │ │ ├── megatron.patch │ │ └── sglang.patch └── version.txt ├── docs ├── README.md ├── _static │ ├── css │ │ ├── custom_log.css │ │ └── readthedocs.css │ ├── image │ │ ├── blogs │ │ │ └── release_v0.1.0 │ │ │ │ ├── cuda_vmm.png │ │ │ │ └── overrall.png │ │ ├── logo.ico │ │ └── logo.jpg │ └── js │ │ └── lang-toggle.js ├── build.sh ├── build_all.sh ├── conf.py ├── en │ ├── advanced │ │ ├── arch-support-beyond-megatron.md │ │ ├── fault-tolerance.md │ │ └── speculative-decoding.md │ ├── blogs │ │ ├── introducing_slime.md │ │ └── release_v0.1.0.md │ ├── developer_guide │ │ └── debug.md │ ├── examples │ │ ├── deepseek-r1.md │ │ ├── glm4-9B.md │ │ ├── glm4.5-355B-A32B.md │ │ ├── qwen3-30B-A3B.md │ │ ├── qwen3-4B.md │ │ └── qwen3-4b-base-openhermes.md │ ├── get_started │ │ ├── qa.md │ │ ├── quick_start.md │ │ └── usage.md │ ├── index.rst │ └── platform_support │ │ └── amd_tutorial.md ├── requirements.txt ├── serve.sh └── zh │ ├── advanced │ ├── arch-support-beyond-megatron.md │ ├── fault-torlance.md │ └── speculative-decoding.md │ ├── blogs │ ├── introducing_slime.md │ └── release_v0.1.0.md │ ├── developer_guide │ └── debug.md │ ├── examples │ ├── deepseek-r1.md │ ├── glm4-9B.md │ ├── glm4.5-355B-A32B.md │ ├── qwen3-30B-A3B.md │ ├── qwen3-4B.md │ └── qwen3-4b-base-openhermes.md │ ├── get_started │ ├── qa.md │ ├── quick_start.md │ └── usage.md │ └── index.rst ├── examples ├── __init__.py ├── eval │ ├── README.md │ ├── __init__.py │ ├── eval_delegate.py │ ├── eval_delegate_rollout.py │ ├── nemo_skills │ │ ├── __init__.py │ │ ├── config │ │ │ └── local_cluster.yaml │ │ ├── skills_client.py │ │ ├── skills_config.py │ │ └── skills_server.py │ └── scripts │ │ ├── multi_tasks.yaml │ │ ├── run-qwen3-32B.sh │ │ └── run-qwen3-4B.sh ├── eval_multi_task │ ├── README.md │ ├── multi_task.sh │ ├── multi_task.yaml │ └── requirements_ifbench.txt ├── formal_math │ └── single_round │ │ ├── README.md │ │ ├── kimina_wrapper.py │ │ ├── prepare_data.py │ │ ├── reward_fn.py │ │ ├── run.py │ │ ├── run_minimal.py │ │ └── run_sft.py ├── fully_async │ ├── README.md │ ├── fully_async_rollout.py │ └── run-qwen3-4b-fully_async.sh ├── low_precision │ ├── README.md │ ├── run-qwen3-30b-a3b-fp8-two-nodes.sh │ └── run-qwen3-4b-fp8.sh ├── multi_agent │ ├── README.md │ ├── __init__.py │ ├── agent_system.py │ ├── prompts.py │ ├── rollout_with_multi_agents.py │ └── run-qwen3-30B-A3B-multi-agent.sh ├── on_policy_distillation │ ├── on_policy_distillation.py │ └── run-qwen3-8B-opd.sh ├── reproducibility │ ├── README.md │ └── run-qwen2.5-0.5B-gsm8k.sh ├── retool │ ├── README.md │ ├── generate_with_retool.py │ ├── requirements.txt │ ├── retool_qwen3_4b_rl.sh │ ├── retool_qwen3_4b_sft.sh │ ├── rl_data_preprocess.py │ ├── sft_data_processing.py │ └── tool_sandbox.py ├── search-r1 │ ├── README.md │ ├── README_zh.md │ ├── generate_with_search.py │ ├── google_search_server.py │ ├── local_dense_retriever │ │ ├── download.py │ │ └── retrieval_server.py │ ├── local_search_server.py │ ├── qa_em_format.py │ └── run_qwen2.5_3B.sh ├── strands-agents │ ├── README.md │ ├── generate_with_strands.py │ ├── requirements.txt │ └── strands_qwen3_4b.sh ├── tau-bench │ ├── README.md │ ├── generate_with_tau.py │ ├── openai_tool_adapter.py │ ├── run_qwen3_4B.sh │ ├── sglang_tool_parser.py │ ├── tau1_mock.py │ └── trainable_agents.py ├── train_infer_mismatch_helper │ ├── README.md │ ├── mis.py │ ├── mis.yaml │ └── run-qwen3-4b-mis.sh └── true_on_policy │ ├── README.md │ ├── run_simple.py │ └── src │ ├── aime.png │ ├── raw_reward.png │ ├── rollout_time.png │ ├── step_time.png │ └── train_rollout_abs_diff.png ├── imgs └── arch.png ├── pyproject.toml ├── requirements.txt ├── scripts ├── models │ ├── deepseek-v3-20layer.sh │ ├── deepseek-v3-5layer.sh │ ├── deepseek-v3.sh │ ├── glm4-32B.sh │ ├── glm4-9B.sh │ ├── glm4.5-106B-A12B.sh │ ├── glm4.5-355B-A32B.sh │ ├── kimi-k2-thinking.sh │ ├── kimi-k2.sh │ ├── llama3.1-8B-Instruct.sh │ ├── llama3.2-3B-Instruct-amd.sh │ ├── llama3.2-3B-Instruct.sh │ ├── mimo-7B-rl.sh │ ├── moonlight.sh │ ├── qwen2.5-0.5B.sh │ ├── qwen2.5-1.5B.sh │ ├── qwen2.5-32B.sh │ ├── qwen2.5-3B.sh │ ├── qwen2.5-7B.sh │ ├── qwen3-0.6B.sh │ ├── qwen3-1.7B.sh │ ├── qwen3-14B.sh │ ├── qwen3-235B-A22B.sh │ ├── qwen3-30B-A3B.sh │ ├── qwen3-32B.sh │ ├── qwen3-4B-Instruct-2507.sh │ ├── qwen3-4B.sh │ ├── qwen3-8B.sh │ └── qwen3-next-80B-A3B.sh ├── run-deepseek-r1.sh ├── run-glm4-9B.sh ├── run-glm4.5-355B-A32B.sh ├── run-kimi-k2-Instruct.sh ├── run-kimi-k2-Thinking.sh ├── run-llama3.2-3B-Instruct-amd.sh ├── run-mimo-7B-rl-eagle.sh ├── run-moonlight-16B-A3B.sh ├── run-qwen3-235B-A22B-sft.sh ├── run-qwen3-235B-A22B.sh ├── run-qwen3-30B-A3B.sh ├── run-qwen3-32B.sh ├── run-qwen3-4B-amd.sh ├── run-qwen3-4B-base-sft.sh ├── run-qwen3-4B-fsdp.sh ├── run-qwen3-4B.sh ├── run-qwen3-4B_4xgpu-radixtree.sh ├── run-qwen3-4B_4xgpu.sh ├── run-qwen3-8B-amd.sh ├── run-qwen3-next-80B-A3B.sh ├── run_deepseek.py ├── run_glm45_355b_a32b.py ├── run_mcore_fsdp.py ├── run_qwen3_30b_a3b.py └── run_qwen3_4b.py ├── setup.py ├── slime ├── __init__.py ├── backends │ ├── __init__.py │ ├── fsdp_utils │ │ ├── __init__.py │ │ ├── actor.py │ │ ├── arguments.py │ │ ├── checkpoint.py │ │ ├── data_packing.py │ │ ├── kernels │ │ │ ├── __init__.py │ │ │ └── fused_experts.py │ │ ├── models │ │ │ ├── __init__.py │ │ │ ├── qwen3_moe.py │ │ │ └── qwen3_moe_hf.py │ │ └── update_weight_utils.py │ ├── megatron_utils │ │ ├── __init__.py │ │ ├── actor.py │ │ ├── arguments.py │ │ ├── checkpoint.py │ │ ├── config_mapping │ │ │ ├── __init__.py │ │ │ ├── predefined_config_mappers.py │ │ │ └── registry.py │ │ ├── cp_utils.py │ │ ├── data.py │ │ ├── initialize.py │ │ ├── loss.py │ │ ├── megatron_to_hf │ │ │ ├── __init__.py │ │ │ ├── deepseekv3.py │ │ │ ├── glm4.py │ │ │ ├── glm4moe.py │ │ │ ├── llama.py │ │ │ ├── mimo.py │ │ │ ├── processors │ │ │ │ ├── __init__.py │ │ │ │ ├── padding_remover.py │ │ │ │ └── quantizer.py │ │ │ ├── qwen2.py │ │ │ ├── qwen3_next.py │ │ │ └── qwen3moe.py │ │ ├── misc_utils.py │ │ ├── model.py │ │ ├── model_provider.py │ │ └── update_weight │ │ │ ├── __init__.py │ │ │ ├── common.py │ │ │ ├── hf_weight_iterator_base.py │ │ │ ├── hf_weight_iterator_bridge.py │ │ │ ├── hf_weight_iterator_direct.py │ │ │ ├── update_weight_from_distributed.py │ │ │ └── update_weight_from_tensor.py │ └── sglang_utils │ │ ├── __init__.py │ │ ├── arguments.py │ │ └── sglang_engine.py ├── ray │ ├── __init__.py │ ├── actor_group.py │ ├── placement_group.py │ ├── ray_actor.py │ ├── rollout.py │ ├── train_actor.py │ └── utils.py ├── rollout │ ├── __init__.py │ ├── base_types.py │ ├── data_source.py │ ├── filter_hub │ │ ├── __init__.py │ │ ├── base_types.py │ │ └── dynamic_sampling_filters.py │ ├── generate_hub │ │ ├── __init__.py │ │ └── benchmarkers.py │ ├── rm_hub │ │ ├── __init__.py │ │ ├── deepscaler.py │ │ ├── f1.py │ │ ├── gpqa.py │ │ ├── ifbench.py │ │ ├── math_dapo_utils.py │ │ └── math_utils.py │ ├── sft_rollout.py │ ├── sglang_rollout.py │ └── sleep_rollout.py ├── router │ ├── __init__.py │ ├── middleware_hub │ │ ├── __init__.py │ │ ├── radix_tree.py │ │ └── radix_tree_middleware.py │ └── router.py └── utils │ ├── __init__.py │ ├── arguments.py │ ├── async_utils.py │ ├── context_utils.py │ ├── data.py │ ├── debug_utils │ ├── __init__.py │ ├── display_debug_rollout_data.py │ ├── replay_reward_fn.py │ └── send_to_sglang.py │ ├── distributed_utils.py │ ├── eval_config.py │ ├── external_utils │ ├── __init__.py │ └── command_utils.py │ ├── flops_utils.py │ ├── fp8_kernel.py │ ├── health_monitor.py │ ├── http_utils.py │ ├── iter_utils.py │ ├── logging_utils.py │ ├── mask_utils.py │ ├── megatron_bridge_utils.py │ ├── memory_utils.py │ ├── metric_checker.py │ ├── metric_utils.py │ ├── misc.py │ ├── ppo_utils.py │ ├── profile_utils.py │ ├── ray_utils.py │ ├── reloadable_process_group.py │ ├── routing_replay.py │ ├── seqlen_balancing.py │ ├── tensor_backper.py │ ├── tensorboard_utils.py │ ├── timer.py │ ├── tracking_utils.py │ ├── train_dump_utils.py │ ├── train_metric_utils.py │ ├── typer_utils.py │ ├── types.py │ └── wandb_utils.py ├── slime_plugins ├── __init__.py ├── mbridge │ ├── __init__.py │ ├── glm4.py │ ├── glm4moe.py │ ├── mimo.py │ └── qwen3_next.py ├── megatron_bridge │ └── __init__.py ├── models │ ├── __init__.py │ ├── glm4.py │ ├── hf_attention.py │ └── qwen3_next.py └── rollout_buffer │ ├── README.md │ ├── README_zh.md │ ├── buffer.py │ ├── generator │ ├── __init__.py │ └── base_generator.py │ ├── rollout_buffer_example.py │ └── rollout_buffer_example.sh ├── tests ├── ci │ ├── README.md │ ├── github_runner │ │ ├── .env.example │ │ ├── .gitignore │ │ └── docker-compose.yml │ └── gpu_lock_exec.py ├── test_chunked_gae.py ├── test_external_rollout.py ├── test_fsdp_import.py ├── test_gspo.sh ├── test_moonlight_16B_A3B.py ├── test_quick_start_glm4_9B.py ├── test_qwen2.5_0.5B_gsm8k.py ├── test_qwen2.5_0.5B_gsm8k_async.py ├── test_qwen3_0.6B_fsdp_colocated_2xGPU.py ├── test_qwen3_0.6B_fsdp_distributed.py ├── test_qwen3_0.6B_parallel_check.py ├── test_qwen3_30B_A3B.py ├── test_qwen3_4B_fsdp_true_on_policy.py └── test_qwen3_4B_ppo.py ├── tools ├── convert_hf_to_fp8.py ├── convert_hf_to_torch_dist.py ├── convert_k2_thinking_int4_to_bf16.py ├── convert_to_hf.py ├── convert_torch_dist_to_hf.py └── fp8_cast_bf16.py ├── train.py └── train_async.py /.github/workflows/conda-ci.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/.github/workflows/conda-ci.yml -------------------------------------------------------------------------------- /.github/workflows/generate_github_workflows.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/.github/workflows/generate_github_workflows.py -------------------------------------------------------------------------------- /.github/workflows/pr-test.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/.github/workflows/pr-test.yml -------------------------------------------------------------------------------- /.github/workflows/pr-test.yml.j2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/.github/workflows/pr-test.yml.j2 -------------------------------------------------------------------------------- /.github/workflows/pre-commit.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/.github/workflows/pre-commit.yml -------------------------------------------------------------------------------- /.github/workflows/release-docs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/.github/workflows/release-docs.yaml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/.gitignore -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/README.md -------------------------------------------------------------------------------- /README_zh.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/README_zh.md -------------------------------------------------------------------------------- /docker/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/Dockerfile -------------------------------------------------------------------------------- /docker/Dockerfile.rocm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/Dockerfile.rocm -------------------------------------------------------------------------------- /docker/Dockerfile_20250810_9a48ba0.rocm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/Dockerfile_20250810_9a48ba0.rocm -------------------------------------------------------------------------------- /docker/Dockerfile_20250810_c22f55b.rocm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/Dockerfile_20250810_c22f55b.rocm -------------------------------------------------------------------------------- /docker/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/README.md -------------------------------------------------------------------------------- /docker/amd_patch/latest/amd_megatron_fused_kernels_init.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/amd_patch/latest/amd_megatron_fused_kernels_init.patch -------------------------------------------------------------------------------- /docker/amd_patch/latest/megatron.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/amd_patch/latest/megatron.patch -------------------------------------------------------------------------------- /docker/amd_patch/latest/sglang.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/amd_patch/latest/sglang.patch -------------------------------------------------------------------------------- /docker/amd_patch/sglv0.5.0rc0/amd_megatron_fused_kernels_init.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/amd_patch/sglv0.5.0rc0/amd_megatron_fused_kernels_init.patch -------------------------------------------------------------------------------- /docker/amd_patch/sglv0.5.0rc0/megatron.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/amd_patch/sglv0.5.0rc0/megatron.patch -------------------------------------------------------------------------------- /docker/amd_patch/sglv0.5.0rc0/sglang.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/amd_patch/sglv0.5.0rc0/sglang.patch -------------------------------------------------------------------------------- /docker/justfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/justfile -------------------------------------------------------------------------------- /docker/patch/latest/megatron.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/patch/latest/megatron.patch -------------------------------------------------------------------------------- /docker/patch/latest/sglang.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/patch/latest/sglang.patch -------------------------------------------------------------------------------- /docker/patch/v0.5.0rc0-cu126/megatron.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/patch/v0.5.0rc0-cu126/megatron.patch -------------------------------------------------------------------------------- /docker/patch/v0.5.0rc0-cu126/sglang.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/patch/v0.5.0rc0-cu126/sglang.patch -------------------------------------------------------------------------------- /docker/patch/v0.5.5.post1/megatron.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/patch/v0.5.5.post1/megatron.patch -------------------------------------------------------------------------------- /docker/patch/v0.5.5.post1/sglang.patch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docker/patch/v0.5.5.post1/sglang.patch -------------------------------------------------------------------------------- /docker/version.txt: -------------------------------------------------------------------------------- 1 | nightly-dev-202511127a -------------------------------------------------------------------------------- /docs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/README.md -------------------------------------------------------------------------------- /docs/_static/css/custom_log.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/_static/css/custom_log.css -------------------------------------------------------------------------------- /docs/_static/css/readthedocs.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/_static/css/readthedocs.css -------------------------------------------------------------------------------- /docs/_static/image/blogs/release_v0.1.0/cuda_vmm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/_static/image/blogs/release_v0.1.0/cuda_vmm.png -------------------------------------------------------------------------------- /docs/_static/image/blogs/release_v0.1.0/overrall.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/_static/image/blogs/release_v0.1.0/overrall.png -------------------------------------------------------------------------------- /docs/_static/image/logo.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/_static/image/logo.ico -------------------------------------------------------------------------------- /docs/_static/image/logo.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/_static/image/logo.jpg -------------------------------------------------------------------------------- /docs/_static/js/lang-toggle.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/_static/js/lang-toggle.js -------------------------------------------------------------------------------- /docs/build.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/build.sh -------------------------------------------------------------------------------- /docs/build_all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/build_all.sh -------------------------------------------------------------------------------- /docs/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/conf.py -------------------------------------------------------------------------------- /docs/en/advanced/arch-support-beyond-megatron.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/advanced/arch-support-beyond-megatron.md -------------------------------------------------------------------------------- /docs/en/advanced/fault-tolerance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/advanced/fault-tolerance.md -------------------------------------------------------------------------------- /docs/en/advanced/speculative-decoding.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/advanced/speculative-decoding.md -------------------------------------------------------------------------------- /docs/en/blogs/introducing_slime.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/blogs/introducing_slime.md -------------------------------------------------------------------------------- /docs/en/blogs/release_v0.1.0.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/blogs/release_v0.1.0.md -------------------------------------------------------------------------------- /docs/en/developer_guide/debug.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/developer_guide/debug.md -------------------------------------------------------------------------------- /docs/en/examples/deepseek-r1.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/examples/deepseek-r1.md -------------------------------------------------------------------------------- /docs/en/examples/glm4-9B.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/examples/glm4-9B.md -------------------------------------------------------------------------------- /docs/en/examples/glm4.5-355B-A32B.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/examples/glm4.5-355B-A32B.md -------------------------------------------------------------------------------- /docs/en/examples/qwen3-30B-A3B.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/examples/qwen3-30B-A3B.md -------------------------------------------------------------------------------- /docs/en/examples/qwen3-4B.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/examples/qwen3-4B.md -------------------------------------------------------------------------------- /docs/en/examples/qwen3-4b-base-openhermes.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/examples/qwen3-4b-base-openhermes.md -------------------------------------------------------------------------------- /docs/en/get_started/qa.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/get_started/qa.md -------------------------------------------------------------------------------- /docs/en/get_started/quick_start.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/get_started/quick_start.md -------------------------------------------------------------------------------- /docs/en/get_started/usage.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/get_started/usage.md -------------------------------------------------------------------------------- /docs/en/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/index.rst -------------------------------------------------------------------------------- /docs/en/platform_support/amd_tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/en/platform_support/amd_tutorial.md -------------------------------------------------------------------------------- /docs/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/requirements.txt -------------------------------------------------------------------------------- /docs/serve.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/serve.sh -------------------------------------------------------------------------------- /docs/zh/advanced/arch-support-beyond-megatron.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/advanced/arch-support-beyond-megatron.md -------------------------------------------------------------------------------- /docs/zh/advanced/fault-torlance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/advanced/fault-torlance.md -------------------------------------------------------------------------------- /docs/zh/advanced/speculative-decoding.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/advanced/speculative-decoding.md -------------------------------------------------------------------------------- /docs/zh/blogs/introducing_slime.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/blogs/introducing_slime.md -------------------------------------------------------------------------------- /docs/zh/blogs/release_v0.1.0.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/blogs/release_v0.1.0.md -------------------------------------------------------------------------------- /docs/zh/developer_guide/debug.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/developer_guide/debug.md -------------------------------------------------------------------------------- /docs/zh/examples/deepseek-r1.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/examples/deepseek-r1.md -------------------------------------------------------------------------------- /docs/zh/examples/glm4-9B.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/examples/glm4-9B.md -------------------------------------------------------------------------------- /docs/zh/examples/glm4.5-355B-A32B.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/examples/glm4.5-355B-A32B.md -------------------------------------------------------------------------------- /docs/zh/examples/qwen3-30B-A3B.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/examples/qwen3-30B-A3B.md -------------------------------------------------------------------------------- /docs/zh/examples/qwen3-4B.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/examples/qwen3-4B.md -------------------------------------------------------------------------------- /docs/zh/examples/qwen3-4b-base-openhermes.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/examples/qwen3-4b-base-openhermes.md -------------------------------------------------------------------------------- /docs/zh/get_started/qa.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/get_started/qa.md -------------------------------------------------------------------------------- /docs/zh/get_started/quick_start.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/get_started/quick_start.md -------------------------------------------------------------------------------- /docs/zh/get_started/usage.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/get_started/usage.md -------------------------------------------------------------------------------- /docs/zh/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/docs/zh/index.rst -------------------------------------------------------------------------------- /examples/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /examples/eval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/README.md -------------------------------------------------------------------------------- /examples/eval/__init__.py: -------------------------------------------------------------------------------- 1 | """Evaluation helpers and example configs.""" 2 | -------------------------------------------------------------------------------- /examples/eval/eval_delegate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/eval_delegate.py -------------------------------------------------------------------------------- /examples/eval/eval_delegate_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/eval_delegate_rollout.py -------------------------------------------------------------------------------- /examples/eval/nemo_skills/__init__.py: -------------------------------------------------------------------------------- 1 | """NeMo Skills evaluation helpers.""" 2 | -------------------------------------------------------------------------------- /examples/eval/nemo_skills/config/local_cluster.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/nemo_skills/config/local_cluster.yaml -------------------------------------------------------------------------------- /examples/eval/nemo_skills/skills_client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/nemo_skills/skills_client.py -------------------------------------------------------------------------------- /examples/eval/nemo_skills/skills_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/nemo_skills/skills_config.py -------------------------------------------------------------------------------- /examples/eval/nemo_skills/skills_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/nemo_skills/skills_server.py -------------------------------------------------------------------------------- /examples/eval/scripts/multi_tasks.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/scripts/multi_tasks.yaml -------------------------------------------------------------------------------- /examples/eval/scripts/run-qwen3-32B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/scripts/run-qwen3-32B.sh -------------------------------------------------------------------------------- /examples/eval/scripts/run-qwen3-4B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval/scripts/run-qwen3-4B.sh -------------------------------------------------------------------------------- /examples/eval_multi_task/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval_multi_task/README.md -------------------------------------------------------------------------------- /examples/eval_multi_task/multi_task.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval_multi_task/multi_task.sh -------------------------------------------------------------------------------- /examples/eval_multi_task/multi_task.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval_multi_task/multi_task.yaml -------------------------------------------------------------------------------- /examples/eval_multi_task/requirements_ifbench.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/eval_multi_task/requirements_ifbench.txt -------------------------------------------------------------------------------- /examples/formal_math/single_round/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/formal_math/single_round/README.md -------------------------------------------------------------------------------- /examples/formal_math/single_round/kimina_wrapper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/formal_math/single_round/kimina_wrapper.py -------------------------------------------------------------------------------- /examples/formal_math/single_round/prepare_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/formal_math/single_round/prepare_data.py -------------------------------------------------------------------------------- /examples/formal_math/single_round/reward_fn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/formal_math/single_round/reward_fn.py -------------------------------------------------------------------------------- /examples/formal_math/single_round/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/formal_math/single_round/run.py -------------------------------------------------------------------------------- /examples/formal_math/single_round/run_minimal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/formal_math/single_round/run_minimal.py -------------------------------------------------------------------------------- /examples/formal_math/single_round/run_sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/formal_math/single_round/run_sft.py -------------------------------------------------------------------------------- /examples/fully_async/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/fully_async/README.md -------------------------------------------------------------------------------- /examples/fully_async/fully_async_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/fully_async/fully_async_rollout.py -------------------------------------------------------------------------------- /examples/fully_async/run-qwen3-4b-fully_async.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/fully_async/run-qwen3-4b-fully_async.sh -------------------------------------------------------------------------------- /examples/low_precision/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/low_precision/README.md -------------------------------------------------------------------------------- /examples/low_precision/run-qwen3-30b-a3b-fp8-two-nodes.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/low_precision/run-qwen3-30b-a3b-fp8-two-nodes.sh -------------------------------------------------------------------------------- /examples/low_precision/run-qwen3-4b-fp8.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/low_precision/run-qwen3-4b-fp8.sh -------------------------------------------------------------------------------- /examples/multi_agent/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/multi_agent/README.md -------------------------------------------------------------------------------- /examples/multi_agent/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /examples/multi_agent/agent_system.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/multi_agent/agent_system.py -------------------------------------------------------------------------------- /examples/multi_agent/prompts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/multi_agent/prompts.py -------------------------------------------------------------------------------- /examples/multi_agent/rollout_with_multi_agents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/multi_agent/rollout_with_multi_agents.py -------------------------------------------------------------------------------- /examples/multi_agent/run-qwen3-30B-A3B-multi-agent.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/multi_agent/run-qwen3-30B-A3B-multi-agent.sh -------------------------------------------------------------------------------- /examples/on_policy_distillation/on_policy_distillation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/on_policy_distillation/on_policy_distillation.py -------------------------------------------------------------------------------- /examples/on_policy_distillation/run-qwen3-8B-opd.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/on_policy_distillation/run-qwen3-8B-opd.sh -------------------------------------------------------------------------------- /examples/reproducibility/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/reproducibility/README.md -------------------------------------------------------------------------------- /examples/reproducibility/run-qwen2.5-0.5B-gsm8k.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/reproducibility/run-qwen2.5-0.5B-gsm8k.sh -------------------------------------------------------------------------------- /examples/retool/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/retool/README.md -------------------------------------------------------------------------------- /examples/retool/generate_with_retool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/retool/generate_with_retool.py -------------------------------------------------------------------------------- /examples/retool/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/retool/requirements.txt -------------------------------------------------------------------------------- /examples/retool/retool_qwen3_4b_rl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/retool/retool_qwen3_4b_rl.sh -------------------------------------------------------------------------------- /examples/retool/retool_qwen3_4b_sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/retool/retool_qwen3_4b_sft.sh -------------------------------------------------------------------------------- /examples/retool/rl_data_preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/retool/rl_data_preprocess.py -------------------------------------------------------------------------------- /examples/retool/sft_data_processing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/retool/sft_data_processing.py -------------------------------------------------------------------------------- /examples/retool/tool_sandbox.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/retool/tool_sandbox.py -------------------------------------------------------------------------------- /examples/search-r1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/README.md -------------------------------------------------------------------------------- /examples/search-r1/README_zh.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/README_zh.md -------------------------------------------------------------------------------- /examples/search-r1/generate_with_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/generate_with_search.py -------------------------------------------------------------------------------- /examples/search-r1/google_search_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/google_search_server.py -------------------------------------------------------------------------------- /examples/search-r1/local_dense_retriever/download.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/local_dense_retriever/download.py -------------------------------------------------------------------------------- /examples/search-r1/local_dense_retriever/retrieval_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/local_dense_retriever/retrieval_server.py -------------------------------------------------------------------------------- /examples/search-r1/local_search_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/local_search_server.py -------------------------------------------------------------------------------- /examples/search-r1/qa_em_format.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/qa_em_format.py -------------------------------------------------------------------------------- /examples/search-r1/run_qwen2.5_3B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/search-r1/run_qwen2.5_3B.sh -------------------------------------------------------------------------------- /examples/strands-agents/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/strands-agents/README.md -------------------------------------------------------------------------------- /examples/strands-agents/generate_with_strands.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/strands-agents/generate_with_strands.py -------------------------------------------------------------------------------- /examples/strands-agents/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/strands-agents/requirements.txt -------------------------------------------------------------------------------- /examples/strands-agents/strands_qwen3_4b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/strands-agents/strands_qwen3_4b.sh -------------------------------------------------------------------------------- /examples/tau-bench/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/tau-bench/README.md -------------------------------------------------------------------------------- /examples/tau-bench/generate_with_tau.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/tau-bench/generate_with_tau.py -------------------------------------------------------------------------------- /examples/tau-bench/openai_tool_adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/tau-bench/openai_tool_adapter.py -------------------------------------------------------------------------------- /examples/tau-bench/run_qwen3_4B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/tau-bench/run_qwen3_4B.sh -------------------------------------------------------------------------------- /examples/tau-bench/sglang_tool_parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/tau-bench/sglang_tool_parser.py -------------------------------------------------------------------------------- /examples/tau-bench/tau1_mock.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/tau-bench/tau1_mock.py -------------------------------------------------------------------------------- /examples/tau-bench/trainable_agents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/tau-bench/trainable_agents.py -------------------------------------------------------------------------------- /examples/train_infer_mismatch_helper/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/train_infer_mismatch_helper/README.md -------------------------------------------------------------------------------- /examples/train_infer_mismatch_helper/mis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/train_infer_mismatch_helper/mis.py -------------------------------------------------------------------------------- /examples/train_infer_mismatch_helper/mis.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/train_infer_mismatch_helper/mis.yaml -------------------------------------------------------------------------------- /examples/train_infer_mismatch_helper/run-qwen3-4b-mis.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/train_infer_mismatch_helper/run-qwen3-4b-mis.sh -------------------------------------------------------------------------------- /examples/true_on_policy/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/true_on_policy/README.md -------------------------------------------------------------------------------- /examples/true_on_policy/run_simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/true_on_policy/run_simple.py -------------------------------------------------------------------------------- /examples/true_on_policy/src/aime.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/true_on_policy/src/aime.png -------------------------------------------------------------------------------- /examples/true_on_policy/src/raw_reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/true_on_policy/src/raw_reward.png -------------------------------------------------------------------------------- /examples/true_on_policy/src/rollout_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/true_on_policy/src/rollout_time.png -------------------------------------------------------------------------------- /examples/true_on_policy/src/step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/true_on_policy/src/step_time.png -------------------------------------------------------------------------------- /examples/true_on_policy/src/train_rollout_abs_diff.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/examples/true_on_policy/src/train_rollout_abs_diff.png -------------------------------------------------------------------------------- /imgs/arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/imgs/arch.png -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/pyproject.toml -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/models/deepseek-v3-20layer.sh: -------------------------------------------------------------------------------- 1 | MODEL_ARGS_NUM_LAYERS=20 source "$(dirname -- "${BASH_SOURCE[0]}")/deepseek-v3.sh" 2 | -------------------------------------------------------------------------------- /scripts/models/deepseek-v3-5layer.sh: -------------------------------------------------------------------------------- 1 | MODEL_ARGS_NUM_LAYERS=5 source "$(dirname -- "${BASH_SOURCE[0]}")/deepseek-v3.sh" 2 | -------------------------------------------------------------------------------- /scripts/models/deepseek-v3.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/deepseek-v3.sh -------------------------------------------------------------------------------- /scripts/models/glm4-32B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/glm4-32B.sh -------------------------------------------------------------------------------- /scripts/models/glm4-9B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/glm4-9B.sh -------------------------------------------------------------------------------- /scripts/models/glm4.5-106B-A12B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/glm4.5-106B-A12B.sh -------------------------------------------------------------------------------- /scripts/models/glm4.5-355B-A32B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/glm4.5-355B-A32B.sh -------------------------------------------------------------------------------- /scripts/models/kimi-k2-thinking.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/kimi-k2-thinking.sh -------------------------------------------------------------------------------- /scripts/models/kimi-k2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/kimi-k2.sh -------------------------------------------------------------------------------- /scripts/models/llama3.1-8B-Instruct.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/llama3.1-8B-Instruct.sh -------------------------------------------------------------------------------- /scripts/models/llama3.2-3B-Instruct-amd.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/llama3.2-3B-Instruct-amd.sh -------------------------------------------------------------------------------- /scripts/models/llama3.2-3B-Instruct.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/llama3.2-3B-Instruct.sh -------------------------------------------------------------------------------- /scripts/models/mimo-7B-rl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/mimo-7B-rl.sh -------------------------------------------------------------------------------- /scripts/models/moonlight.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/moonlight.sh -------------------------------------------------------------------------------- /scripts/models/qwen2.5-0.5B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen2.5-0.5B.sh -------------------------------------------------------------------------------- /scripts/models/qwen2.5-1.5B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen2.5-1.5B.sh -------------------------------------------------------------------------------- /scripts/models/qwen2.5-32B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen2.5-32B.sh -------------------------------------------------------------------------------- /scripts/models/qwen2.5-3B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen2.5-3B.sh -------------------------------------------------------------------------------- /scripts/models/qwen2.5-7B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen2.5-7B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-0.6B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-0.6B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-1.7B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-1.7B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-14B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-14B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-235B-A22B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-235B-A22B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-30B-A3B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-30B-A3B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-32B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-32B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-4B-Instruct-2507.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-4B-Instruct-2507.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-4B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-4B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-8B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-8B.sh -------------------------------------------------------------------------------- /scripts/models/qwen3-next-80B-A3B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/models/qwen3-next-80B-A3B.sh -------------------------------------------------------------------------------- /scripts/run-deepseek-r1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-deepseek-r1.sh -------------------------------------------------------------------------------- /scripts/run-glm4-9B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-glm4-9B.sh -------------------------------------------------------------------------------- /scripts/run-glm4.5-355B-A32B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-glm4.5-355B-A32B.sh -------------------------------------------------------------------------------- /scripts/run-kimi-k2-Instruct.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-kimi-k2-Instruct.sh -------------------------------------------------------------------------------- /scripts/run-kimi-k2-Thinking.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-kimi-k2-Thinking.sh -------------------------------------------------------------------------------- /scripts/run-llama3.2-3B-Instruct-amd.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-llama3.2-3B-Instruct-amd.sh -------------------------------------------------------------------------------- /scripts/run-mimo-7B-rl-eagle.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-mimo-7B-rl-eagle.sh -------------------------------------------------------------------------------- /scripts/run-moonlight-16B-A3B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-moonlight-16B-A3B.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-235B-A22B-sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-235B-A22B-sft.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-235B-A22B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-235B-A22B.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-30B-A3B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-30B-A3B.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-32B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-32B.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-4B-amd.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-4B-amd.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-4B-base-sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-4B-base-sft.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-4B-fsdp.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-4B-fsdp.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-4B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-4B.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-4B_4xgpu-radixtree.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-4B_4xgpu-radixtree.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-4B_4xgpu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-4B_4xgpu.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-8B-amd.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-8B-amd.sh -------------------------------------------------------------------------------- /scripts/run-qwen3-next-80B-A3B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run-qwen3-next-80B-A3B.sh -------------------------------------------------------------------------------- /scripts/run_deepseek.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run_deepseek.py -------------------------------------------------------------------------------- /scripts/run_glm45_355b_a32b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run_glm45_355b_a32b.py -------------------------------------------------------------------------------- /scripts/run_mcore_fsdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run_mcore_fsdp.py -------------------------------------------------------------------------------- /scripts/run_qwen3_30b_a3b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run_qwen3_30b_a3b.py -------------------------------------------------------------------------------- /scripts/run_qwen3_4b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/scripts/run_qwen3_4b.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/setup.py -------------------------------------------------------------------------------- /slime/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/backends/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/__init__.py -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/actor.py -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/arguments.py -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/checkpoint.py -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/data_packing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/data_packing.py -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/kernels/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/kernels/fused_experts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/kernels/fused_experts.py -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/models/qwen3_moe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/models/qwen3_moe.py -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/models/qwen3_moe_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/models/qwen3_moe_hf.py -------------------------------------------------------------------------------- /slime/backends/fsdp_utils/update_weight_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/fsdp_utils/update_weight_utils.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/__init__.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/actor.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/arguments.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/checkpoint.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/config_mapping/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/config_mapping/__init__.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/config_mapping/predefined_config_mappers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/config_mapping/predefined_config_mappers.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/config_mapping/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/config_mapping/registry.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/cp_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/cp_utils.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/data.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/initialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/initialize.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/loss.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/__init__.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/deepseekv3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/deepseekv3.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/glm4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/glm4.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/glm4moe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/glm4moe.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/llama.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/mimo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/mimo.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/processors/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/processors/padding_remover.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/processors/padding_remover.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/processors/quantizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/processors/quantizer.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/qwen2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/qwen2.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/qwen3_next.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/qwen3_next.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/megatron_to_hf/qwen3moe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/megatron_to_hf/qwen3moe.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/misc_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/misc_utils.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/model.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/model_provider.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/model_provider.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/update_weight/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/backends/megatron_utils/update_weight/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/update_weight/common.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/update_weight/hf_weight_iterator_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/update_weight/hf_weight_iterator_base.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/update_weight/hf_weight_iterator_bridge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/update_weight/hf_weight_iterator_bridge.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/update_weight/hf_weight_iterator_direct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/update_weight/hf_weight_iterator_direct.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/update_weight/update_weight_from_distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/update_weight/update_weight_from_distributed.py -------------------------------------------------------------------------------- /slime/backends/megatron_utils/update_weight/update_weight_from_tensor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/megatron_utils/update_weight/update_weight_from_tensor.py -------------------------------------------------------------------------------- /slime/backends/sglang_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/backends/sglang_utils/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/sglang_utils/arguments.py -------------------------------------------------------------------------------- /slime/backends/sglang_utils/sglang_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/backends/sglang_utils/sglang_engine.py -------------------------------------------------------------------------------- /slime/ray/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/ray/actor_group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/ray/actor_group.py -------------------------------------------------------------------------------- /slime/ray/placement_group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/ray/placement_group.py -------------------------------------------------------------------------------- /slime/ray/ray_actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/ray/ray_actor.py -------------------------------------------------------------------------------- /slime/ray/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/ray/rollout.py -------------------------------------------------------------------------------- /slime/ray/train_actor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/ray/train_actor.py -------------------------------------------------------------------------------- /slime/ray/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/ray/utils.py -------------------------------------------------------------------------------- /slime/rollout/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/rollout/base_types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/base_types.py -------------------------------------------------------------------------------- /slime/rollout/data_source.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/data_source.py -------------------------------------------------------------------------------- /slime/rollout/filter_hub/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/rollout/filter_hub/base_types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/filter_hub/base_types.py -------------------------------------------------------------------------------- /slime/rollout/filter_hub/dynamic_sampling_filters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/filter_hub/dynamic_sampling_filters.py -------------------------------------------------------------------------------- /slime/rollout/generate_hub/__init__.py: -------------------------------------------------------------------------------- 1 | # TODO: maybe move `sglang_rollout::generate` to this folder 2 | -------------------------------------------------------------------------------- /slime/rollout/generate_hub/benchmarkers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/generate_hub/benchmarkers.py -------------------------------------------------------------------------------- /slime/rollout/rm_hub/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/rm_hub/__init__.py -------------------------------------------------------------------------------- /slime/rollout/rm_hub/deepscaler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/rm_hub/deepscaler.py -------------------------------------------------------------------------------- /slime/rollout/rm_hub/f1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/rm_hub/f1.py -------------------------------------------------------------------------------- /slime/rollout/rm_hub/gpqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/rm_hub/gpqa.py -------------------------------------------------------------------------------- /slime/rollout/rm_hub/ifbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/rm_hub/ifbench.py -------------------------------------------------------------------------------- /slime/rollout/rm_hub/math_dapo_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/rm_hub/math_dapo_utils.py -------------------------------------------------------------------------------- /slime/rollout/rm_hub/math_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/rm_hub/math_utils.py -------------------------------------------------------------------------------- /slime/rollout/sft_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/sft_rollout.py -------------------------------------------------------------------------------- /slime/rollout/sglang_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/sglang_rollout.py -------------------------------------------------------------------------------- /slime/rollout/sleep_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/rollout/sleep_rollout.py -------------------------------------------------------------------------------- /slime/router/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/router/middleware_hub/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/router/middleware_hub/radix_tree.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/router/middleware_hub/radix_tree.py -------------------------------------------------------------------------------- /slime/router/middleware_hub/radix_tree_middleware.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/router/middleware_hub/radix_tree_middleware.py -------------------------------------------------------------------------------- /slime/router/router.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/router/router.py -------------------------------------------------------------------------------- /slime/utils/__init__.py: -------------------------------------------------------------------------------- 1 | """Utility package root for Slime.""" 2 | -------------------------------------------------------------------------------- /slime/utils/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/arguments.py -------------------------------------------------------------------------------- /slime/utils/async_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/async_utils.py -------------------------------------------------------------------------------- /slime/utils/context_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/context_utils.py -------------------------------------------------------------------------------- /slime/utils/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/data.py -------------------------------------------------------------------------------- /slime/utils/debug_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/utils/debug_utils/display_debug_rollout_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/debug_utils/display_debug_rollout_data.py -------------------------------------------------------------------------------- /slime/utils/debug_utils/replay_reward_fn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/debug_utils/replay_reward_fn.py -------------------------------------------------------------------------------- /slime/utils/debug_utils/send_to_sglang.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/debug_utils/send_to_sglang.py -------------------------------------------------------------------------------- /slime/utils/distributed_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/distributed_utils.py -------------------------------------------------------------------------------- /slime/utils/eval_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/eval_config.py -------------------------------------------------------------------------------- /slime/utils/external_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime/utils/external_utils/command_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/external_utils/command_utils.py -------------------------------------------------------------------------------- /slime/utils/flops_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/flops_utils.py -------------------------------------------------------------------------------- /slime/utils/fp8_kernel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/fp8_kernel.py -------------------------------------------------------------------------------- /slime/utils/health_monitor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/health_monitor.py -------------------------------------------------------------------------------- /slime/utils/http_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/http_utils.py -------------------------------------------------------------------------------- /slime/utils/iter_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/iter_utils.py -------------------------------------------------------------------------------- /slime/utils/logging_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/logging_utils.py -------------------------------------------------------------------------------- /slime/utils/mask_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/mask_utils.py -------------------------------------------------------------------------------- /slime/utils/megatron_bridge_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/megatron_bridge_utils.py -------------------------------------------------------------------------------- /slime/utils/memory_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/memory_utils.py -------------------------------------------------------------------------------- /slime/utils/metric_checker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/metric_checker.py -------------------------------------------------------------------------------- /slime/utils/metric_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/metric_utils.py -------------------------------------------------------------------------------- /slime/utils/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/misc.py -------------------------------------------------------------------------------- /slime/utils/ppo_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/ppo_utils.py -------------------------------------------------------------------------------- /slime/utils/profile_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/profile_utils.py -------------------------------------------------------------------------------- /slime/utils/ray_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/ray_utils.py -------------------------------------------------------------------------------- /slime/utils/reloadable_process_group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/reloadable_process_group.py -------------------------------------------------------------------------------- /slime/utils/routing_replay.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/routing_replay.py -------------------------------------------------------------------------------- /slime/utils/seqlen_balancing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/seqlen_balancing.py -------------------------------------------------------------------------------- /slime/utils/tensor_backper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/tensor_backper.py -------------------------------------------------------------------------------- /slime/utils/tensorboard_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/tensorboard_utils.py -------------------------------------------------------------------------------- /slime/utils/timer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/timer.py -------------------------------------------------------------------------------- /slime/utils/tracking_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/tracking_utils.py -------------------------------------------------------------------------------- /slime/utils/train_dump_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/train_dump_utils.py -------------------------------------------------------------------------------- /slime/utils/train_metric_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/train_metric_utils.py -------------------------------------------------------------------------------- /slime/utils/typer_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/typer_utils.py -------------------------------------------------------------------------------- /slime/utils/types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/types.py -------------------------------------------------------------------------------- /slime/utils/wandb_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime/utils/wandb_utils.py -------------------------------------------------------------------------------- /slime_plugins/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime_plugins/mbridge/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/mbridge/__init__.py -------------------------------------------------------------------------------- /slime_plugins/mbridge/glm4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/mbridge/glm4.py -------------------------------------------------------------------------------- /slime_plugins/mbridge/glm4moe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/mbridge/glm4moe.py -------------------------------------------------------------------------------- /slime_plugins/mbridge/mimo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/mbridge/mimo.py -------------------------------------------------------------------------------- /slime_plugins/mbridge/qwen3_next.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/mbridge/qwen3_next.py -------------------------------------------------------------------------------- /slime_plugins/megatron_bridge/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime_plugins/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /slime_plugins/models/glm4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/models/glm4.py -------------------------------------------------------------------------------- /slime_plugins/models/hf_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/models/hf_attention.py -------------------------------------------------------------------------------- /slime_plugins/models/qwen3_next.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/models/qwen3_next.py -------------------------------------------------------------------------------- /slime_plugins/rollout_buffer/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/rollout_buffer/README.md -------------------------------------------------------------------------------- /slime_plugins/rollout_buffer/README_zh.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/rollout_buffer/README_zh.md -------------------------------------------------------------------------------- /slime_plugins/rollout_buffer/buffer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/rollout_buffer/buffer.py -------------------------------------------------------------------------------- /slime_plugins/rollout_buffer/generator/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/rollout_buffer/generator/__init__.py -------------------------------------------------------------------------------- /slime_plugins/rollout_buffer/generator/base_generator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/rollout_buffer/generator/base_generator.py -------------------------------------------------------------------------------- /slime_plugins/rollout_buffer/rollout_buffer_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/rollout_buffer/rollout_buffer_example.py -------------------------------------------------------------------------------- /slime_plugins/rollout_buffer/rollout_buffer_example.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/slime_plugins/rollout_buffer/rollout_buffer_example.sh -------------------------------------------------------------------------------- /tests/ci/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/ci/README.md -------------------------------------------------------------------------------- /tests/ci/github_runner/.env.example: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/ci/github_runner/.env.example -------------------------------------------------------------------------------- /tests/ci/github_runner/.gitignore: -------------------------------------------------------------------------------- 1 | .env -------------------------------------------------------------------------------- /tests/ci/github_runner/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/ci/github_runner/docker-compose.yml -------------------------------------------------------------------------------- /tests/ci/gpu_lock_exec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/ci/gpu_lock_exec.py -------------------------------------------------------------------------------- /tests/test_chunked_gae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_chunked_gae.py -------------------------------------------------------------------------------- /tests/test_external_rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_external_rollout.py -------------------------------------------------------------------------------- /tests/test_fsdp_import.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_fsdp_import.py -------------------------------------------------------------------------------- /tests/test_gspo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_gspo.sh -------------------------------------------------------------------------------- /tests/test_moonlight_16B_A3B.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_moonlight_16B_A3B.py -------------------------------------------------------------------------------- /tests/test_quick_start_glm4_9B.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_quick_start_glm4_9B.py -------------------------------------------------------------------------------- /tests/test_qwen2.5_0.5B_gsm8k.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_qwen2.5_0.5B_gsm8k.py -------------------------------------------------------------------------------- /tests/test_qwen2.5_0.5B_gsm8k_async.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_qwen2.5_0.5B_gsm8k_async.py -------------------------------------------------------------------------------- /tests/test_qwen3_0.6B_fsdp_colocated_2xGPU.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_qwen3_0.6B_fsdp_colocated_2xGPU.py -------------------------------------------------------------------------------- /tests/test_qwen3_0.6B_fsdp_distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_qwen3_0.6B_fsdp_distributed.py -------------------------------------------------------------------------------- /tests/test_qwen3_0.6B_parallel_check.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_qwen3_0.6B_parallel_check.py -------------------------------------------------------------------------------- /tests/test_qwen3_30B_A3B.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_qwen3_30B_A3B.py -------------------------------------------------------------------------------- /tests/test_qwen3_4B_fsdp_true_on_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_qwen3_4B_fsdp_true_on_policy.py -------------------------------------------------------------------------------- /tests/test_qwen3_4B_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tests/test_qwen3_4B_ppo.py -------------------------------------------------------------------------------- /tools/convert_hf_to_fp8.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tools/convert_hf_to_fp8.py -------------------------------------------------------------------------------- /tools/convert_hf_to_torch_dist.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tools/convert_hf_to_torch_dist.py -------------------------------------------------------------------------------- /tools/convert_k2_thinking_int4_to_bf16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tools/convert_k2_thinking_int4_to_bf16.py -------------------------------------------------------------------------------- /tools/convert_to_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tools/convert_to_hf.py -------------------------------------------------------------------------------- /tools/convert_torch_dist_to_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tools/convert_torch_dist_to_hf.py -------------------------------------------------------------------------------- /tools/fp8_cast_bf16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/tools/fp8_cast_bf16.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/train.py -------------------------------------------------------------------------------- /train_async.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUDM/slime/HEAD/train_async.py --------------------------------------------------------------------------------