├── .gitignore ├── .vscode └── settings.json ├── LICENSE ├── README-eng.md ├── README.md ├── engineer ├── how-to-use-docker │ ├── how_to_bump_version.md │ ├── readme.md │ └── readme_en.md └── uv │ ├── H200.png │ └── readme.md ├── rlhf ├── GRPO │ ├── README.md │ ├── SGLang_GRPO.md │ └── grpo-main.png ├── OpenRLHF │ ├── develop-log.md │ ├── learning-stage.png │ ├── make-experience.png │ ├── openrlhf-sglang.md │ └── readme.md ├── areal │ └── code-walk-through.md ├── partial-rollout │ ├── Learning_to_Reason_under_Off-Policy_Guidance.md │ └── readme.md ├── rl-walk-through │ ├── part-1.md │ ├── part-2.md │ ├── part-3.md │ ├── part-4.md │ ├── part-5.md │ ├── part-6.md │ ├── part-7.md │ ├── part-8.md │ └── pics │ │ ├── epsilon-regrets.png │ │ ├── ppo-cut.png │ │ └── sarsa-q-learning.png ├── slime │ ├── batch-GAE │ │ └── ppo-gae-chunk.md │ ├── code-walk-through │ │ ├── datasource.png │ │ ├── original │ │ │ ├── part-1.md │ │ │ ├── part-2.md │ │ │ ├── part-3.md │ │ │ ├── part-4.md │ │ │ └── part-5.md │ │ ├── overall_workflow.png │ │ ├── readme.md │ │ ├── readme_en.md │ │ ├── rollout_parts.png │ │ └── sampling_flow.png │ ├── fp8 │ │ ├── pic │ │ │ ├── 10_1_TIS.png │ │ │ ├── 10_2_rollout_logprob_abs_diff.png │ │ │ ├── 11_1_TIS.png │ │ │ ├── 11_2_rollout_logprob_abs_diff.png │ │ │ ├── 1_E4vsE5.png │ │ │ ├── 2_size.png │ │ │ ├── 3_Megatron.png │ │ │ ├── 4_cpu_bound.png │ │ │ ├── 5_KLloss.png │ │ │ ├── 6_FP8_quant_error.png │ │ │ ├── 7_KLloss2.png │ │ │ ├── 8_TIS.png │ │ │ ├── 9_1_TIS.png │ │ │ └── 9_2_rollout_logprob_abs_diff.png │ │ ├── readme.md │ │ └── readme_en.md │ ├── fsdp │ │ ├── pic │ │ │ ├── 1_fsdp_init.png │ │ │ ├── 2_fsdp_train.png │ │ │ ├── 3_kl_0.png │ │ │ ├── 4_fsdp_refit.png │ │ │ └── 5_fsdp_mcore_match.png │ │ ├── readme.md │ │ ├── readme_en.md │ │ └── release_log │ │ │ └── setup_fsdp.md │ └── spec │ │ ├── pic │ │ ├── cp.png │ │ ├── final-state.png │ │ ├── long-throughput.png │ │ ├── loss-flow.png │ │ ├── mtp-head.png │ │ ├── mtp-loss.png │ │ ├── overall-throughput.png │ │ ├── reward.png │ │ ├── spec-acc-len.png │ │ └── train-time.png │ │ ├── readme-en.md │ │ └── readme.md ├── sys-design │ ├── pics │ │ ├── 1f1b.png │ │ ├── chunked_pp.png │ │ ├── cross-shard.png │ │ ├── ep.png │ │ ├── epall2all.png │ │ ├── fsdp-algorithm.png │ │ ├── fthenb.png │ │ ├── mixed.png │ │ ├── tp+cp.png │ │ ├── tp+sp.png │ │ ├── tp.png │ │ └── update_weights.jpg │ ├── readme-1-EN.md │ ├── readme-1.md │ ├── readme-2-en.md │ ├── readme-2.md │ └── readme-3.md └── verl │ ├── VLM │ └── veRL-VLM.md │ ├── amd-verl-dev │ └── dev.md │ ├── img │ ├── gcs-address.png │ ├── multi-node-status.png │ ├── placement.png │ ├── ray-runtime-start.png │ ├── sandbox_supported_datasets.png │ └── sandbox_supported_languages.png │ ├── multi-turn │ ├── code-walk-through │ │ ├── dapo.md │ │ ├── readme-2-EN.md │ │ ├── readme-2.md │ │ ├── readme-3.md │ │ ├── readme-5-EN.md │ │ ├── readme-5.md │ │ ├── readme-6.md │ │ ├── readme.md │ │ └── readme_EN.md │ ├── fast_tokenization │ │ ├── multiturn_tokenization_and_masking.md │ │ ├── multiturn_tokenization_and_masking_ZH.md │ │ ├── think.jpg │ │ ├── verRL-multiturn-fast-tokenization.md │ │ └── verRL-multiturn-fast-tokenization_ZH.md │ ├── imgs │ │ ├── Multi-Turn_Rollout_Workflow.png │ │ ├── Tool_Lifecycle_and_Request_State_Transaction.png │ │ ├── Weave_Trace.jpg │ │ └── agentLoop.png │ ├── release_log │ │ ├── latest_sglang.md │ │ ├── over_sample.md │ │ ├── verl-multiturn-rollout-Release.md │ │ └── verl-multiturn-rollout-Release_ZH.md │ └── tool_examples │ │ ├── agent_loop.md │ │ ├── debug-multi-stage.md │ │ ├── debug-tp-2-multi-turn.md │ │ ├── debug-tp-2.md │ │ ├── pics │ │ ├── tui_1.png │ │ ├── tui_2.png │ │ ├── wandb.png │ │ └── wandb_600.png │ │ ├── profile.md │ │ ├── profile_en.md │ │ ├── tui.md │ │ ├── tui_en.md │ │ ├── verl-multiturn-searchR1-like.md │ │ ├── verl-multiturn-searchR1-like_ZH.md │ │ ├── verl-vlm-multiturn_ZH.md │ │ ├── weave_trace_readme.md │ │ └── weave_trace_readme_en.md │ ├── readme.md │ ├── server-based │ └── veRL-server-based-rollout.md │ ├── spin │ ├── SPIN-dev.md │ ├── dev-log.md │ └── test-log.md │ └── sppo │ ├── compare_with_ppo_grpo.md │ ├── dev-log.md │ ├── paper.md │ └── test-log.md ├── sglang ├── code-walk-through │ ├── mm_req_lifecycle.svg │ ├── multimodal_request_lifecycle.md │ ├── readme-CN.md │ ├── readme.md │ ├── sglang-architecture.svg │ └── sglang_scheduler.svg ├── constraint-decoding │ ├── readme.md │ └── readme_en.md ├── dp-attention │ └── readme.md ├── how-model-is-loaded │ ├── how-model-weight-is-loaded.md │ └── readme.md ├── kvcache-code-walk-through │ ├── kv-cache-request-lifecycle.png │ ├── readme-CN.md │ ├── readme.md │ └── scheduler_overview.png ├── latency-accelerate-for-weight-updates │ ├── readme-CN.md │ └── readme.md ├── nvidia-dynamo │ └── dynamo.md ├── online-update-weights │ └── readme.md ├── quantization │ ├── acc.png │ ├── decode_throughput.png │ ├── decodetp_degrade.png │ ├── general_background.md │ ├── gpu.png │ ├── latency.png │ ├── model_loading_pipeline.png │ ├── quantization_architecture.md │ ├── quantization_architecture_en.md │ ├── sglang-architecture.png │ ├── throughput.png │ └── unsloth.md ├── qwen │ └── coder.md ├── scheduler-evolution │ ├── SGLang Scheduler Evolution.md │ ├── SGLang Scheduler 技术变迁.md │ └── img │ │ ├── Scheduler.png │ │ ├── batch.png │ │ ├── lazy_sampling.png │ │ ├── overlap.png │ │ ├── previous_overlap.png │ │ ├── sglang_cache.png │ │ └── sglang_scheduler.svg ├── sglang-scheduler │ ├── readme-CN.md │ ├── readme.md │ └── static │ │ ├── double_check.png │ │ ├── get_next_batch_to_run.png │ │ ├── inbatch.png │ │ ├── new_token_ratio.png │ │ ├── page_attn.png │ │ └── update_running_batch.png ├── sglang-verl-engine │ └── readme.md ├── sglang-worker │ ├── SGLang-Archi.png │ ├── readme-CN.md │ └── readme.md ├── speculative-decoding │ ├── speculative-decoding.md │ ├── withSpec1.png │ ├── withSpec2.png │ └── withoutSpec.png ├── tiny-llm │ └── day1.md └── zero-overhead-scheduler │ ├── image │ ├── breakdown.png │ ├── pipeline1.png │ ├── pipeline2.png │ ├── placeholder1.png │ ├── placeholder2.png │ ├── real_pipeline1.png │ ├── real_pipeline2.png │ └── sgl_blog_pipeline.png │ └── zero-overhead-batch-scheduler.md ├── torch ├── cuda-graph │ ├── readme.md │ └── readme_en.md ├── mem-snapshot │ ├── pics │ │ ├── active-memory-timeline.png │ │ ├── forward-1.png │ │ ├── stack.png │ │ ├── step-2.png │ │ ├── step-3.png │ │ ├── step-4.png │ │ ├── with-gc.png │ │ └── without-gc.png │ ├── readme-en.md │ └── readme.md ├── nccl │ ├── NCCL.assets │ │ ├── allgather.png │ │ ├── allreduce.png │ │ ├── broadcast.png │ │ ├── dp.png │ │ ├── pp.png │ │ ├── reduce.png │ │ ├── reducescatter.png │ │ ├── ring.png │ │ └── tp.png │ ├── readme.md │ └── readme_en.md ├── tensor-parallelism │ └── readme.md └── torch-distributed │ ├── DBTree.jpg │ ├── codes │ ├── all-gather-reduce.py │ ├── all-reduce-softmax.py │ ├── broad-cast.py │ ├── init-process-group.py │ ├── new-group.py │ ├── scatter.py │ ├── send-recv-async.py │ └── send-recv-sync.py │ ├── complete-allreduce.svg │ └── readme.md └── transformers ├── attention ├── cross_attention.md ├── cross_attention_.webp └── cross_attention_en.md └── special_tokens ├── special_tokens.md └── special_tokens_en.md /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/.gitignore -------------------------------------------------------------------------------- /.vscode/settings.json: -------------------------------------------------------------------------------- 1 | { 2 | "iis.configDir": "" 3 | } -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/LICENSE -------------------------------------------------------------------------------- /README-eng.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/README-eng.md -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/README.md -------------------------------------------------------------------------------- /engineer/how-to-use-docker/how_to_bump_version.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/engineer/how-to-use-docker/how_to_bump_version.md -------------------------------------------------------------------------------- /engineer/how-to-use-docker/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/engineer/how-to-use-docker/readme.md -------------------------------------------------------------------------------- /engineer/how-to-use-docker/readme_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/engineer/how-to-use-docker/readme_en.md -------------------------------------------------------------------------------- /engineer/uv/H200.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/engineer/uv/H200.png -------------------------------------------------------------------------------- /engineer/uv/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/engineer/uv/readme.md -------------------------------------------------------------------------------- /rlhf/GRPO/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/GRPO/README.md -------------------------------------------------------------------------------- /rlhf/GRPO/SGLang_GRPO.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/GRPO/SGLang_GRPO.md -------------------------------------------------------------------------------- /rlhf/GRPO/grpo-main.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/GRPO/grpo-main.png -------------------------------------------------------------------------------- /rlhf/OpenRLHF/develop-log.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/OpenRLHF/develop-log.md -------------------------------------------------------------------------------- /rlhf/OpenRLHF/learning-stage.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/OpenRLHF/learning-stage.png -------------------------------------------------------------------------------- /rlhf/OpenRLHF/make-experience.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/OpenRLHF/make-experience.png -------------------------------------------------------------------------------- /rlhf/OpenRLHF/openrlhf-sglang.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/OpenRLHF/openrlhf-sglang.md -------------------------------------------------------------------------------- /rlhf/OpenRLHF/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/OpenRLHF/readme.md -------------------------------------------------------------------------------- /rlhf/areal/code-walk-through.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/areal/code-walk-through.md -------------------------------------------------------------------------------- /rlhf/partial-rollout/Learning_to_Reason_under_Off-Policy_Guidance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/partial-rollout/Learning_to_Reason_under_Off-Policy_Guidance.md -------------------------------------------------------------------------------- /rlhf/partial-rollout/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/partial-rollout/readme.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/part-1.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/part-1.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/part-2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/part-2.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/part-3.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/part-3.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/part-4.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/part-4.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/part-5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/part-5.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/part-6.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/part-6.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/part-7.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/part-7.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/part-8.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/part-8.md -------------------------------------------------------------------------------- /rlhf/rl-walk-through/pics/epsilon-regrets.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/pics/epsilon-regrets.png -------------------------------------------------------------------------------- /rlhf/rl-walk-through/pics/ppo-cut.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/pics/ppo-cut.png -------------------------------------------------------------------------------- /rlhf/rl-walk-through/pics/sarsa-q-learning.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/rl-walk-through/pics/sarsa-q-learning.png -------------------------------------------------------------------------------- /rlhf/slime/batch-GAE/ppo-gae-chunk.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/batch-GAE/ppo-gae-chunk.md -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/datasource.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/datasource.png -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/original/part-1.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/original/part-1.md -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/original/part-2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/original/part-2.md -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/original/part-3.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/original/part-3.md -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/original/part-4.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/original/part-4.md -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/original/part-5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/original/part-5.md -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/overall_workflow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/overall_workflow.png -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/readme.md -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/readme_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/readme_en.md -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/rollout_parts.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/rollout_parts.png -------------------------------------------------------------------------------- /rlhf/slime/code-walk-through/sampling_flow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/code-walk-through/sampling_flow.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/10_1_TIS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/10_1_TIS.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/10_2_rollout_logprob_abs_diff.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/10_2_rollout_logprob_abs_diff.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/11_1_TIS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/11_1_TIS.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/11_2_rollout_logprob_abs_diff.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/11_2_rollout_logprob_abs_diff.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/1_E4vsE5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/1_E4vsE5.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/2_size.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/2_size.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/3_Megatron.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/3_Megatron.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/4_cpu_bound.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/4_cpu_bound.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/5_KLloss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/5_KLloss.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/6_FP8_quant_error.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/6_FP8_quant_error.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/7_KLloss2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/7_KLloss2.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/8_TIS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/8_TIS.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/9_1_TIS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/9_1_TIS.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/pic/9_2_rollout_logprob_abs_diff.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/pic/9_2_rollout_logprob_abs_diff.png -------------------------------------------------------------------------------- /rlhf/slime/fp8/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/readme.md -------------------------------------------------------------------------------- /rlhf/slime/fp8/readme_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fp8/readme_en.md -------------------------------------------------------------------------------- /rlhf/slime/fsdp/pic/1_fsdp_init.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fsdp/pic/1_fsdp_init.png -------------------------------------------------------------------------------- /rlhf/slime/fsdp/pic/2_fsdp_train.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fsdp/pic/2_fsdp_train.png -------------------------------------------------------------------------------- /rlhf/slime/fsdp/pic/3_kl_0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fsdp/pic/3_kl_0.png -------------------------------------------------------------------------------- /rlhf/slime/fsdp/pic/4_fsdp_refit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fsdp/pic/4_fsdp_refit.png -------------------------------------------------------------------------------- /rlhf/slime/fsdp/pic/5_fsdp_mcore_match.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fsdp/pic/5_fsdp_mcore_match.png -------------------------------------------------------------------------------- /rlhf/slime/fsdp/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fsdp/readme.md -------------------------------------------------------------------------------- /rlhf/slime/fsdp/readme_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fsdp/readme_en.md -------------------------------------------------------------------------------- /rlhf/slime/fsdp/release_log/setup_fsdp.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/fsdp/release_log/setup_fsdp.md -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/cp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/cp.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/final-state.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/final-state.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/long-throughput.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/long-throughput.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/loss-flow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/loss-flow.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/mtp-head.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/mtp-head.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/mtp-loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/mtp-loss.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/overall-throughput.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/overall-throughput.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/reward.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/reward.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/spec-acc-len.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/spec-acc-len.png -------------------------------------------------------------------------------- /rlhf/slime/spec/pic/train-time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/pic/train-time.png -------------------------------------------------------------------------------- /rlhf/slime/spec/readme-en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/readme-en.md -------------------------------------------------------------------------------- /rlhf/slime/spec/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/slime/spec/readme.md -------------------------------------------------------------------------------- /rlhf/sys-design/pics/1f1b.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/1f1b.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/chunked_pp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/chunked_pp.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/cross-shard.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/cross-shard.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/ep.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/ep.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/epall2all.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/epall2all.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/fsdp-algorithm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/fsdp-algorithm.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/fthenb.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/fthenb.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/mixed.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/mixed.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/tp+cp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/tp+cp.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/tp+sp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/tp+sp.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/tp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/tp.png -------------------------------------------------------------------------------- /rlhf/sys-design/pics/update_weights.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/pics/update_weights.jpg -------------------------------------------------------------------------------- /rlhf/sys-design/readme-1-EN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/readme-1-EN.md -------------------------------------------------------------------------------- /rlhf/sys-design/readme-1.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/readme-1.md -------------------------------------------------------------------------------- /rlhf/sys-design/readme-2-en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/readme-2-en.md -------------------------------------------------------------------------------- /rlhf/sys-design/readme-2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/readme-2.md -------------------------------------------------------------------------------- /rlhf/sys-design/readme-3.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/sys-design/readme-3.md -------------------------------------------------------------------------------- /rlhf/verl/VLM/veRL-VLM.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/VLM/veRL-VLM.md -------------------------------------------------------------------------------- /rlhf/verl/amd-verl-dev/dev.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/amd-verl-dev/dev.md -------------------------------------------------------------------------------- /rlhf/verl/img/gcs-address.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/img/gcs-address.png -------------------------------------------------------------------------------- /rlhf/verl/img/multi-node-status.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/img/multi-node-status.png -------------------------------------------------------------------------------- /rlhf/verl/img/placement.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/img/placement.png -------------------------------------------------------------------------------- /rlhf/verl/img/ray-runtime-start.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/img/ray-runtime-start.png -------------------------------------------------------------------------------- /rlhf/verl/img/sandbox_supported_datasets.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/img/sandbox_supported_datasets.png -------------------------------------------------------------------------------- /rlhf/verl/img/sandbox_supported_languages.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/img/sandbox_supported_languages.png -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/dapo.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/dapo.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/readme-2-EN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/readme-2-EN.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/readme-2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/readme-2.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/readme-3.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/readme-3.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/readme-5-EN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/readme-5-EN.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/readme-5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/readme-5.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/readme-6.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/readme-6.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/readme.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/code-walk-through/readme_EN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/code-walk-through/readme_EN.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/fast_tokenization/multiturn_tokenization_and_masking.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/fast_tokenization/multiturn_tokenization_and_masking.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/fast_tokenization/multiturn_tokenization_and_masking_ZH.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/fast_tokenization/multiturn_tokenization_and_masking_ZH.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/fast_tokenization/think.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/fast_tokenization/think.jpg -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/fast_tokenization/verRL-multiturn-fast-tokenization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/fast_tokenization/verRL-multiturn-fast-tokenization.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/fast_tokenization/verRL-multiturn-fast-tokenization_ZH.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/fast_tokenization/verRL-multiturn-fast-tokenization_ZH.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/imgs/Multi-Turn_Rollout_Workflow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/imgs/Multi-Turn_Rollout_Workflow.png -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/imgs/Tool_Lifecycle_and_Request_State_Transaction.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/imgs/Tool_Lifecycle_and_Request_State_Transaction.png -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/imgs/Weave_Trace.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/imgs/Weave_Trace.jpg -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/imgs/agentLoop.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/imgs/agentLoop.png -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/release_log/latest_sglang.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/release_log/latest_sglang.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/release_log/over_sample.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/release_log/over_sample.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/release_log/verl-multiturn-rollout-Release.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/release_log/verl-multiturn-rollout-Release.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/release_log/verl-multiturn-rollout-Release_ZH.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/release_log/verl-multiturn-rollout-Release_ZH.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/agent_loop.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/agent_loop.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/debug-multi-stage.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/debug-multi-stage.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/debug-tp-2-multi-turn.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/debug-tp-2-multi-turn.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/debug-tp-2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/debug-tp-2.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/pics/tui_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/pics/tui_1.png -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/pics/tui_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/pics/tui_2.png -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/pics/wandb.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/pics/wandb.png -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/pics/wandb_600.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/pics/wandb_600.png -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/profile.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/profile.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/profile_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/profile_en.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/tui.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/tui.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/tui_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/tui_en.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/verl-multiturn-searchR1-like.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/verl-multiturn-searchR1-like.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/verl-multiturn-searchR1-like_ZH.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/verl-multiturn-searchR1-like_ZH.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/verl-vlm-multiturn_ZH.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/verl-vlm-multiturn_ZH.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/weave_trace_readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/weave_trace_readme.md -------------------------------------------------------------------------------- /rlhf/verl/multi-turn/tool_examples/weave_trace_readme_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/multi-turn/tool_examples/weave_trace_readme_en.md -------------------------------------------------------------------------------- /rlhf/verl/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/readme.md -------------------------------------------------------------------------------- /rlhf/verl/server-based/veRL-server-based-rollout.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/server-based/veRL-server-based-rollout.md -------------------------------------------------------------------------------- /rlhf/verl/spin/SPIN-dev.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/spin/SPIN-dev.md -------------------------------------------------------------------------------- /rlhf/verl/spin/dev-log.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/spin/dev-log.md -------------------------------------------------------------------------------- /rlhf/verl/spin/test-log.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/spin/test-log.md -------------------------------------------------------------------------------- /rlhf/verl/sppo/compare_with_ppo_grpo.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/sppo/compare_with_ppo_grpo.md -------------------------------------------------------------------------------- /rlhf/verl/sppo/dev-log.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/sppo/dev-log.md -------------------------------------------------------------------------------- /rlhf/verl/sppo/paper.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/sppo/paper.md -------------------------------------------------------------------------------- /rlhf/verl/sppo/test-log.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/rlhf/verl/sppo/test-log.md -------------------------------------------------------------------------------- /sglang/code-walk-through/mm_req_lifecycle.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/code-walk-through/mm_req_lifecycle.svg -------------------------------------------------------------------------------- /sglang/code-walk-through/multimodal_request_lifecycle.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/code-walk-through/multimodal_request_lifecycle.md -------------------------------------------------------------------------------- /sglang/code-walk-through/readme-CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/code-walk-through/readme-CN.md -------------------------------------------------------------------------------- /sglang/code-walk-through/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/code-walk-through/readme.md -------------------------------------------------------------------------------- /sglang/code-walk-through/sglang-architecture.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/code-walk-through/sglang-architecture.svg -------------------------------------------------------------------------------- /sglang/code-walk-through/sglang_scheduler.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/code-walk-through/sglang_scheduler.svg -------------------------------------------------------------------------------- /sglang/constraint-decoding/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/constraint-decoding/readme.md -------------------------------------------------------------------------------- /sglang/constraint-decoding/readme_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/constraint-decoding/readme_en.md -------------------------------------------------------------------------------- /sglang/dp-attention/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/dp-attention/readme.md -------------------------------------------------------------------------------- /sglang/how-model-is-loaded/how-model-weight-is-loaded.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/how-model-is-loaded/how-model-weight-is-loaded.md -------------------------------------------------------------------------------- /sglang/how-model-is-loaded/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/how-model-is-loaded/readme.md -------------------------------------------------------------------------------- /sglang/kvcache-code-walk-through/kv-cache-request-lifecycle.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/kvcache-code-walk-through/kv-cache-request-lifecycle.png -------------------------------------------------------------------------------- /sglang/kvcache-code-walk-through/readme-CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/kvcache-code-walk-through/readme-CN.md -------------------------------------------------------------------------------- /sglang/kvcache-code-walk-through/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/kvcache-code-walk-through/readme.md -------------------------------------------------------------------------------- /sglang/kvcache-code-walk-through/scheduler_overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/kvcache-code-walk-through/scheduler_overview.png -------------------------------------------------------------------------------- /sglang/latency-accelerate-for-weight-updates/readme-CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/latency-accelerate-for-weight-updates/readme-CN.md -------------------------------------------------------------------------------- /sglang/latency-accelerate-for-weight-updates/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/latency-accelerate-for-weight-updates/readme.md -------------------------------------------------------------------------------- /sglang/nvidia-dynamo/dynamo.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/nvidia-dynamo/dynamo.md -------------------------------------------------------------------------------- /sglang/online-update-weights/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/online-update-weights/readme.md -------------------------------------------------------------------------------- /sglang/quantization/acc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/acc.png -------------------------------------------------------------------------------- /sglang/quantization/decode_throughput.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/decode_throughput.png -------------------------------------------------------------------------------- /sglang/quantization/decodetp_degrade.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/decodetp_degrade.png -------------------------------------------------------------------------------- /sglang/quantization/general_background.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/general_background.md -------------------------------------------------------------------------------- /sglang/quantization/gpu.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/gpu.png -------------------------------------------------------------------------------- /sglang/quantization/latency.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/latency.png -------------------------------------------------------------------------------- /sglang/quantization/model_loading_pipeline.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/model_loading_pipeline.png -------------------------------------------------------------------------------- /sglang/quantization/quantization_architecture.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/quantization_architecture.md -------------------------------------------------------------------------------- /sglang/quantization/quantization_architecture_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/quantization_architecture_en.md -------------------------------------------------------------------------------- /sglang/quantization/sglang-architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/sglang-architecture.png -------------------------------------------------------------------------------- /sglang/quantization/throughput.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/throughput.png -------------------------------------------------------------------------------- /sglang/quantization/unsloth.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/quantization/unsloth.md -------------------------------------------------------------------------------- /sglang/qwen/coder.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/qwen/coder.md -------------------------------------------------------------------------------- /sglang/scheduler-evolution/SGLang Scheduler Evolution.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/SGLang Scheduler Evolution.md -------------------------------------------------------------------------------- /sglang/scheduler-evolution/SGLang Scheduler 技术变迁.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/SGLang Scheduler 技术变迁.md -------------------------------------------------------------------------------- /sglang/scheduler-evolution/img/Scheduler.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/img/Scheduler.png -------------------------------------------------------------------------------- /sglang/scheduler-evolution/img/batch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/img/batch.png -------------------------------------------------------------------------------- /sglang/scheduler-evolution/img/lazy_sampling.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/img/lazy_sampling.png -------------------------------------------------------------------------------- /sglang/scheduler-evolution/img/overlap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/img/overlap.png -------------------------------------------------------------------------------- /sglang/scheduler-evolution/img/previous_overlap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/img/previous_overlap.png -------------------------------------------------------------------------------- /sglang/scheduler-evolution/img/sglang_cache.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/img/sglang_cache.png -------------------------------------------------------------------------------- /sglang/scheduler-evolution/img/sglang_scheduler.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/scheduler-evolution/img/sglang_scheduler.svg -------------------------------------------------------------------------------- /sglang/sglang-scheduler/readme-CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-scheduler/readme-CN.md -------------------------------------------------------------------------------- /sglang/sglang-scheduler/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-scheduler/readme.md -------------------------------------------------------------------------------- /sglang/sglang-scheduler/static/double_check.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-scheduler/static/double_check.png -------------------------------------------------------------------------------- /sglang/sglang-scheduler/static/get_next_batch_to_run.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-scheduler/static/get_next_batch_to_run.png -------------------------------------------------------------------------------- /sglang/sglang-scheduler/static/inbatch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-scheduler/static/inbatch.png -------------------------------------------------------------------------------- /sglang/sglang-scheduler/static/new_token_ratio.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-scheduler/static/new_token_ratio.png -------------------------------------------------------------------------------- /sglang/sglang-scheduler/static/page_attn.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-scheduler/static/page_attn.png -------------------------------------------------------------------------------- /sglang/sglang-scheduler/static/update_running_batch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-scheduler/static/update_running_batch.png -------------------------------------------------------------------------------- /sglang/sglang-verl-engine/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-verl-engine/readme.md -------------------------------------------------------------------------------- /sglang/sglang-worker/SGLang-Archi.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-worker/SGLang-Archi.png -------------------------------------------------------------------------------- /sglang/sglang-worker/readme-CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-worker/readme-CN.md -------------------------------------------------------------------------------- /sglang/sglang-worker/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/sglang-worker/readme.md -------------------------------------------------------------------------------- /sglang/speculative-decoding/speculative-decoding.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/speculative-decoding/speculative-decoding.md -------------------------------------------------------------------------------- /sglang/speculative-decoding/withSpec1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/speculative-decoding/withSpec1.png -------------------------------------------------------------------------------- /sglang/speculative-decoding/withSpec2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/speculative-decoding/withSpec2.png -------------------------------------------------------------------------------- /sglang/speculative-decoding/withoutSpec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/speculative-decoding/withoutSpec.png -------------------------------------------------------------------------------- /sglang/tiny-llm/day1.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/tiny-llm/day1.md -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/image/breakdown.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/image/breakdown.png -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/image/pipeline1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/image/pipeline1.png -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/image/pipeline2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/image/pipeline2.png -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/image/placeholder1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/image/placeholder1.png -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/image/placeholder2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/image/placeholder2.png -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/image/real_pipeline1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/image/real_pipeline1.png -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/image/real_pipeline2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/image/real_pipeline2.png -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/image/sgl_blog_pipeline.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/image/sgl_blog_pipeline.png -------------------------------------------------------------------------------- /sglang/zero-overhead-scheduler/zero-overhead-batch-scheduler.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/sglang/zero-overhead-scheduler/zero-overhead-batch-scheduler.md -------------------------------------------------------------------------------- /torch/cuda-graph/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/cuda-graph/readme.md -------------------------------------------------------------------------------- /torch/cuda-graph/readme_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/cuda-graph/readme_en.md -------------------------------------------------------------------------------- /torch/mem-snapshot/pics/active-memory-timeline.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/pics/active-memory-timeline.png -------------------------------------------------------------------------------- /torch/mem-snapshot/pics/forward-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/pics/forward-1.png -------------------------------------------------------------------------------- /torch/mem-snapshot/pics/stack.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/pics/stack.png -------------------------------------------------------------------------------- /torch/mem-snapshot/pics/step-2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/pics/step-2.png -------------------------------------------------------------------------------- /torch/mem-snapshot/pics/step-3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/pics/step-3.png -------------------------------------------------------------------------------- /torch/mem-snapshot/pics/step-4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/pics/step-4.png -------------------------------------------------------------------------------- /torch/mem-snapshot/pics/with-gc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/pics/with-gc.png -------------------------------------------------------------------------------- /torch/mem-snapshot/pics/without-gc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/pics/without-gc.png -------------------------------------------------------------------------------- /torch/mem-snapshot/readme-en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/readme-en.md -------------------------------------------------------------------------------- /torch/mem-snapshot/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/mem-snapshot/readme.md -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/allgather.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/allgather.png -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/allreduce.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/allreduce.png -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/broadcast.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/broadcast.png -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/dp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/dp.png -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/pp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/pp.png -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/reduce.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/reduce.png -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/reducescatter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/reducescatter.png -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/ring.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/ring.png -------------------------------------------------------------------------------- /torch/nccl/NCCL.assets/tp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/NCCL.assets/tp.png -------------------------------------------------------------------------------- /torch/nccl/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/readme.md -------------------------------------------------------------------------------- /torch/nccl/readme_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/nccl/readme_en.md -------------------------------------------------------------------------------- /torch/tensor-parallelism/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/tensor-parallelism/readme.md -------------------------------------------------------------------------------- /torch/torch-distributed/DBTree.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/DBTree.jpg -------------------------------------------------------------------------------- /torch/torch-distributed/codes/all-gather-reduce.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/codes/all-gather-reduce.py -------------------------------------------------------------------------------- /torch/torch-distributed/codes/all-reduce-softmax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/codes/all-reduce-softmax.py -------------------------------------------------------------------------------- /torch/torch-distributed/codes/broad-cast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/codes/broad-cast.py -------------------------------------------------------------------------------- /torch/torch-distributed/codes/init-process-group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/codes/init-process-group.py -------------------------------------------------------------------------------- /torch/torch-distributed/codes/new-group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/codes/new-group.py -------------------------------------------------------------------------------- /torch/torch-distributed/codes/scatter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/codes/scatter.py -------------------------------------------------------------------------------- /torch/torch-distributed/codes/send-recv-async.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/codes/send-recv-async.py -------------------------------------------------------------------------------- /torch/torch-distributed/codes/send-recv-sync.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/codes/send-recv-sync.py -------------------------------------------------------------------------------- /torch/torch-distributed/complete-allreduce.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/complete-allreduce.svg -------------------------------------------------------------------------------- /torch/torch-distributed/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/torch/torch-distributed/readme.md -------------------------------------------------------------------------------- /transformers/attention/cross_attention.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/transformers/attention/cross_attention.md -------------------------------------------------------------------------------- /transformers/attention/cross_attention_.webp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/transformers/attention/cross_attention_.webp -------------------------------------------------------------------------------- /transformers/attention/cross_attention_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/transformers/attention/cross_attention_en.md -------------------------------------------------------------------------------- /transformers/special_tokens/special_tokens.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/transformers/special_tokens/special_tokens.md -------------------------------------------------------------------------------- /transformers/special_tokens/special_tokens_en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zhaochenyang20/Awesome-ML-SYS-Tutorial/HEAD/transformers/special_tokens/special_tokens_en.md --------------------------------------------------------------------------------