├── .gitignore ├── README.md ├── assets └── teaser.png ├── lmms-eval ├── CLAUDE.md ├── LICENSE ├── README.md ├── docs │ ├── README.md │ ├── commands.md │ ├── current_tasks.md │ ├── lmms-eval-0.3.md │ ├── lmms-eval-0.4.md │ ├── model_guide.md │ ├── run_examples.md │ ├── task_guide.md │ └── throughput_metrics.md ├── examples │ ├── chat_templates │ │ └── tool_call_qwen2_5_vl.jinja │ ├── mcp_server │ │ └── sample_mcp_server.py │ └── models │ │ ├── aero_1_audio.sh │ │ ├── aria.sh │ │ ├── auroracap.sh │ │ ├── claude.sh │ │ ├── idefics2.sh │ │ ├── instructblip.sh │ │ ├── internvl1.5.sh │ │ ├── internvl2.sh │ │ ├── llama_vid.sh │ │ ├── llama_vision.sh │ │ ├── llava_1_5.sh │ │ ├── llava_next.sh │ │ ├── llava_onevision.sh │ │ ├── llava_video.sh │ │ ├── movie_chat.sh │ │ ├── mplug_owl.sh │ │ ├── openai_compatible.sh │ │ ├── plm.sh │ │ ├── qwen25vl.sh │ │ ├── qwen2vl.sh │ │ ├── sglang.sh │ │ ├── slime.sh │ │ ├── tensor_parallel.sh │ │ ├── tinyllava.sh │ │ ├── video_chatgpt.sh │ │ ├── video_llava.sh │ │ ├── vllm_qwen2vl.sh │ │ ├── xai_grok.sh │ │ └── xcomposer.sh ├── fla │ ├── __init__.py │ ├── layers │ │ ├── __init__.py │ │ ├── abc.py │ │ ├── attn.py │ │ ├── based.py │ │ ├── bitattn.py │ │ ├── comba.py │ │ ├── delta_net.py │ │ ├── forgetting_attn.py │ │ ├── gated_deltanet.py │ │ ├── gated_deltaproduct.py │ │ ├── gla.py │ │ ├── gsa.py │ │ ├── hgrn.py │ │ ├── hgrn2.py │ │ ├── lightnet.py │ │ ├── linear_attn.py │ │ ├── mamba.py │ │ ├── mamba2.py │ │ ├── mesa_net.py │ │ ├── mla.py │ │ ├── multiscale_retention.py │ │ ├── nsa.py │ │ ├── path_attn.py │ │ ├── rebased.py │ │ ├── rodimus.py │ │ ├── rwkv6.py │ │ ├── rwkv7.py │ │ ├── simple_gla.py │ │ └── utils.py │ ├── models │ │ ├── __init__.py │ │ ├── abc │ │ │ ├── __init__.py │ │ │ ├── configuration_abc.py │ │ │ └── modeling_abc.py │ │ ├── bitnet │ │ │ ├── __init__.py │ │ │ ├── configuration_bitnet.py │ │ │ └── modeling_bitnet.py │ │ ├── comba │ │ │ ├── __init__.py │ │ │ ├── configuration_comba.py │ │ │ └── modeling_comba.py │ │ ├── delta_net │ │ │ ├── __init__.py │ │ │ ├── configuration_delta_net.py │ │ │ └── modeling_delta_net.py │ │ ├── forgetting_transformer │ │ │ ├── __init__.py │ │ │ ├── configuration_forgetting_transformer.py │ │ │ └── modeling_forgetting_transformer.py │ │ ├── gated_deltanet │ │ │ ├── __init__.py │ │ │ ├── configuration_gated_deltanet.py │ │ │ └── modeling_gated_deltanet.py │ │ ├── gated_deltaproduct │ │ │ ├── __init__.py │ │ │ ├── configuration_gated_deltaproduct.py │ │ │ └── modeling_gated_deltaproduct.py │ │ ├── gla │ │ │ ├── __init__.py │ │ │ ├── configuration_gla.py │ │ │ └── modeling_gla.py │ │ ├── gsa │ │ │ ├── __init__.py │ │ │ ├── configuration_gsa.py │ │ │ └── modeling_gsa.py │ │ ├── hgrn │ │ │ ├── __init__.py │ │ │ ├── configuration_hgrn.py │ │ │ └── modeling_hgrn.py │ │ ├── hgrn2 │ │ │ ├── __init__.py │ │ │ ├── configuration_hgrn2.py │ │ │ └── modeling_hgrn2.py │ │ ├── lightnet │ │ │ ├── __init__.py │ │ │ ├── configuration_lightnet.py │ │ │ └── modeling_lightnet.py │ │ ├── linear_attn │ │ │ ├── __init__.py │ │ │ ├── configuration_linear_attn.py │ │ │ └── modeling_linear_attn.py │ │ ├── mamba │ │ │ ├── __init__.py │ │ │ ├── configuration_mamba.py │ │ │ └── modeling_mamba.py │ │ ├── mamba2 │ │ │ ├── __init__.py │ │ │ ├── configuration_mamba2.py │ │ │ └── modeling_mamba2.py │ │ ├── mesa_net │ │ │ ├── __init__.py │ │ │ ├── configuration_mesa_net.py │ │ │ └── modeling_mesa_net.py │ │ ├── mla │ │ │ ├── __init__.py │ │ │ ├── configuration_mla.py │ │ │ └── modeling_mla.py │ │ ├── nsa │ │ │ ├── __init__.py │ │ │ ├── configuration_nsa.py │ │ │ └── modeling_nsa.py │ │ ├── path_attn │ │ │ ├── __init__.py │ │ │ ├── configuration_path_attention.py │ │ │ └── modeling_path_attention.py │ │ ├── retnet │ │ │ ├── __init__.py │ │ │ ├── configuration_retnet.py │ │ │ └── modeling_retnet.py │ │ ├── rodimus │ │ │ ├── __init__.py │ │ │ ├── configuration_rodimus.py │ │ │ └── modeling_rodimus.py │ │ ├── rwkv6 │ │ │ ├── __init__.py │ │ │ ├── configuration_rwkv6.py │ │ │ └── modeling_rwkv6.py │ │ ├── rwkv7 │ │ │ ├── __init__.py │ │ │ ├── configuration_rwkv7.py │ │ │ └── modeling_rwkv7.py │ │ ├── samba │ │ │ ├── __init__.py │ │ │ ├── configuration_samba.py │ │ │ └── modeling_samba.py │ │ ├── transformer │ │ │ ├── __init__.py │ │ │ ├── configuration_transformer.py │ │ │ └── modeling_transformer.py │ │ └── utils.py │ ├── modules │ │ ├── __init__.py │ │ ├── activations.py │ │ ├── convolution.py │ │ ├── feature_map.py │ │ ├── fused_bitlinear.py │ │ ├── fused_cross_entropy.py │ │ ├── fused_kl_div.py │ │ ├── fused_linear_cross_entropy.py │ │ ├── fused_norm_gate.py │ │ ├── grpo.py │ │ ├── l2norm.py │ │ ├── l2warp.py │ │ ├── layernorm.py │ │ ├── layernorm_gated.py │ │ ├── mlp.py │ │ ├── parallel.py │ │ ├── rotary.py │ │ └── token_shift.py │ ├── ops │ │ ├── __init__.py │ │ ├── abc │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ └── naive.py │ │ ├── attn │ │ │ ├── __init__.py │ │ │ ├── decoding.py │ │ │ └── parallel.py │ │ ├── based │ │ │ ├── __init__.py │ │ │ ├── fused_chunk.py │ │ │ ├── naive.py │ │ │ └── parallel.py │ │ ├── comba │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── utils.py │ │ │ └── wy_fast.py │ │ ├── common │ │ │ ├── __init__.py │ │ │ ├── chunk_delta_h.py │ │ │ ├── chunk_h.py │ │ │ ├── chunk_h_parallel.py │ │ │ ├── chunk_h_split.py │ │ │ ├── chunk_o.py │ │ │ ├── chunk_scaled_dot_kkt.py │ │ │ ├── fused_chunk.py │ │ │ └── fused_recurrent.py │ │ ├── delta_rule │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── naive.py │ │ │ ├── parallel.py │ │ │ └── wy_fast.py │ │ ├── forgetting_attn │ │ │ ├── __init__.py │ │ │ └── parallel.py │ │ ├── gated_delta_product │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── chunk_deltaproduct_h.py │ │ │ ├── chunk_deltaproduct_o.py │ │ │ ├── chunk_ref.py │ │ │ └── naive.py │ │ ├── gated_delta_rule │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_recurrent.py │ │ │ └── wy_fast.py │ │ ├── generalized_delta_rule │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── dplr │ │ │ │ ├── __init__.py │ │ │ │ ├── chunk.py │ │ │ │ ├── chunk_A_bwd.py │ │ │ │ ├── chunk_A_fwd.py │ │ │ │ ├── chunk_h_bwd.py │ │ │ │ ├── chunk_h_fwd.py │ │ │ │ ├── chunk_o_bwd.py │ │ │ │ ├── chunk_o_fwd.py │ │ │ │ ├── fused_recurrent.py │ │ │ │ ├── naive.py │ │ │ │ ├── wy_fast_bwd.py │ │ │ │ └── wy_fast_fwd.py │ │ │ └── iplr │ │ │ │ ├── __init__.py │ │ │ │ ├── chunk.py │ │ │ │ ├── fused_recurrent.py │ │ │ │ ├── naive.py │ │ │ │ └── wy_fast.py │ │ ├── gla │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ └── naive.py │ │ ├── gsa │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_recurrent.py │ │ │ └── naive.py │ │ ├── hgrn │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_recurrent.py │ │ │ └── naive.py │ │ ├── lightning_attn │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ └── fused_recurrent.py │ │ ├── linear_attn │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── naive.py │ │ │ └── utils.py │ │ ├── mesa_net │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── chunk_cg_solver_bwd.py │ │ │ ├── chunk_cg_solver_fwd.py │ │ │ ├── chunk_h_fwd.py │ │ │ ├── chunk_h_kk_intra_bwd.py │ │ │ ├── chunk_h_kv_intra_bwd.py │ │ │ ├── chunk_h_kv_intra_bwd_separate.py │ │ │ ├── decoding_one_step.py │ │ │ └── naive.py │ │ ├── nsa │ │ │ ├── __init__.py │ │ │ ├── compression.py │ │ │ ├── naive.py │ │ │ ├── parallel.py │ │ │ └── utils.py │ │ ├── path_attn │ │ │ ├── __init__.py │ │ │ ├── cumprod_householder_bwd.py │ │ │ ├── cumprod_householder_fwd.py │ │ │ ├── intra_chunk_preprocess_bwd.py │ │ │ ├── intra_chunk_preprocess_bwd_prepare.py │ │ │ ├── intra_chunk_preprocess_fwd.py │ │ │ ├── parallel.py │ │ │ ├── parallel_path_bwd_inter_dkv.py │ │ │ ├── parallel_path_bwd_inter_dqh.py │ │ │ ├── parallel_path_bwd_intra.py │ │ │ ├── parallel_path_fwd.py │ │ │ ├── prepare_k_cache.py │ │ │ └── transform_q.py │ │ ├── rebased │ │ │ ├── __init__.py │ │ │ ├── naive.py │ │ │ └── parallel.py │ │ ├── retention │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── naive.py │ │ │ └── parallel.py │ │ ├── rwkv4 │ │ │ ├── __init__.py │ │ │ └── fused_recurrent.py │ │ ├── rwkv6 │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── chunk_naive.py │ │ │ ├── fused_recurrent.py │ │ │ └── recurrent_naive.py │ │ ├── rwkv7 │ │ │ ├── RWKV7(Goose).md │ │ │ ├── __init__.py │ │ │ ├── channel_mixing.py │ │ │ ├── chunk.py │ │ │ ├── fused_addcmul.py │ │ │ ├── fused_k_update.py │ │ │ ├── fused_recurrent.py │ │ │ └── gate_output_correction.py │ │ ├── simple_gla │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── naive.py │ │ │ └── parallel.py │ │ ├── titans │ │ │ ├── __init__.py │ │ │ ├── log_impl.py │ │ │ └── naive.py │ │ ├── ttt │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ └── naive.py │ │ └── utils │ │ │ ├── __init__.py │ │ │ ├── asm.py │ │ │ ├── constant.py │ │ │ ├── cumsum.py │ │ │ ├── index.py │ │ │ ├── logcumsumexp.py │ │ │ ├── logsumexp.py │ │ │ ├── matmul.py │ │ │ ├── op.py │ │ │ ├── pack.py │ │ │ ├── pooling.py │ │ │ ├── softmax.py │ │ │ └── solve_tril.py │ └── utils.py ├── lmms_eval │ ├── __init__.py │ ├── __main__.py │ ├── api │ │ ├── __init__.py │ │ ├── filter.py │ │ ├── group.py │ │ ├── instance.py │ │ ├── metrics.py │ │ ├── model.py │ │ ├── registry.py │ │ ├── samplers.py │ │ └── task.py │ ├── caching │ │ ├── __init__.py │ │ └── cache.py │ ├── evaluator.py │ ├── evaluator_utils.py │ ├── filters │ │ ├── __init__.py │ │ ├── decontamination.py │ │ ├── extraction.py │ │ ├── selection.py │ │ └── transformation.py │ ├── llm_judge │ │ ├── __init__.py │ │ ├── base.py │ │ ├── factory.py │ │ ├── launcher │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ └── sglang.py │ │ ├── prompt.py │ │ ├── protocol.py │ │ ├── providers │ │ │ ├── __init__.py │ │ │ ├── async_azure_openai.py │ │ │ ├── async_openai.py │ │ │ ├── azure_openai.py │ │ │ ├── dummy.py │ │ │ └── openai.py │ │ └── utils.py │ ├── loggers │ │ ├── __init__.py │ │ ├── evaluation_tracker.py │ │ ├── utils.py │ │ └── wandb_logger.py │ ├── logging_utils.py │ ├── mcp │ │ ├── __init__.py │ │ └── client.py │ ├── models │ │ ├── __init__.py │ │ ├── chat │ │ │ ├── async_openai.py │ │ │ ├── huggingface.py │ │ │ ├── llava_hf.py │ │ │ ├── openai_compatible.py │ │ │ ├── qwen2_5_vl.py │ │ │ ├── sglang.py │ │ │ └── vllm.py │ │ ├── model_utils │ │ │ ├── __init__.py │ │ │ ├── audio_processing.py │ │ │ ├── gen_metrics.py │ │ │ ├── load_video.py │ │ │ ├── qwen │ │ │ │ └── qwen_generate_utils.py │ │ │ └── reasoning_model_utils.py │ │ ├── qwen25_vl │ │ │ ├── __init__.py │ │ │ ├── configuration_qwen2_5_vl.py │ │ │ ├── modeling │ │ │ │ ├── flex_attention.py │ │ │ │ ├── initial.py │ │ │ │ ├── last_layer.py │ │ │ │ ├── modeling_flash_attention_utils.py │ │ │ │ ├── modeling_rope_utils.py │ │ │ │ ├── npu_flash_attention.py │ │ │ │ └── utils │ │ │ │ │ ├── args_doc.py │ │ │ │ │ ├── doc.py │ │ │ │ │ ├── generic.py │ │ │ │ │ ├── import_utils.py │ │ │ │ │ └── logging.py │ │ │ ├── modeling_qwen2_5_vl.py │ │ │ ├── processing_qwen2_5_vl.py │ │ │ └── vision_process.py │ │ └── simple │ │ │ ├── aero.py │ │ │ ├── aria.py │ │ │ ├── auroracap.py │ │ │ ├── batch_gpt4.py │ │ │ ├── cambrian.py │ │ │ ├── claude.py │ │ │ ├── cogvlm2.py │ │ │ ├── egogpt.py │ │ │ ├── from_log.py │ │ │ ├── fuyu.py │ │ │ ├── gemini_api.py │ │ │ ├── gpt4v.py │ │ │ ├── idefics2.py │ │ │ ├── instructblip.py │ │ │ ├── internvideo2.py │ │ │ ├── internvideo2_5.py │ │ │ ├── internvl.py │ │ │ ├── internvl2.py │ │ │ ├── llama_vid.py │ │ │ ├── llama_vision.py │ │ │ ├── llava.py │ │ │ ├── llava_hf.py │ │ │ ├── llava_onevision.py │ │ │ ├── llava_onevision_moviechat.py │ │ │ ├── llava_sglang.py │ │ │ ├── llava_vid.py │ │ │ ├── longva.py │ │ │ ├── mantis.py │ │ │ ├── minicpm_v.py │ │ │ ├── minimonkey.py │ │ │ ├── moviechat.py │ │ │ ├── mplug_owl_video.py │ │ │ ├── ola.py │ │ │ ├── openai_compatible.py │ │ │ ├── oryx.py │ │ │ ├── phi3v.py │ │ │ ├── phi4_multimodal.py │ │ │ ├── plm.py │ │ │ ├── qwen25_vl_flexprefill.py │ │ │ ├── qwen25_vl_minference.py │ │ │ ├── qwen25_vl_trishape.py │ │ │ ├── qwen25_vl_xattention.py │ │ │ ├── qwen2_5_omni.py │ │ │ ├── qwen2_5_vl.py │ │ │ ├── qwen2_5_vl_interleave.py │ │ │ ├── qwen2_audio.py │ │ │ ├── qwen2_vl.py │ │ │ ├── qwen_vl.py │ │ │ ├── qwen_vl_api.py │ │ │ ├── reka.py │ │ │ ├── ross.py │ │ │ ├── slime.py │ │ │ ├── srt_api.py │ │ │ ├── tinyllava.py │ │ │ ├── video_chatgpt.py │ │ │ ├── video_llava.py │ │ │ ├── videochat2.py │ │ │ ├── videochat_flash.py │ │ │ ├── videollama3.py │ │ │ ├── videonsa.py │ │ │ ├── vila.py │ │ │ ├── vita.py │ │ │ ├── vllm.py │ │ │ ├── vora.py │ │ │ ├── whisper.py │ │ │ ├── whisper_vllm.py │ │ │ ├── xcomposer2_4KHD.py │ │ │ └── xcomposer2d5.py │ ├── protocol.py │ ├── tasks │ │ ├── VisualPuzzles │ │ │ ├── VisualPuzzles_cot.yaml │ │ │ ├── VisualPuzzles_direct.yaml │ │ │ └── utils.py │ │ ├── __init__.py │ │ ├── _task_utils │ │ │ ├── file_utils.py │ │ │ ├── gpt_eval_utils.py │ │ │ ├── math_verify_utils.py │ │ │ ├── video_loader.py │ │ │ └── vqa_eval_metric.py │ │ ├── activitynetqa │ │ │ ├── _default_template_yaml │ │ │ ├── activitynetqa_generation.yaml │ │ │ └── utils.py │ │ ├── ai2d │ │ │ ├── ai2d.yaml │ │ │ ├── ai2d_lite.yaml │ │ │ ├── ai2d_no_mask.yaml │ │ │ ├── upload_ai2d.py │ │ │ └── utils.py │ │ ├── aime │ │ │ ├── README.md │ │ │ ├── aime24_figures.yaml │ │ │ ├── aime24_figures_agg64.yaml │ │ │ ├── aime24_nofigures.yaml │ │ │ ├── aime24_nofigures_agg64.yaml │ │ │ ├── aime24_nofigures_agg8.yaml │ │ │ ├── aime25_nofigures.yaml │ │ │ ├── aime25_nofigures_agg64.yaml │ │ │ ├── aime25_nofigures_agg8.yaml │ │ │ ├── aime_2024_agg8.yaml │ │ │ ├── aime_2024_rebase.yaml │ │ │ ├── aime_figures.yaml │ │ │ ├── aime_nofigures.yaml │ │ │ └── utils.py │ │ ├── air_bench │ │ │ ├── _default_template_yaml │ │ │ ├── air_bench_chat.yaml │ │ │ ├── air_bench_chat_mixed.yaml │ │ │ ├── air_bench_chat_music.yaml │ │ │ ├── air_bench_chat_sound.yaml │ │ │ ├── air_bench_chat_speech.yaml │ │ │ ├── air_bench_foundation.yaml │ │ │ ├── air_bench_foundation_music.yaml │ │ │ ├── air_bench_foundation_sound.yaml │ │ │ ├── air_bench_foundation_speech.yaml │ │ │ └── utils.py │ │ ├── alpaca_audio │ │ │ ├── alpaca_audio.yaml │ │ │ └── utils.py │ │ ├── arc │ │ │ ├── README.md │ │ │ ├── arc_challenge.yaml │ │ │ └── arc_easy.yaml │ │ ├── av_odyssey │ │ │ ├── av_odyssey.yaml │ │ │ └── utils.py │ │ ├── camerabench_vqa │ │ │ ├── camerabench_vqa.yaml │ │ │ └── utils.py │ │ ├── capability │ │ │ ├── _default_template_yaml │ │ │ ├── capability.yaml │ │ │ ├── capability_OCR.yaml │ │ │ ├── capability_action.yaml │ │ │ ├── capability_camera_angle.yaml │ │ │ ├── capability_camera_movement.yaml │ │ │ ├── capability_character_identification.yaml │ │ │ ├── capability_dynamic_object_number.yaml │ │ │ ├── capability_event.yaml │ │ │ ├── capability_object_category.yaml │ │ │ ├── capability_object_color.yaml │ │ │ ├── capability_object_number.yaml │ │ │ ├── capability_scene.yaml │ │ │ ├── capability_spatial_relation.yaml │ │ │ ├── capability_style.yaml │ │ │ ├── prompt.py │ │ │ └── utils.py │ │ ├── charades_sta │ │ │ ├── charades.yaml │ │ │ ├── eval_tvg.py │ │ │ └── utils.py │ │ ├── chartqa │ │ │ ├── chartqa.yaml │ │ │ ├── chartqa_lite.yaml │ │ │ ├── upload_chartqa.py │ │ │ └── utils.py │ │ ├── cinepile │ │ │ ├── cinepile.yaml │ │ │ └── utils.py │ │ ├── clotho_aqa │ │ │ ├── _default_template_yaml │ │ │ ├── clotho_aqa.yaml │ │ │ ├── clotho_aqa_test.yaml │ │ │ ├── clotho_aqa_val.yaml │ │ │ ├── clotho_asqa_test_v2.yaml │ │ │ └── utils.py │ │ ├── cmmmu │ │ │ ├── _cmmmu.yaml │ │ │ ├── _default_template_cmmmu_yaml │ │ │ ├── cmmmu_test.yaml │ │ │ ├── cmmmu_val.yaml │ │ │ └── utils.py │ │ ├── coco_cap │ │ │ ├── coco2014_cap.yaml │ │ │ ├── coco2014_cap_test.yaml │ │ │ ├── coco2014_cap_val.yaml │ │ │ ├── coco2017_cap.yaml │ │ │ ├── coco2017_cap_test.yaml │ │ │ ├── coco2017_cap_val.yaml │ │ │ ├── coco2017_cap_val_lite.yaml │ │ │ ├── coco_cap.yaml │ │ │ ├── coco_karpathy.yaml │ │ │ ├── coco_karpathy_test.yaml │ │ │ ├── coco_karpathy_val.yaml │ │ │ └── utils.py │ │ ├── common_voice_15 │ │ │ ├── _default_template_yaml │ │ │ ├── common_voice_15.yaml │ │ │ ├── common_voice_15_en.yaml │ │ │ ├── common_voice_15_fr.yaml │ │ │ ├── common_voice_15_zh-CN.yaml │ │ │ └── utils.py │ │ ├── conbench │ │ │ ├── conbench.yaml │ │ │ └── utils.py │ │ ├── covost2 │ │ │ ├── _default_template_en_zh_yaml │ │ │ ├── _default_template_zh_en_yaml │ │ │ ├── covost2.yaml │ │ │ ├── covost2_en_zh.yaml │ │ │ ├── covost2_en_zh_dev.yaml │ │ │ ├── covost2_en_zh_test.yaml │ │ │ ├── covost2_zh_en.yaml │ │ │ ├── covost2_zh_en_dev.yaml │ │ │ ├── covost2_zh_en_test.yaml │ │ │ └── utils.py │ │ ├── cuva │ │ │ ├── _default_template_yaml │ │ │ ├── cuva.yaml │ │ │ ├── cuva_test.yaml │ │ │ └── utils.py │ │ ├── cvrr │ │ │ ├── _cvrr.yaml │ │ │ ├── _default_template_yaml │ │ │ ├── cvrr_fine_grained_action_understanding.yaml │ │ │ ├── cvrr_interpretation_of_social_context.yaml │ │ │ ├── cvrr_interpretation_of_visual_context.yaml │ │ │ ├── cvrr_multiple_actions_in_a_single_video.yaml │ │ │ ├── cvrr_non_existent_actions_with_existent_scene_depictions.yaml │ │ │ ├── cvrr_non_existent_actions_with_non_existent_scene_depictions.yaml │ │ │ ├── cvrr_object_instance_count.yaml │ │ │ ├── cvrr_partial_actions.yaml │ │ │ ├── cvrr_time_order_understanding.yaml │ │ │ ├── cvrr_understanding_emotional_context.yaml │ │ │ ├── cvrr_unusual_and_physically_anomalous_activities.yaml │ │ │ └── utils.py │ │ ├── detailcaps │ │ │ ├── _default_template_detailcaps_yaml │ │ │ ├── detailcaps.yaml │ │ │ └── utils.py │ │ ├── docvqa │ │ │ ├── _default_template_docvqa_yaml │ │ │ ├── docvqa.yaml │ │ │ ├── docvqa_test.yaml │ │ │ ├── docvqa_val.yaml │ │ │ ├── docvqa_val_lite.yaml │ │ │ └── utils.py │ │ ├── dtcbench │ │ │ ├── dtcbench.yaml │ │ │ └── utils.py │ │ ├── egoplan │ │ │ ├── egoplan.yaml │ │ │ └── utils.py │ │ ├── egoschema │ │ │ ├── README.md │ │ │ ├── _default_template_yaml │ │ │ ├── egoschema.yaml │ │ │ ├── egoschema_mcppl.yaml │ │ │ ├── egoschema_subset.yaml │ │ │ ├── egoschema_subset_mcppl.yaml │ │ │ └── utils.py │ │ ├── egothink │ │ │ ├── _default_template_yaml │ │ │ ├── egothink.yaml │ │ │ ├── egothink_activity.yaml │ │ │ ├── egothink_affordance.yaml │ │ │ ├── egothink_assistance.yaml │ │ │ ├── egothink_attribute.yaml │ │ │ ├── egothink_comparing.yaml │ │ │ ├── egothink_counting.yaml │ │ │ ├── egothink_existence.yaml │ │ │ ├── egothink_forecasting.yaml │ │ │ ├── egothink_location.yaml │ │ │ ├── egothink_navigation.yaml │ │ │ ├── egothink_situated.yaml │ │ │ ├── egothink_spatial.yaml │ │ │ └── utils.py │ │ ├── emma │ │ │ ├── emma_all.yaml │ │ │ ├── emma_mini_all.yaml │ │ │ └── utils.py │ │ ├── ferret │ │ │ ├── ferret.yaml │ │ │ ├── rule.json │ │ │ └── utils.py │ │ ├── fleurs │ │ │ ├── _default_template_yaml │ │ │ ├── fleurs.yaml │ │ │ ├── fleurs_cmn_hans_cn.yaml │ │ │ ├── fleurs_en.yaml │ │ │ ├── fleurs_yue_hant_hk.yaml │ │ │ └── utils.py │ │ ├── flickr30k │ │ │ ├── flickr30k.yaml │ │ │ ├── flickr30k_test.yaml │ │ │ ├── flickr30k_test_lite.yaml │ │ │ └── utils.py │ │ ├── funqa │ │ │ ├── _default_template_yaml │ │ │ ├── funqa.yaml │ │ │ ├── funqa_test.yaml │ │ │ └── utils.py │ │ ├── gigaspeech │ │ │ ├── gigaspeech.yaml │ │ │ ├── gigaspeech_dev.yaml │ │ │ ├── gigaspeech_l_dev.yaml │ │ │ ├── gigaspeech_l_test.yaml │ │ │ ├── gigaspeech_m_dev.yaml │ │ │ ├── gigaspeech_m_test.yaml │ │ │ ├── gigaspeech_s_dev.yaml │ │ │ ├── gigaspeech_s_test.yaml │ │ │ ├── gigaspeech_test.yaml │ │ │ ├── gigaspeech_xl_dev.yaml │ │ │ ├── gigaspeech_xl_test.yaml │ │ │ ├── gigaspeech_xs_dev.yaml │ │ │ ├── gigaspeech_xs_test.yaml │ │ │ ├── utils.py │ │ │ └── whisper_normalizer │ │ │ │ ├── basic.py │ │ │ │ ├── english.json │ │ │ │ └── english.py │ │ ├── gpqa │ │ │ ├── README.md │ │ │ ├── cot_n_shot │ │ │ │ ├── _generate_configs.py │ │ │ │ ├── _gpqa_cot_n_shot_yaml │ │ │ │ ├── gpqa_diamond_cot_n_shot.yaml │ │ │ │ ├── gpqa_extended_cot_n_shot.yaml │ │ │ │ ├── gpqa_main_cot_n_shot.yaml │ │ │ │ └── utils.py │ │ │ ├── cot_zeroshot │ │ │ │ ├── _generate_configs.py │ │ │ │ ├── _gpqa_cot_zeroshot_yaml │ │ │ │ ├── gpqa_diamond_cot_zeroshot.yaml │ │ │ │ ├── gpqa_extended_cot_zeroshot.yaml │ │ │ │ ├── gpqa_main_cot_zeroshot.yaml │ │ │ │ └── utils.py │ │ │ ├── generative │ │ │ │ ├── _generate_configs.py │ │ │ │ ├── _gpqa_generative_n_shot_yaml │ │ │ │ ├── gpqa_diamond_generative_n_shot.yaml │ │ │ │ ├── gpqa_extended_generative_n_shot.yaml │ │ │ │ ├── gpqa_main_generative_n_shot.yaml │ │ │ │ └── utils.py │ │ │ ├── n_shot │ │ │ │ ├── _generate_configs.py │ │ │ │ ├── _gpqa_n_shot_yaml │ │ │ │ ├── gpqa_diamond_n_shot.yaml │ │ │ │ ├── gpqa_extended_n_shot.yaml │ │ │ │ ├── gpqa_main_n_shot.yaml │ │ │ │ └── utils.py │ │ │ ├── openai │ │ │ │ ├── gpqa_diamond_openai.yaml │ │ │ │ ├── gpqa_diamond_openai_agg64.yaml │ │ │ │ ├── gpqa_diamond_openai_maj64_cov64.yaml │ │ │ │ └── utils.py │ │ │ └── zeroshot │ │ │ │ ├── _generate_configs.py │ │ │ │ ├── _gpqa_zeroshot_yaml │ │ │ │ ├── gpqa_diamond_zeroshot.yaml │ │ │ │ ├── gpqa_extended_zeroshot.yaml │ │ │ │ ├── gpqa_main_zeroshot.yaml │ │ │ │ └── utils.py │ │ ├── gqa │ │ │ ├── gqa.yaml │ │ │ ├── gqa_lite.yaml │ │ │ └── utils.py │ │ ├── gqa_ru │ │ │ ├── gqa_ru.yaml │ │ │ └── utils.py │ │ ├── gsm8k │ │ │ ├── README.md │ │ │ ├── gsm8k-cot-llama.yaml │ │ │ ├── gsm8k-cot-self-consistency.yaml │ │ │ ├── gsm8k-cot-zeroshot.yaml │ │ │ ├── gsm8k-cot.yaml │ │ │ └── gsm8k.yaml │ │ ├── hallusion_bench │ │ │ ├── evaluate_hb.py │ │ │ ├── hallusion_bench_image.yaml │ │ │ └── utils.py │ │ ├── hellaswag │ │ │ ├── README.md │ │ │ ├── hellaswag.yaml │ │ │ └── utils.py │ │ ├── hrbench │ │ │ ├── hrbench.yaml │ │ │ ├── hrbench4k.yaml │ │ │ ├── hrbench8k.yaml │ │ │ ├── hrbench_evals.py │ │ │ └── utils.py │ │ ├── iconqa │ │ │ ├── _default_template_docvqa_yaml │ │ │ ├── iconqa.yaml │ │ │ ├── iconqa_test.yaml │ │ │ ├── iconqa_val.yaml │ │ │ └── utils.py │ │ ├── ifeval │ │ │ ├── README.md │ │ │ ├── ifeval.yaml │ │ │ ├── instructions.py │ │ │ ├── instructions_registry.py │ │ │ ├── instructions_util.py │ │ │ └── utils.py │ │ ├── ii_bench │ │ │ ├── ii_bench.yaml │ │ │ └── utils.py │ │ ├── illusionvqa │ │ │ ├── illusionvqa.yaml │ │ │ ├── illusionvqa_comprehension.yaml │ │ │ ├── illusionvqa_soft_localization.yaml │ │ │ └── utils.py │ │ ├── infovqa │ │ │ ├── _default_template_infovqa_yaml │ │ │ ├── infovqa.yaml │ │ │ ├── infovqa_test.yaml │ │ │ ├── infovqa_val.yaml │ │ │ ├── infovqa_val_lite.yaml │ │ │ └── utils.py │ │ ├── internal_eval │ │ │ ├── _default_template_internal_eval_yaml │ │ │ ├── d170_cn.yaml │ │ │ ├── d170_cn_utils.py │ │ │ ├── d170_en.yaml │ │ │ ├── d170_en_utils.py │ │ │ ├── dc100_en.yaml │ │ │ ├── dc100_en_utils.py │ │ │ ├── dc200_cn.yaml │ │ │ ├── dc200_cn_utils.py │ │ │ ├── internal_eval.yaml │ │ │ └── utils.py │ │ ├── jmmmu │ │ │ ├── _default_template_yaml │ │ │ ├── jmmmu.yaml │ │ │ ├── jmmmu_accounting.yaml │ │ │ ├── jmmmu_agriculture.yaml │ │ │ ├── jmmmu_architecture_and_engineering.yaml │ │ │ ├── jmmmu_basic_medical_science.yaml │ │ │ ├── jmmmu_biology.yaml │ │ │ ├── jmmmu_chemistry.yaml │ │ │ ├── jmmmu_clinical_medicine.yaml │ │ │ ├── jmmmu_computer_science.yaml │ │ │ ├── jmmmu_design.yaml │ │ │ ├── jmmmu_diagnostics_and_laboratory_medicine.yaml │ │ │ ├── jmmmu_economics.yaml │ │ │ ├── jmmmu_electronics.yaml │ │ │ ├── jmmmu_energy_and_power.yaml │ │ │ ├── jmmmu_finance.yaml │ │ │ ├── jmmmu_japanese_art.yaml │ │ │ ├── jmmmu_japanese_heritage.yaml │ │ │ ├── jmmmu_japanese_history.yaml │ │ │ ├── jmmmu_manage.yaml │ │ │ ├── jmmmu_marketing.yaml │ │ │ ├── jmmmu_materials.yaml │ │ │ ├── jmmmu_math.yaml │ │ │ ├── jmmmu_mechanical_engineering.yaml │ │ │ ├── jmmmu_music.yaml │ │ │ ├── jmmmu_pharmacy.yaml │ │ │ ├── jmmmu_physics.yaml │ │ │ ├── jmmmu_psychology.yaml │ │ │ ├── jmmmu_public_health.yaml │ │ │ ├── jmmmu_world_history.yaml │ │ │ └── utils.py │ │ ├── k12 │ │ │ ├── k12.yaml │ │ │ └── utils.py │ │ ├── librispeech │ │ │ ├── _default_yaml_template │ │ │ ├── cn_tn.py │ │ │ ├── librispeech.yaml │ │ │ ├── librispeech_dev_clean.yaml │ │ │ ├── librispeech_dev_other.yaml │ │ │ ├── librispeech_long.yaml │ │ │ ├── librispeech_test_clean.yaml │ │ │ ├── librispeech_test_clean_long.yaml │ │ │ ├── librispeech_test_other.yaml │ │ │ ├── librispeech_test_other_long.yaml │ │ │ ├── utils.py │ │ │ └── whisper_normalizer │ │ │ │ ├── basic.py │ │ │ │ ├── english.json │ │ │ │ └── english.py │ │ ├── live_bench │ │ │ ├── live_bench.yaml │ │ │ ├── live_bench_2406.yaml │ │ │ ├── live_bench_2407.yaml │ │ │ ├── live_bench_2409.yaml │ │ │ ├── live_bench_template_yaml │ │ │ ├── live_bench_template_yaml_v2 │ │ │ ├── utils.py │ │ │ └── utils_v2.py │ │ ├── livexiv_tqa │ │ │ ├── livexiv_tqa.yaml │ │ │ ├── livexiv_tqa_template_yaml │ │ │ ├── livexiv_tqa_v1.yaml │ │ │ ├── livexiv_tqa_v2.yaml │ │ │ ├── livexiv_tqa_v3.yaml │ │ │ ├── livexiv_tqa_v4.yaml │ │ │ ├── livexiv_tqa_v5.yaml │ │ │ ├── livexiv_tqa_v6.yaml │ │ │ └── utils.py │ │ ├── livexiv_vqa │ │ │ ├── livexiv_vqa.yaml │ │ │ ├── livexiv_vqa_template_yaml │ │ │ ├── livexiv_vqa_v1.yaml │ │ │ ├── livexiv_vqa_v2.yaml │ │ │ ├── livexiv_vqa_v3.yaml │ │ │ ├── livexiv_vqa_v4.yaml │ │ │ ├── livexiv_vqa_v5.yaml │ │ │ ├── livexiv_vqa_v6.yaml │ │ │ └── utils.py │ │ ├── llava-bench-coco │ │ │ ├── llava-bench-coco.yaml │ │ │ ├── rule.json │ │ │ └── utils.py │ │ ├── llava-in-the-wild │ │ │ ├── llava-in-the-wild.yaml │ │ │ ├── llava-in-the-wild_ko.yaml │ │ │ ├── rule.json │ │ │ ├── rule_ko.json │ │ │ ├── utils.py │ │ │ └── utils_ko.py │ │ ├── llava_interleave_bench │ │ │ ├── _default_template_interleave_yaml │ │ │ ├── in_domain.yaml │ │ │ ├── interleave_bench.yaml │ │ │ ├── multi_view_in_domain.yaml │ │ │ ├── out_of_domain.yaml │ │ │ └── utils.py │ │ ├── llava_wilder │ │ │ ├── _default_template_wilder_yaml │ │ │ ├── llava_wilder_small.yaml │ │ │ └── utils.py │ │ ├── longtimescope │ │ │ ├── longtimescope.yaml │ │ │ └── utils.py │ │ ├── longvideobench │ │ │ ├── longvideobench_test_i.yaml │ │ │ ├── longvideobench_test_v.yaml │ │ │ ├── longvideobench_val_i.yaml │ │ │ ├── longvideobench_val_v.yaml │ │ │ └── utils.py │ │ ├── lsdbench │ │ │ ├── README.md │ │ │ ├── lsdbench.yaml │ │ │ └── utils.py │ │ ├── mathverse │ │ │ ├── mathverse.yaml │ │ │ ├── mathverse_evals.py │ │ │ ├── mathverse_testmini.yaml │ │ │ ├── mathverse_testmini_text.yaml │ │ │ ├── mathverse_testmini_text_dominant.yaml │ │ │ ├── mathverse_testmini_text_lite.yaml │ │ │ ├── mathverse_testmini_text_only.yaml │ │ │ ├── mathverse_testmini_vision.yaml │ │ │ ├── mathverse_testmini_vision_dominant.yaml │ │ │ ├── mathverse_testmini_vision_intensive.yaml │ │ │ ├── mathverse_testmini_vision_only.yaml │ │ │ └── utils.py │ │ ├── mathvision │ │ │ ├── eval_utils.py │ │ │ ├── mathvision_reason_test.yaml │ │ │ ├── mathvision_reason_testmini.yaml │ │ │ ├── mathvision_test.yaml │ │ │ ├── mathvision_testmini.yaml │ │ │ └── utils.py │ │ ├── mathvista │ │ │ ├── mathvista.yaml │ │ │ ├── mathvista_evals.py │ │ │ ├── mathvista_test.yaml │ │ │ ├── mathvista_testmini.yaml │ │ │ ├── mathvista_testmini_cot.yaml │ │ │ ├── mathvista_testmini_format.yaml │ │ │ ├── mathvista_testmini_solution.yaml │ │ │ └── utils.py │ │ ├── megabench │ │ │ ├── README.md │ │ │ ├── _default_template_yaml │ │ │ ├── breakdown │ │ │ │ ├── all_task_meta.json │ │ │ │ ├── analysis_utils.py │ │ │ │ └── derive_breakdown_results.py │ │ │ ├── evaluator.py │ │ │ ├── image_video_utils.py │ │ │ ├── megabench.yaml │ │ │ ├── megabench_core.yaml │ │ │ ├── megabench_core_si.yaml │ │ │ ├── megabench_open.yaml │ │ │ ├── megabench_open_si.yaml │ │ │ ├── metrics │ │ │ │ ├── README.md │ │ │ │ ├── __init__.py │ │ │ │ ├── aggregation │ │ │ │ │ ├── mean_agg.py │ │ │ │ │ ├── min_agg.py │ │ │ │ │ └── unsupported_agg.py │ │ │ │ ├── aggregation_type.py │ │ │ │ ├── metric_type.py │ │ │ │ ├── parsing │ │ │ │ │ ├── answer_str_parse.py │ │ │ │ │ ├── common │ │ │ │ │ │ ├── parsers.py │ │ │ │ │ │ └── utils.py │ │ │ │ │ ├── dummy_parse.py │ │ │ │ │ └── json_parse.py │ │ │ │ ├── response_parse_type.py │ │ │ │ └── scoring │ │ │ │ │ ├── ascii_art_vlm_judge.py │ │ │ │ │ ├── chess_jaccard.py │ │ │ │ │ ├── common │ │ │ │ │ ├── conversions.py │ │ │ │ │ ├── metrics.py │ │ │ │ │ └── transformations.py │ │ │ │ │ ├── constrained_generation.py │ │ │ │ │ ├── coordinate_sequence_match.py │ │ │ │ │ ├── dict_equality.py │ │ │ │ │ ├── dict_exact_match_agg_recall.py │ │ │ │ │ ├── dict_jaccard_agg_jaccard.py │ │ │ │ │ ├── dict_nbbox_iou_tuple_agg_jaccard.py │ │ │ │ │ ├── dict_set_equality_agg_jaccard.py │ │ │ │ │ ├── exact_str_match.py │ │ │ │ │ ├── exact_str_match_case_insensitive.py │ │ │ │ │ ├── general_numerical_match.py │ │ │ │ │ ├── geo_proximity.py │ │ │ │ │ ├── gleu.py │ │ │ │ │ ├── jaccard.py │ │ │ │ │ ├── latex_expr_equality.py │ │ │ │ │ ├── longest_common_list_prefix_ratio.py │ │ │ │ │ ├── mse.py │ │ │ │ │ ├── multi_ref_phrase.py │ │ │ │ │ ├── nbbox_iou.py │ │ │ │ │ ├── near_str_match.py │ │ │ │ │ ├── nli_entailment.py │ │ │ │ │ ├── normalized_similarity_damerau_levenshtein.py │ │ │ │ │ ├── number_rel_diff_ratio.py │ │ │ │ │ ├── positive_int_match.py │ │ │ │ │ ├── program_judge.py │ │ │ │ │ ├── sacrebleu_bleu.py │ │ │ │ │ ├── sequence_equality.py │ │ │ │ │ ├── set_equality.py │ │ │ │ │ ├── set_precision.py │ │ │ │ │ ├── simple_str_match.py │ │ │ │ │ ├── symbolic_planning.py │ │ │ │ │ ├── unsupported_scoring.py │ │ │ │ │ ├── vlm_as_judge.py │ │ │ │ │ ├── xml_nbbox_iou.py │ │ │ │ │ ├── xml_norm_point_distance.py │ │ │ │ │ └── xml_norm_point_in_bbox.py │ │ │ ├── requirements.txt │ │ │ └── utils.py │ │ ├── mia_bench │ │ │ ├── mia_bench.yaml │ │ │ └── utils.py │ │ ├── mirb │ │ │ ├── mirb.yaml │ │ │ └── utils.py │ │ ├── mix_evals │ │ │ ├── README.md │ │ │ ├── audio2text │ │ │ │ ├── _default_template_yaml │ │ │ │ ├── mix_evals_audio2_text_freeform.yaml │ │ │ │ ├── mix_evals_audio2_text_freeform_hard.yaml │ │ │ │ ├── mix_evals_audio2text.yaml │ │ │ │ ├── mix_evals_audio2text_hard.yaml │ │ │ │ └── utils.py │ │ │ ├── image2text │ │ │ │ ├── _default_template_yaml │ │ │ │ ├── mix_evals_image2text.yaml │ │ │ │ ├── mix_evals_image2text_freeform.yaml │ │ │ │ ├── mix_evals_image2text_freeform_hard.yaml │ │ │ │ ├── mix_evals_image2text_hard.yaml │ │ │ │ ├── mix_evals_image2text_mc.yaml │ │ │ │ ├── mix_evals_image2text_mc_hard.yaml │ │ │ │ └── utils.py │ │ │ └── video2text │ │ │ │ ├── _default_template_yaml │ │ │ │ ├── mix_evals_video2text.yaml │ │ │ │ ├── mix_evals_video2text_freeform.yaml │ │ │ │ ├── mix_evals_video2text_freeform_hard.yaml │ │ │ │ ├── mix_evals_video2text_hard.yaml │ │ │ │ ├── mix_evals_video2text_mc.yaml │ │ │ │ ├── mix_evals_video2text_mc_hard.yaml │ │ │ │ ├── mix_evals_video2text_openended.yaml │ │ │ │ └── utils.py │ │ ├── mlvu │ │ │ ├── mlvu_dev.yaml │ │ │ ├── mlvu_test.yaml │ │ │ └── utils.py │ │ ├── mmau │ │ │ ├── _default_template_yaml │ │ │ ├── mmau.yaml │ │ │ ├── mmau_test.yaml │ │ │ ├── mmau_test_mini.yaml │ │ │ └── utils.py │ │ ├── mmbench │ │ │ ├── _default_template_mmbench_cn_yaml │ │ │ ├── _default_template_mmbench_en_yaml │ │ │ ├── _default_template_mmbench_ko_yaml │ │ │ ├── _default_template_mmbench_ru_yaml │ │ │ ├── cc_utils.py │ │ │ ├── cn_utils.py │ │ │ ├── en_utils.py │ │ │ ├── ko_utils.py │ │ │ ├── mmbench.yaml │ │ │ ├── mmbench_cc.yaml │ │ │ ├── mmbench_cn.yaml │ │ │ ├── mmbench_cn_dev.yaml │ │ │ ├── mmbench_cn_dev_lite.yaml │ │ │ ├── mmbench_cn_test.yaml │ │ │ ├── mmbench_en.yaml │ │ │ ├── mmbench_en_dev.yaml │ │ │ ├── mmbench_en_dev_lite.yaml │ │ │ ├── mmbench_en_test.yaml │ │ │ ├── mmbench_evals.py │ │ │ ├── mmbench_ko_dev.yaml │ │ │ ├── mmbench_ru_dev.yaml │ │ │ └── ru_utils.py │ │ ├── mme │ │ │ ├── mme.yaml │ │ │ └── utils.py │ │ ├── mme_cot │ │ │ ├── README.md │ │ │ ├── mme_cot_direct.yaml │ │ │ ├── mme_cot_reason.yaml │ │ │ └── utils.py │ │ ├── mme_realworld │ │ │ ├── mme_realworld.yaml │ │ │ ├── mme_realworld_cn.yaml │ │ │ ├── mme_realworld_lite.yaml │ │ │ └── utils.py │ │ ├── mmlu │ │ │ ├── _generate_configs.py │ │ │ ├── continuation │ │ │ │ ├── _continuation_template_yaml │ │ │ │ ├── _mmlu.yaml │ │ │ │ ├── mmlu_abstract_algebra.yaml │ │ │ │ ├── mmlu_anatomy.yaml │ │ │ │ ├── mmlu_astronomy.yaml │ │ │ │ ├── mmlu_business_ethics.yaml │ │ │ │ ├── mmlu_clinical_knowledge.yaml │ │ │ │ ├── mmlu_college_biology.yaml │ │ │ │ ├── mmlu_college_chemistry.yaml │ │ │ │ ├── mmlu_college_computer_science.yaml │ │ │ │ ├── mmlu_college_mathematics.yaml │ │ │ │ ├── mmlu_college_medicine.yaml │ │ │ │ ├── mmlu_college_physics.yaml │ │ │ │ ├── mmlu_computer_security.yaml │ │ │ │ ├── mmlu_conceptual_physics.yaml │ │ │ │ ├── mmlu_econometrics.yaml │ │ │ │ ├── mmlu_electrical_engineering.yaml │ │ │ │ ├── mmlu_elementary_mathematics.yaml │ │ │ │ ├── mmlu_formal_logic.yaml │ │ │ │ ├── mmlu_global_facts.yaml │ │ │ │ ├── mmlu_high_school_biology.yaml │ │ │ │ ├── mmlu_high_school_chemistry.yaml │ │ │ │ ├── mmlu_high_school_computer_science.yaml │ │ │ │ ├── mmlu_high_school_european_history.yaml │ │ │ │ ├── mmlu_high_school_geography.yaml │ │ │ │ ├── mmlu_high_school_government_and_politics.yaml │ │ │ │ ├── mmlu_high_school_macroeconomics.yaml │ │ │ │ ├── mmlu_high_school_mathematics.yaml │ │ │ │ ├── mmlu_high_school_microeconomics.yaml │ │ │ │ ├── mmlu_high_school_physics.yaml │ │ │ │ ├── mmlu_high_school_psychology.yaml │ │ │ │ ├── mmlu_high_school_statistics.yaml │ │ │ │ ├── mmlu_high_school_us_history.yaml │ │ │ │ ├── mmlu_high_school_world_history.yaml │ │ │ │ ├── mmlu_human_aging.yaml │ │ │ │ ├── mmlu_human_sexuality.yaml │ │ │ │ ├── mmlu_international_law.yaml │ │ │ │ ├── mmlu_jurisprudence.yaml │ │ │ │ ├── mmlu_logical_fallacies.yaml │ │ │ │ ├── mmlu_machine_learning.yaml │ │ │ │ ├── mmlu_management.yaml │ │ │ │ ├── mmlu_marketing.yaml │ │ │ │ ├── mmlu_medical_genetics.yaml │ │ │ │ ├── mmlu_miscellaneous.yaml │ │ │ │ ├── mmlu_moral_disputes.yaml │ │ │ │ ├── mmlu_moral_scenarios.yaml │ │ │ │ ├── mmlu_nutrition.yaml │ │ │ │ ├── mmlu_philosophy.yaml │ │ │ │ ├── mmlu_prehistory.yaml │ │ │ │ ├── mmlu_professional_accounting.yaml │ │ │ │ ├── mmlu_professional_law.yaml │ │ │ │ ├── mmlu_professional_medicine.yaml │ │ │ │ ├── mmlu_professional_psychology.yaml │ │ │ │ ├── mmlu_public_relations.yaml │ │ │ │ ├── mmlu_security_studies.yaml │ │ │ │ ├── mmlu_sociology.yaml │ │ │ │ ├── mmlu_us_foreign_policy.yaml │ │ │ │ ├── mmlu_virology.yaml │ │ │ │ └── mmlu_world_religions.yaml │ │ │ ├── default │ │ │ │ ├── _default_template_yaml │ │ │ │ ├── _mmlu.yaml │ │ │ │ ├── _mmlu_humanities.yaml │ │ │ │ ├── _mmlu_other.yaml │ │ │ │ ├── _mmlu_social_sciences.yaml │ │ │ │ ├── _mmlu_stem.yaml │ │ │ │ ├── mmlu_abstract_algebra.yaml │ │ │ │ ├── mmlu_anatomy.yaml │ │ │ │ ├── mmlu_astronomy.yaml │ │ │ │ ├── mmlu_business_ethics.yaml │ │ │ │ ├── mmlu_clinical_knowledge.yaml │ │ │ │ ├── mmlu_college_biology.yaml │ │ │ │ ├── mmlu_college_chemistry.yaml │ │ │ │ ├── mmlu_college_computer_science.yaml │ │ │ │ ├── mmlu_college_mathematics.yaml │ │ │ │ ├── mmlu_college_medicine.yaml │ │ │ │ ├── mmlu_college_physics.yaml │ │ │ │ ├── mmlu_computer_security.yaml │ │ │ │ ├── mmlu_conceptual_physics.yaml │ │ │ │ ├── mmlu_econometrics.yaml │ │ │ │ ├── mmlu_electrical_engineering.yaml │ │ │ │ ├── mmlu_elementary_mathematics.yaml │ │ │ │ ├── mmlu_formal_logic.yaml │ │ │ │ ├── mmlu_global_facts.yaml │ │ │ │ ├── mmlu_high_school_biology.yaml │ │ │ │ ├── mmlu_high_school_chemistry.yaml │ │ │ │ ├── mmlu_high_school_computer_science.yaml │ │ │ │ ├── mmlu_high_school_european_history.yaml │ │ │ │ ├── mmlu_high_school_geography.yaml │ │ │ │ ├── mmlu_high_school_government_and_politics.yaml │ │ │ │ ├── mmlu_high_school_macroeconomics.yaml │ │ │ │ ├── mmlu_high_school_mathematics.yaml │ │ │ │ ├── mmlu_high_school_microeconomics.yaml │ │ │ │ ├── mmlu_high_school_physics.yaml │ │ │ │ ├── mmlu_high_school_psychology.yaml │ │ │ │ ├── mmlu_high_school_statistics.yaml │ │ │ │ ├── mmlu_high_school_us_history.yaml │ │ │ │ ├── mmlu_high_school_world_history.yaml │ │ │ │ ├── mmlu_human_aging.yaml │ │ │ │ ├── mmlu_human_sexuality.yaml │ │ │ │ ├── mmlu_international_law.yaml │ │ │ │ ├── mmlu_jurisprudence.yaml │ │ │ │ ├── mmlu_logical_fallacies.yaml │ │ │ │ ├── mmlu_machine_learning.yaml │ │ │ │ ├── mmlu_management.yaml │ │ │ │ ├── mmlu_marketing.yaml │ │ │ │ ├── mmlu_medical_genetics.yaml │ │ │ │ ├── mmlu_miscellaneous.yaml │ │ │ │ ├── mmlu_moral_disputes.yaml │ │ │ │ ├── mmlu_moral_scenarios.yaml │ │ │ │ ├── mmlu_nutrition.yaml │ │ │ │ ├── mmlu_philosophy.yaml │ │ │ │ ├── mmlu_prehistory.yaml │ │ │ │ ├── mmlu_professional_accounting.yaml │ │ │ │ ├── mmlu_professional_law.yaml │ │ │ │ ├── mmlu_professional_medicine.yaml │ │ │ │ ├── mmlu_professional_psychology.yaml │ │ │ │ ├── mmlu_public_relations.yaml │ │ │ │ ├── mmlu_security_studies.yaml │ │ │ │ ├── mmlu_sociology.yaml │ │ │ │ ├── mmlu_us_foreign_policy.yaml │ │ │ │ ├── mmlu_virology.yaml │ │ │ │ └── mmlu_world_religions.yaml │ │ │ ├── flan_cot_fewshot │ │ │ │ ├── _cot_prompts.json │ │ │ │ ├── _mmlu.yaml │ │ │ │ ├── _mmlu_flan_cot_fewshot_template_yaml │ │ │ │ ├── mmlu_abstract_algebra.yaml │ │ │ │ ├── mmlu_anatomy.yaml │ │ │ │ ├── mmlu_astronomy.yaml │ │ │ │ ├── mmlu_business_ethics.yaml │ │ │ │ ├── mmlu_clinical_knowledge.yaml │ │ │ │ ├── mmlu_college_biology.yaml │ │ │ │ ├── mmlu_college_chemistry.yaml │ │ │ │ ├── mmlu_college_computer_science.yaml │ │ │ │ ├── mmlu_college_mathematics.yaml │ │ │ │ ├── mmlu_college_medicine.yaml │ │ │ │ ├── mmlu_college_physics.yaml │ │ │ │ ├── mmlu_computer_security.yaml │ │ │ │ ├── mmlu_conceptual_physics.yaml │ │ │ │ ├── mmlu_econometrics.yaml │ │ │ │ ├── mmlu_electrical_engineering.yaml │ │ │ │ ├── mmlu_elementary_mathematics.yaml │ │ │ │ ├── mmlu_formal_logic.yaml │ │ │ │ ├── mmlu_global_facts.yaml │ │ │ │ ├── mmlu_high_school_biology.yaml │ │ │ │ ├── mmlu_high_school_chemistry.yaml │ │ │ │ ├── mmlu_high_school_computer_science.yaml │ │ │ │ ├── mmlu_high_school_european_history.yaml │ │ │ │ ├── mmlu_high_school_geography.yaml │ │ │ │ ├── mmlu_high_school_government_and_politics.yaml │ │ │ │ ├── mmlu_high_school_macroeconomics.yaml │ │ │ │ ├── mmlu_high_school_mathematics.yaml │ │ │ │ ├── mmlu_high_school_microeconomics.yaml │ │ │ │ ├── mmlu_high_school_physics.yaml │ │ │ │ ├── mmlu_high_school_psychology.yaml │ │ │ │ ├── mmlu_high_school_statistics.yaml │ │ │ │ ├── mmlu_high_school_us_history.yaml │ │ │ │ ├── mmlu_high_school_world_history.yaml │ │ │ │ ├── mmlu_human_aging.yaml │ │ │ │ ├── mmlu_human_sexuality.yaml │ │ │ │ ├── mmlu_international_law.yaml │ │ │ │ ├── mmlu_jurisprudence.yaml │ │ │ │ ├── mmlu_logical_fallacies.yaml │ │ │ │ ├── mmlu_machine_learning.yaml │ │ │ │ ├── mmlu_management.yaml │ │ │ │ ├── mmlu_marketing.yaml │ │ │ │ ├── mmlu_medical_genetics.yaml │ │ │ │ ├── mmlu_miscellaneous.yaml │ │ │ │ ├── mmlu_moral_disputes.yaml │ │ │ │ ├── mmlu_moral_scenarios.yaml │ │ │ │ ├── mmlu_nutrition.yaml │ │ │ │ ├── mmlu_philosophy.yaml │ │ │ │ ├── mmlu_prehistory.yaml │ │ │ │ ├── mmlu_professional_accounting.yaml │ │ │ │ ├── mmlu_professional_law.yaml │ │ │ │ ├── mmlu_professional_medicine.yaml │ │ │ │ ├── mmlu_professional_psychology.yaml │ │ │ │ ├── mmlu_public_relations.yaml │ │ │ │ ├── mmlu_security_studies.yaml │ │ │ │ ├── mmlu_sociology.yaml │ │ │ │ ├── mmlu_us_foreign_policy.yaml │ │ │ │ ├── mmlu_virology.yaml │ │ │ │ └── mmlu_world_religions.yaml │ │ │ ├── flan_cot_zeroshot │ │ │ │ ├── _mmlu.yaml │ │ │ │ ├── _mmlu_flan_cot_zeroshot_template_yaml │ │ │ │ ├── mmlu_abstract_algebra.yaml │ │ │ │ ├── mmlu_anatomy.yaml │ │ │ │ ├── mmlu_astronomy.yaml │ │ │ │ ├── mmlu_business_ethics.yaml │ │ │ │ ├── mmlu_clinical_knowledge.yaml │ │ │ │ ├── mmlu_college_biology.yaml │ │ │ │ ├── mmlu_college_chemistry.yaml │ │ │ │ ├── mmlu_college_computer_science.yaml │ │ │ │ ├── mmlu_college_mathematics.yaml │ │ │ │ ├── mmlu_college_medicine.yaml │ │ │ │ ├── mmlu_college_physics.yaml │ │ │ │ ├── mmlu_computer_security.yaml │ │ │ │ ├── mmlu_conceptual_physics.yaml │ │ │ │ ├── mmlu_econometrics.yaml │ │ │ │ ├── mmlu_electrical_engineering.yaml │ │ │ │ ├── mmlu_elementary_mathematics.yaml │ │ │ │ ├── mmlu_formal_logic.yaml │ │ │ │ ├── mmlu_global_facts.yaml │ │ │ │ ├── mmlu_high_school_biology.yaml │ │ │ │ ├── mmlu_high_school_chemistry.yaml │ │ │ │ ├── mmlu_high_school_computer_science.yaml │ │ │ │ ├── mmlu_high_school_european_history.yaml │ │ │ │ ├── mmlu_high_school_geography.yaml │ │ │ │ ├── mmlu_high_school_government_and_politics.yaml │ │ │ │ ├── mmlu_high_school_macroeconomics.yaml │ │ │ │ ├── mmlu_high_school_mathematics.yaml │ │ │ │ ├── mmlu_high_school_microeconomics.yaml │ │ │ │ ├── mmlu_high_school_physics.yaml │ │ │ │ ├── mmlu_high_school_psychology.yaml │ │ │ │ ├── mmlu_high_school_statistics.yaml │ │ │ │ ├── mmlu_high_school_us_history.yaml │ │ │ │ ├── mmlu_high_school_world_history.yaml │ │ │ │ ├── mmlu_human_aging.yaml │ │ │ │ ├── mmlu_human_sexuality.yaml │ │ │ │ ├── mmlu_international_law.yaml │ │ │ │ ├── mmlu_jurisprudence.yaml │ │ │ │ ├── mmlu_logical_fallacies.yaml │ │ │ │ ├── mmlu_machine_learning.yaml │ │ │ │ ├── mmlu_management.yaml │ │ │ │ ├── mmlu_marketing.yaml │ │ │ │ ├── mmlu_medical_genetics.yaml │ │ │ │ ├── mmlu_miscellaneous.yaml │ │ │ │ ├── mmlu_moral_disputes.yaml │ │ │ │ ├── mmlu_moral_scenarios.yaml │ │ │ │ ├── mmlu_nutrition.yaml │ │ │ │ ├── mmlu_philosophy.yaml │ │ │ │ ├── mmlu_prehistory.yaml │ │ │ │ ├── mmlu_professional_accounting.yaml │ │ │ │ ├── mmlu_professional_law.yaml │ │ │ │ ├── mmlu_professional_medicine.yaml │ │ │ │ ├── mmlu_professional_psychology.yaml │ │ │ │ ├── mmlu_public_relations.yaml │ │ │ │ ├── mmlu_security_studies.yaml │ │ │ │ ├── mmlu_sociology.yaml │ │ │ │ ├── mmlu_us_foreign_policy.yaml │ │ │ │ ├── mmlu_virology.yaml │ │ │ │ ├── mmlu_world_religions.yaml │ │ │ │ └── utils.py │ │ │ ├── flan_n_shot │ │ │ │ ├── generative │ │ │ │ │ ├── _mmlu.yaml │ │ │ │ │ ├── _mmlu_flan_generative_template_yaml │ │ │ │ │ ├── mmlu_abstract_algebra.yaml │ │ │ │ │ ├── mmlu_anatomy.yaml │ │ │ │ │ ├── mmlu_astronomy.yaml │ │ │ │ │ ├── mmlu_business_ethics.yaml │ │ │ │ │ ├── mmlu_clinical_knowledge.yaml │ │ │ │ │ ├── mmlu_college_biology.yaml │ │ │ │ │ ├── mmlu_college_chemistry.yaml │ │ │ │ │ ├── mmlu_college_computer_science.yaml │ │ │ │ │ ├── mmlu_college_mathematics.yaml │ │ │ │ │ ├── mmlu_college_medicine.yaml │ │ │ │ │ ├── mmlu_college_physics.yaml │ │ │ │ │ ├── mmlu_computer_security.yaml │ │ │ │ │ ├── mmlu_conceptual_physics.yaml │ │ │ │ │ ├── mmlu_econometrics.yaml │ │ │ │ │ ├── mmlu_electrical_engineering.yaml │ │ │ │ │ ├── mmlu_elementary_mathematics.yaml │ │ │ │ │ ├── mmlu_formal_logic.yaml │ │ │ │ │ ├── mmlu_global_facts.yaml │ │ │ │ │ ├── mmlu_high_school_biology.yaml │ │ │ │ │ ├── mmlu_high_school_chemistry.yaml │ │ │ │ │ ├── mmlu_high_school_computer_science.yaml │ │ │ │ │ ├── mmlu_high_school_european_history.yaml │ │ │ │ │ ├── mmlu_high_school_geography.yaml │ │ │ │ │ ├── mmlu_high_school_government_and_politics.yaml │ │ │ │ │ ├── mmlu_high_school_macroeconomics.yaml │ │ │ │ │ ├── mmlu_high_school_mathematics.yaml │ │ │ │ │ ├── mmlu_high_school_microeconomics.yaml │ │ │ │ │ ├── mmlu_high_school_physics.yaml │ │ │ │ │ ├── mmlu_high_school_psychology.yaml │ │ │ │ │ ├── mmlu_high_school_statistics.yaml │ │ │ │ │ ├── mmlu_high_school_us_history.yaml │ │ │ │ │ ├── mmlu_high_school_world_history.yaml │ │ │ │ │ ├── mmlu_human_aging.yaml │ │ │ │ │ ├── mmlu_human_sexuality.yaml │ │ │ │ │ ├── mmlu_international_law.yaml │ │ │ │ │ ├── mmlu_jurisprudence.yaml │ │ │ │ │ ├── mmlu_logical_fallacies.yaml │ │ │ │ │ ├── mmlu_machine_learning.yaml │ │ │ │ │ ├── mmlu_management.yaml │ │ │ │ │ ├── mmlu_marketing.yaml │ │ │ │ │ ├── mmlu_medical_genetics.yaml │ │ │ │ │ ├── mmlu_miscellaneous.yaml │ │ │ │ │ ├── mmlu_moral_disputes.yaml │ │ │ │ │ ├── mmlu_moral_scenarios.yaml │ │ │ │ │ ├── mmlu_nutrition.yaml │ │ │ │ │ ├── mmlu_philosophy.yaml │ │ │ │ │ ├── mmlu_prehistory.yaml │ │ │ │ │ ├── mmlu_professional_accounting.yaml │ │ │ │ │ ├── mmlu_professional_law.yaml │ │ │ │ │ ├── mmlu_professional_medicine.yaml │ │ │ │ │ ├── mmlu_professional_psychology.yaml │ │ │ │ │ ├── mmlu_public_relations.yaml │ │ │ │ │ ├── mmlu_security_studies.yaml │ │ │ │ │ ├── mmlu_sociology.yaml │ │ │ │ │ ├── mmlu_us_foreign_policy.yaml │ │ │ │ │ ├── mmlu_virology.yaml │ │ │ │ │ ├── mmlu_world_religions.yaml │ │ │ │ │ └── utils.py │ │ │ │ └── loglikelihood │ │ │ │ │ ├── _mmlu.yaml │ │ │ │ │ ├── _mmlu_flan_loglikelihood_template_yaml │ │ │ │ │ ├── mmlu_abstract_algebra.yaml │ │ │ │ │ ├── mmlu_anatomy.yaml │ │ │ │ │ ├── mmlu_astronomy.yaml │ │ │ │ │ ├── mmlu_business_ethics.yaml │ │ │ │ │ ├── mmlu_clinical_knowledge.yaml │ │ │ │ │ ├── mmlu_college_biology.yaml │ │ │ │ │ ├── mmlu_college_chemistry.yaml │ │ │ │ │ ├── mmlu_college_computer_science.yaml │ │ │ │ │ ├── mmlu_college_mathematics.yaml │ │ │ │ │ ├── mmlu_college_medicine.yaml │ │ │ │ │ ├── mmlu_college_physics.yaml │ │ │ │ │ ├── mmlu_computer_security.yaml │ │ │ │ │ ├── mmlu_conceptual_physics.yaml │ │ │ │ │ ├── mmlu_econometrics.yaml │ │ │ │ │ ├── mmlu_electrical_engineering.yaml │ │ │ │ │ ├── mmlu_elementary_mathematics.yaml │ │ │ │ │ ├── mmlu_formal_logic.yaml │ │ │ │ │ ├── mmlu_global_facts.yaml │ │ │ │ │ ├── mmlu_high_school_biology.yaml │ │ │ │ │ ├── mmlu_high_school_chemistry.yaml │ │ │ │ │ ├── mmlu_high_school_computer_science.yaml │ │ │ │ │ ├── mmlu_high_school_european_history.yaml │ │ │ │ │ ├── mmlu_high_school_geography.yaml │ │ │ │ │ ├── mmlu_high_school_government_and_politics.yaml │ │ │ │ │ ├── mmlu_high_school_macroeconomics.yaml │ │ │ │ │ ├── mmlu_high_school_mathematics.yaml │ │ │ │ │ ├── mmlu_high_school_microeconomics.yaml │ │ │ │ │ ├── mmlu_high_school_physics.yaml │ │ │ │ │ ├── mmlu_high_school_psychology.yaml │ │ │ │ │ ├── mmlu_high_school_statistics.yaml │ │ │ │ │ ├── mmlu_high_school_us_history.yaml │ │ │ │ │ ├── mmlu_high_school_world_history.yaml │ │ │ │ │ ├── mmlu_human_aging.yaml │ │ │ │ │ ├── mmlu_human_sexuality.yaml │ │ │ │ │ ├── mmlu_international_law.yaml │ │ │ │ │ ├── mmlu_jurisprudence.yaml │ │ │ │ │ ├── mmlu_logical_fallacies.yaml │ │ │ │ │ ├── mmlu_machine_learning.yaml │ │ │ │ │ ├── mmlu_management.yaml │ │ │ │ │ ├── mmlu_marketing.yaml │ │ │ │ │ ├── mmlu_medical_genetics.yaml │ │ │ │ │ ├── mmlu_miscellaneous.yaml │ │ │ │ │ ├── mmlu_moral_disputes.yaml │ │ │ │ │ ├── mmlu_moral_scenarios.yaml │ │ │ │ │ ├── mmlu_nutrition.yaml │ │ │ │ │ ├── mmlu_philosophy.yaml │ │ │ │ │ ├── mmlu_prehistory.yaml │ │ │ │ │ ├── mmlu_professional_accounting.yaml │ │ │ │ │ ├── mmlu_professional_law.yaml │ │ │ │ │ ├── mmlu_professional_medicine.yaml │ │ │ │ │ ├── mmlu_professional_psychology.yaml │ │ │ │ │ ├── mmlu_public_relations.yaml │ │ │ │ │ ├── mmlu_security_studies.yaml │ │ │ │ │ ├── mmlu_sociology.yaml │ │ │ │ │ ├── mmlu_us_foreign_policy.yaml │ │ │ │ │ ├── mmlu_virology.yaml │ │ │ │ │ └── mmlu_world_religions.yaml │ │ │ └── generative │ │ │ │ ├── _default_template_yaml │ │ │ │ ├── _mmlu.yaml │ │ │ │ ├── mmlu_abstract_algebra.yaml │ │ │ │ ├── mmlu_anatomy.yaml │ │ │ │ ├── mmlu_astronomy.yaml │ │ │ │ ├── mmlu_business_ethics.yaml │ │ │ │ ├── mmlu_clinical_knowledge.yaml │ │ │ │ ├── mmlu_college_biology.yaml │ │ │ │ ├── mmlu_college_chemistry.yaml │ │ │ │ ├── mmlu_college_computer_science.yaml │ │ │ │ ├── mmlu_college_mathematics.yaml │ │ │ │ ├── mmlu_college_medicine.yaml │ │ │ │ ├── mmlu_college_physics.yaml │ │ │ │ ├── mmlu_computer_security.yaml │ │ │ │ ├── mmlu_conceptual_physics.yaml │ │ │ │ ├── mmlu_econometrics.yaml │ │ │ │ ├── mmlu_electrical_engineering.yaml │ │ │ │ ├── mmlu_elementary_mathematics.yaml │ │ │ │ ├── mmlu_formal_logic.yaml │ │ │ │ ├── mmlu_global_facts.yaml │ │ │ │ ├── mmlu_high_school_biology.yaml │ │ │ │ ├── mmlu_high_school_chemistry.yaml │ │ │ │ ├── mmlu_high_school_computer_science.yaml │ │ │ │ ├── mmlu_high_school_european_history.yaml │ │ │ │ ├── mmlu_high_school_geography.yaml │ │ │ │ ├── mmlu_high_school_government_and_politics.yaml │ │ │ │ ├── mmlu_high_school_macroeconomics.yaml │ │ │ │ ├── mmlu_high_school_mathematics.yaml │ │ │ │ ├── mmlu_high_school_microeconomics.yaml │ │ │ │ ├── mmlu_high_school_physics.yaml │ │ │ │ ├── mmlu_high_school_psychology.yaml │ │ │ │ ├── mmlu_high_school_statistics.yaml │ │ │ │ ├── mmlu_high_school_us_history.yaml │ │ │ │ ├── mmlu_high_school_world_history.yaml │ │ │ │ ├── mmlu_human_aging.yaml │ │ │ │ ├── mmlu_human_sexuality.yaml │ │ │ │ ├── mmlu_international_law.yaml │ │ │ │ ├── mmlu_jurisprudence.yaml │ │ │ │ ├── mmlu_logical_fallacies.yaml │ │ │ │ ├── mmlu_machine_learning.yaml │ │ │ │ ├── mmlu_management.yaml │ │ │ │ ├── mmlu_marketing.yaml │ │ │ │ ├── mmlu_medical_genetics.yaml │ │ │ │ ├── mmlu_miscellaneous.yaml │ │ │ │ ├── mmlu_moral_disputes.yaml │ │ │ │ ├── mmlu_moral_scenarios.yaml │ │ │ │ ├── mmlu_nutrition.yaml │ │ │ │ ├── mmlu_philosophy.yaml │ │ │ │ ├── mmlu_prehistory.yaml │ │ │ │ ├── mmlu_professional_accounting.yaml │ │ │ │ ├── mmlu_professional_law.yaml │ │ │ │ ├── mmlu_professional_medicine.yaml │ │ │ │ ├── mmlu_professional_psychology.yaml │ │ │ │ ├── mmlu_public_relations.yaml │ │ │ │ ├── mmlu_security_studies.yaml │ │ │ │ ├── mmlu_sociology.yaml │ │ │ │ ├── mmlu_us_foreign_policy.yaml │ │ │ │ ├── mmlu_virology.yaml │ │ │ │ └── mmlu_world_religions.yaml │ │ ├── mmlu_pro │ │ │ ├── README.md │ │ │ ├── _default_template_yaml │ │ │ ├── _mmlu_pro.yaml │ │ │ ├── mmlu_pro_biology.yaml │ │ │ ├── mmlu_pro_business.yaml │ │ │ ├── mmlu_pro_chemistry.yaml │ │ │ ├── mmlu_pro_computer_science.yaml │ │ │ ├── mmlu_pro_economics.yaml │ │ │ ├── mmlu_pro_engineering.yaml │ │ │ ├── mmlu_pro_health.yaml │ │ │ ├── mmlu_pro_history.yaml │ │ │ ├── mmlu_pro_law.yaml │ │ │ ├── mmlu_pro_math.yaml │ │ │ ├── mmlu_pro_other.yaml │ │ │ ├── mmlu_pro_philosophy.yaml │ │ │ ├── mmlu_pro_physics.yaml │ │ │ ├── mmlu_pro_psychology.yaml │ │ │ └── utils.py │ │ ├── mmmu │ │ │ ├── _default_template_yaml │ │ │ ├── arial.ttf │ │ │ ├── mmmu.yaml │ │ │ ├── mmmu_group_img.yaml │ │ │ ├── mmmu_group_img_test.yaml │ │ │ ├── mmmu_group_img_val.yaml │ │ │ ├── mmmu_test.yaml │ │ │ ├── mmmu_val.yaml │ │ │ ├── mmmu_val_pass64.yaml │ │ │ ├── mmmu_val_reasoning.yaml │ │ │ ├── utils.py │ │ │ └── utils_group_img.py │ │ ├── mmmu_pro │ │ │ ├── _default_template_yaml │ │ │ ├── mmmu_pro.yaml │ │ │ ├── mmmu_pro_composite.yaml │ │ │ ├── mmmu_pro_composite_cot.yaml │ │ │ ├── mmmu_pro_cot.yaml │ │ │ ├── mmmu_pro_standard.yaml │ │ │ ├── mmmu_pro_standard_cot.yaml │ │ │ ├── mmmu_pro_vision.yaml │ │ │ ├── mmmu_pro_vision_cot.yaml │ │ │ └── utils.py │ │ ├── mmrefine │ │ │ ├── mmrefine.yaml │ │ │ ├── mmrefine_evals.py │ │ │ ├── prompts.py │ │ │ └── utils.py │ │ ├── mmsearch │ │ │ ├── constants.py │ │ │ ├── get_final_scores.py │ │ │ ├── lmms_eval_utils.py │ │ │ ├── mmsearch.yaml │ │ │ ├── mmsearch_end2end.yaml │ │ │ ├── mmsearch_rerank.yaml │ │ │ ├── mmsearch_summarization.yaml │ │ │ ├── prompts │ │ │ │ ├── prompt.py │ │ │ │ └── prompt_w_imagesearch.py │ │ │ ├── retrieve_content │ │ │ │ ├── retriever.py │ │ │ │ └── tokenization │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── tokenizers.py │ │ │ │ │ └── utils.py │ │ │ ├── score │ │ │ │ ├── f1_score.py │ │ │ │ ├── req_score.py │ │ │ │ └── result_summary.py │ │ │ └── utils │ │ │ │ ├── image_utils.py │ │ │ │ ├── lmms_eval_utils.py │ │ │ │ ├── prompt_utils.py │ │ │ │ ├── utils.py │ │ │ │ └── web_content_utils.py │ │ ├── mmsi_bench │ │ │ ├── msr_bench.yaml │ │ │ └── utils.py │ │ ├── mmstar │ │ │ ├── ko_utils.py │ │ │ ├── mmstar.yaml │ │ │ ├── mmstar_ko.yaml │ │ │ └── utils.py │ │ ├── mmt │ │ │ ├── _default_template_yaml │ │ │ ├── mmt.yaml │ │ │ ├── mmt_mi.yaml │ │ │ ├── mmt_mi_test.yaml │ │ │ ├── mmt_mi_val.yaml │ │ │ ├── mmt_test.yaml │ │ │ ├── mmt_val.yaml │ │ │ └── utils.py │ │ ├── mmupd │ │ │ ├── _default_template_mmupd_yaml │ │ │ ├── mmaad_base.yaml │ │ │ ├── mmaad_instruction.yaml │ │ │ ├── mmaad_option.yaml │ │ │ ├── mmiasd_base.yaml │ │ │ ├── mmiasd_instruction.yaml │ │ │ ├── mmiasd_option.yaml │ │ │ ├── mmivqd_base.yaml │ │ │ ├── mmivqd_instruction.yaml │ │ │ ├── mmivqd_option.yaml │ │ │ ├── mmupd.yaml │ │ │ ├── mmupd_base.yaml │ │ │ ├── mmupd_evals.py │ │ │ ├── mmupd_instruction.yaml │ │ │ ├── mmupd_option.yaml │ │ │ └── utils.py │ │ ├── mmvet │ │ │ ├── mmvet.yaml │ │ │ └── utils.py │ │ ├── mmvetv2 │ │ │ ├── mmvetv2.yaml │ │ │ ├── mmvetv2_group_img.yaml │ │ │ └── utils.py │ │ ├── mmvu │ │ │ ├── mmvu_val.yaml │ │ │ ├── mmvu_val_cot copy.yaml │ │ │ └── utils.py │ │ ├── mmworld │ │ │ ├── mmworld.yaml │ │ │ └── utils.py │ │ ├── moviechat │ │ │ ├── README.md │ │ │ ├── _default_template_yaml │ │ │ ├── moviechat_breakpoint.yaml │ │ │ ├── moviechat_global.yaml │ │ │ └── utils.py │ │ ├── muchomusic │ │ │ ├── muchomusic.yaml │ │ │ └── utils.py │ │ ├── muirbench │ │ │ ├── muirbench.yaml │ │ │ └── utils.py │ │ ├── multidocvqa │ │ │ ├── multidocvqa.yaml │ │ │ ├── multidocvqa_test.yaml │ │ │ ├── multidocvqa_val.yaml │ │ │ └── utils.py │ │ ├── multilingual-llava-bench-in-the-wild │ │ │ ├── README.md │ │ │ ├── _default_template_yaml │ │ │ ├── arabic_llava_in_the_wild.yaml │ │ │ ├── bengali_llava_in_the_wild.yaml │ │ │ ├── chinese_llava_in_the_wild.yaml │ │ │ ├── french_llava_in_the_wild.yaml │ │ │ ├── hindi_llava_in_the_wild.yaml │ │ │ ├── japanese_llava_in_the_wild.yaml │ │ │ ├── rule.json │ │ │ ├── russian_llava_in_the_wild.yaml │ │ │ ├── spanish_llava_in_the_wild.yaml │ │ │ ├── urdu_llava_in_the_wild.yaml │ │ │ └── utils.py │ │ ├── multimodal_rewardbench │ │ │ ├── multimodal_rewardbench.yaml │ │ │ └── utils.py │ │ ├── mvbench │ │ │ ├── _default_template_yaml │ │ │ ├── mvbench.yaml │ │ │ ├── mvbench_action_antonym.yaml │ │ │ ├── mvbench_action_count.yaml │ │ │ ├── mvbench_action_localization.yaml │ │ │ ├── mvbench_action_prediction.yaml │ │ │ ├── mvbench_action_sequence.yaml │ │ │ ├── mvbench_character_order.yaml │ │ │ ├── mvbench_counterfactual_inference.yaml │ │ │ ├── mvbench_egocentric_navigation.yaml │ │ │ ├── mvbench_episodic_reasoning.yaml │ │ │ ├── mvbench_fine_grained_action.yaml │ │ │ ├── mvbench_fine_grained_pose.yaml │ │ │ ├── mvbench_moving_attribute.yaml │ │ │ ├── mvbench_moving_count.yaml │ │ │ ├── mvbench_moving_direction.yaml │ │ │ ├── mvbench_object_existence.yaml │ │ │ ├── mvbench_object_interaction.yaml │ │ │ ├── mvbench_object_shuffle.yaml │ │ │ ├── mvbench_scene_transition.yaml │ │ │ ├── mvbench_state_change.yaml │ │ │ ├── mvbench_unexpected_action.yaml │ │ │ └── utils.py │ │ ├── naturalbench │ │ │ ├── naturalbench.yaml │ │ │ └── utils.py │ │ ├── nextqa │ │ │ ├── _default_template_yaml │ │ │ ├── nextqa.yaml │ │ │ ├── nextqa_mc_test.yaml │ │ │ ├── nextqa_oe_test.yaml │ │ │ ├── nextqa_oe_val.yaml │ │ │ ├── stopwords.csv │ │ │ └── utils.py │ │ ├── nocaps │ │ │ ├── _default_template_nocaps_yaml │ │ │ ├── nocaps.yaml │ │ │ ├── nocaps_test.yaml │ │ │ ├── nocaps_val.yaml │ │ │ ├── nocaps_val_lite.yaml │ │ │ └── utils.py │ │ ├── ocrbench │ │ │ ├── ocrbench.yaml │ │ │ ├── upload_ocrbench.py │ │ │ └── utils.py │ │ ├── ocrbench_v2 │ │ │ ├── IoUscore_metric.py │ │ │ ├── TEDS_metric.py │ │ │ ├── __init__.py │ │ │ ├── ocrbench_v2.yaml │ │ │ ├── page_ocr_metric.py │ │ │ ├── parallel.py │ │ │ ├── spotting_eval │ │ │ │ ├── __init__.py │ │ │ │ ├── readme.txt │ │ │ │ ├── rrc_evaluation_funcs_1_1.py │ │ │ │ └── script.py │ │ │ ├── spotting_metric.py │ │ │ ├── upload_ocrbench_v2.py │ │ │ ├── utils.py │ │ │ └── vqa_metric.py │ │ ├── ok_vqa │ │ │ ├── _default_template_vqa_yaml │ │ │ ├── _generate_config.py │ │ │ ├── _ok_vqa.yaml │ │ │ ├── ok_vqa_val2014.yaml │ │ │ ├── ok_vqa_val2014_lite.yaml │ │ │ └── utils.py │ │ ├── olympiadbench │ │ │ ├── cn_utils.py │ │ │ ├── en_utils.py │ │ │ ├── olympiadbench.yaml │ │ │ ├── olympiadbench_OE_MM_maths_en_COMP.yaml │ │ │ ├── olympiadbench_OE_MM_physics_en_COMP.yaml │ │ │ ├── olympiadbench_evals.py │ │ │ └── testmini_utils.py │ │ ├── olympiadbench_mimo │ │ │ ├── en_utils.py │ │ │ ├── olympiadbench_all_boxed.yaml │ │ │ ├── olympiadbench_boxed.yaml │ │ │ ├── olympiadbench_evals.py │ │ │ ├── olympiadbench_image_math_en.yaml │ │ │ ├── olympiadbench_image_math_zh.yaml │ │ │ ├── olympiadbench_image_physics_en.yaml │ │ │ ├── olympiadbench_image_physics_zh.yaml │ │ │ ├── olympiadbench_math_en.yaml │ │ │ ├── olympiadbench_math_en_no_proof.yaml │ │ │ ├── olympiadbench_math_zh.yaml │ │ │ ├── olympiadbench_math_zh_no_proof.yaml │ │ │ ├── olympiadbench_official.yaml │ │ │ ├── olympiadbench_official_en.yaml │ │ │ ├── olympiadbench_official_en_no_proof.yaml │ │ │ ├── olympiadbench_official_no_proof.yaml │ │ │ ├── olympiadbench_official_zh.yaml │ │ │ ├── olympiadbench_official_zh_no_proof.yaml │ │ │ ├── olympiadbench_physics_en.yaml │ │ │ ├── olympiadbench_physics_en_no_proof.yaml │ │ │ ├── olympiadbench_physics_zh.yaml │ │ │ ├── olympiadbench_physics_zh_no_proof.yaml │ │ │ ├── utils.py │ │ │ └── zh_utils.py │ │ ├── omni_bench │ │ │ ├── _default_template_yaml │ │ │ ├── omni_bench.yaml │ │ │ ├── omni_bench_audio_transcript.yaml │ │ │ ├── omni_bench_image_caption.yaml │ │ │ └── utils.py │ │ ├── open_asr │ │ │ ├── _default_template_yaml │ │ │ ├── openasr.yaml │ │ │ ├── openasr_ami.yaml │ │ │ ├── openasr_common_voice.yaml │ │ │ ├── openasr_earnings22.yaml │ │ │ ├── openasr_gigaspeech.yaml │ │ │ ├── openasr_librispeech.yaml │ │ │ ├── openasr_librispeech_test_clean.yaml │ │ │ ├── openasr_librispeech_test_other.yaml │ │ │ ├── openasr_spgispeech.yaml │ │ │ ├── openasr_tedlium.yaml │ │ │ ├── openasr_voxpopuli.yaml │ │ │ └── utils.py │ │ ├── openai_math │ │ │ ├── openai_math.yaml │ │ │ ├── openai_math_agg64.yaml │ │ │ ├── openai_math_cov64.yaml │ │ │ ├── openai_math_cov64_train.yaml │ │ │ ├── openai_math_maj64_cov64.yaml │ │ │ ├── openai_math_maj64_cov64_train.yaml │ │ │ ├── openai_math_train.yaml │ │ │ └── utils.py │ │ ├── openhermes │ │ │ ├── openhermes.yaml │ │ │ └── utils.py │ │ ├── people_speech │ │ │ ├── people_speech_val.yaml │ │ │ └── utils.py │ │ ├── perceptiontest │ │ │ ├── test │ │ │ │ ├── _default_template_yaml │ │ │ │ ├── perceptiontest_mc.yaml │ │ │ │ ├── perceptiontest_mcppl.yaml │ │ │ │ └── utils.py │ │ │ └── val │ │ │ │ ├── _default_template_yaml │ │ │ │ ├── perceptiontest_mc.yaml │ │ │ │ ├── perceptiontest_mcppl.yaml │ │ │ │ └── utils.py │ │ ├── phyx │ │ │ ├── phyx.yaml │ │ │ ├── phyx_evals.py │ │ │ ├── phyx_mc.yaml │ │ │ ├── phyx_mini_mc.yaml │ │ │ ├── phyx_mini_oe.yaml │ │ │ ├── phyx_oe.yaml │ │ │ └── utils.py │ │ ├── plm_videobench │ │ │ ├── README.md │ │ │ ├── _default_template_yaml │ │ │ ├── eval_utils.py │ │ │ ├── fgqa │ │ │ │ ├── fgqa_test.yaml │ │ │ │ └── fgqa_utils.py │ │ │ ├── rcap │ │ │ │ ├── rcap_test.yaml │ │ │ │ └── rcap_utils.py │ │ │ ├── rdcap │ │ │ │ ├── rdcap_test.yaml │ │ │ │ └── rdcap_utils.py │ │ │ ├── rtloc │ │ │ │ ├── rtloc_test.yaml │ │ │ │ └── rtloc_utils.py │ │ │ └── sgqa │ │ │ │ ├── sgqa_test.yaml │ │ │ │ └── sgqa_utils.py │ │ ├── pope │ │ │ ├── pope.yaml │ │ │ ├── pope_adv.yaml │ │ │ ├── pope_full.yaml │ │ │ ├── pope_pop.yaml │ │ │ ├── pope_random.yaml │ │ │ └── utils.py │ │ ├── qbench │ │ │ ├── abench_dev.yaml │ │ │ ├── qbench2_dev.yaml │ │ │ ├── qbench_dev.yaml │ │ │ ├── qbenchs_dev.yaml │ │ │ └── utils.py │ │ ├── realworldqa │ │ │ ├── realworldqa.yaml │ │ │ └── utils.py │ │ ├── refcoco+ │ │ │ ├── _default_template_bbox_rec_yaml │ │ │ ├── _default_template_bbox_yaml │ │ │ ├── _default_template_seg_yaml │ │ │ ├── _generate_config.py │ │ │ ├── _refcoco.yaml │ │ │ ├── refcoco+_bbox_rec_testA.yaml │ │ │ ├── refcoco+_bbox_rec_testB.yaml │ │ │ ├── refcoco+_bbox_rec_val.yaml │ │ │ ├── refcoco+_bbox_testA.yaml │ │ │ ├── refcoco+_bbox_testB.yaml │ │ │ ├── refcoco+_bbox_val.yaml │ │ │ ├── refcoco+_seg_testA.yaml │ │ │ ├── refcoco+_seg_testB.yaml │ │ │ ├── refcoco+_seg_val.yaml │ │ │ ├── utils.py │ │ │ └── utils_rec.py │ │ ├── refcoco │ │ │ ├── _default_template_bbox_rec_yaml │ │ │ ├── _default_template_bbox_yaml │ │ │ ├── _default_template_seg_yaml │ │ │ ├── _generate_config.py │ │ │ ├── _refcoco.yaml │ │ │ ├── refcoco_bbox_rec_test.yaml │ │ │ ├── refcoco_bbox_rec_testA.yaml │ │ │ ├── refcoco_bbox_rec_testB.yaml │ │ │ ├── refcoco_bbox_rec_val.yaml │ │ │ ├── refcoco_bbox_test.yaml │ │ │ ├── refcoco_bbox_testA.yaml │ │ │ ├── refcoco_bbox_testB.yaml │ │ │ ├── refcoco_bbox_val.yaml │ │ │ ├── refcoco_bbox_val_lite.yaml │ │ │ ├── refcoco_seg_test.yaml │ │ │ ├── refcoco_seg_testA.yaml │ │ │ ├── refcoco_seg_testB.yaml │ │ │ ├── refcoco_seg_val.yaml │ │ │ ├── utils.py │ │ │ └── utils_rec.py │ │ ├── refcocog │ │ │ ├── _default_template_bbox_rec_yaml │ │ │ ├── _default_template_bbox_yaml │ │ │ ├── _default_template_seg_yaml │ │ │ ├── _generate_config.py │ │ │ ├── _refcoco.yaml │ │ │ ├── refcocog_bbox_rec_test.yaml │ │ │ ├── refcocog_bbox_rec_val.yaml │ │ │ ├── refcocog_bbox_test.yaml │ │ │ ├── refcocog_bbox_val.yaml │ │ │ ├── refcocog_seg_test.yaml │ │ │ ├── refcocog_seg_val.yaml │ │ │ ├── utils.py │ │ │ └── utils_rec.py │ │ ├── salbench │ │ │ ├── _o3_default │ │ │ ├── _p3_default │ │ │ ├── o3.yaml │ │ │ ├── o3_box.yaml │ │ │ ├── o3_box_img.yaml │ │ │ ├── p3.yaml │ │ │ ├── p3_box.yaml │ │ │ ├── p3_box_img.yaml │ │ │ └── utils.py │ │ ├── scienceqa │ │ │ ├── scienceqa.yaml │ │ │ ├── scienceqa_full.yaml │ │ │ ├── scienceqa_img.yaml │ │ │ └── utils.py │ │ ├── screenspot │ │ │ ├── README.md │ │ │ ├── _default_template_rec_yaml │ │ │ ├── _default_template_reg_yaml │ │ │ ├── _screenspot.yaml │ │ │ ├── screenspot_rec_test.yaml │ │ │ ├── screenspot_reg_test.yaml │ │ │ ├── utils.py │ │ │ └── utils_rec.py │ │ ├── seedbench │ │ │ ├── ko_utils.py │ │ │ ├── seedbench.yaml │ │ │ ├── seedbench_ko.yaml │ │ │ ├── seedbench_lite.yaml │ │ │ ├── seedbench_ppl.yaml │ │ │ └── utils.py │ │ ├── seedbench_2 │ │ │ ├── seedbench_2.yaml │ │ │ └── utils.py │ │ ├── seedbench_2_plus │ │ │ ├── seedbench_2_plus.yaml │ │ │ └── utils.py │ │ ├── stvqa │ │ │ ├── stvqa.yaml │ │ │ └── utils.py │ │ ├── synthdog │ │ │ ├── donut_evaluator.py │ │ │ ├── synthdog.yaml │ │ │ ├── synthdog_en.yaml │ │ │ ├── synthdog_zh.yaml │ │ │ └── utils.py │ │ ├── tedlium │ │ │ ├── tedlium_dev_test.yaml │ │ │ ├── tedlium_long_form.yaml │ │ │ └── utils.py │ │ ├── tempcompass │ │ │ ├── _default_template_yaml │ │ │ ├── _tempcompass.yaml │ │ │ ├── tempcompass_caption_matching.yaml │ │ │ ├── tempcompass_captioning.yaml │ │ │ ├── tempcompass_mc.yaml │ │ │ ├── tempcompass_yes_no.yaml │ │ │ └── utils.py │ │ ├── temporalbench │ │ │ ├── temporalbench.yaml │ │ │ ├── temporalbench_long_qa.yaml │ │ │ ├── temporalbench_short_caption.yaml │ │ │ ├── temporalbench_short_qa.yaml │ │ │ └── utils.py │ │ ├── textcaps │ │ │ ├── _default_template_textcaps_yaml │ │ │ ├── textcaps.yaml │ │ │ ├── textcaps_test.yaml │ │ │ ├── textcaps_train.yaml │ │ │ ├── textcaps_val.yaml │ │ │ ├── textcaps_val_lite.yaml │ │ │ └── utils.py │ │ ├── textvqa │ │ │ ├── _default_template_textvqa_yaml │ │ │ ├── _textvqa.yaml │ │ │ ├── textvqa_test.yaml │ │ │ ├── textvqa_val.yaml │ │ │ ├── textvqa_val_lite.yaml │ │ │ └── utils.py │ │ ├── timescope │ │ │ ├── timescope.yaml │ │ │ └── utils.py │ │ ├── tomato │ │ │ ├── tomato.yaml │ │ │ └── utils.py │ │ ├── vatex │ │ │ ├── _vatex.yaml │ │ │ ├── utils.py │ │ │ ├── vatex_test.yaml │ │ │ └── vatex_val_zh.yaml │ │ ├── vcr_wiki │ │ │ ├── _default_template_vcr_yaml │ │ │ ├── utils.py │ │ │ ├── vcr_wiki_en_easy.yaml │ │ │ ├── vcr_wiki_en_easy_100.yaml │ │ │ ├── vcr_wiki_en_easy_500.yaml │ │ │ ├── vcr_wiki_en_hard.yaml │ │ │ ├── vcr_wiki_en_hard_100.yaml │ │ │ ├── vcr_wiki_en_hard_500.yaml │ │ │ ├── vcr_wiki_zh_easy.yaml │ │ │ ├── vcr_wiki_zh_easy_100.yaml │ │ │ ├── vcr_wiki_zh_easy_500.yaml │ │ │ ├── vcr_wiki_zh_hard.yaml │ │ │ ├── vcr_wiki_zh_hard_100.yaml │ │ │ └── vcr_wiki_zh_hard_500.yaml │ │ ├── vdc │ │ │ ├── README.md │ │ │ ├── _default_template_yaml │ │ │ ├── background_test.yaml │ │ │ ├── camera_test.yaml │ │ │ ├── detailed_test.yaml │ │ │ ├── main_object_test.yaml │ │ │ ├── short_test.yaml │ │ │ └── utils.py │ │ ├── vibe_eval │ │ │ ├── utils.py │ │ │ └── vibe_eval.yaml │ │ ├── video-tt │ │ │ ├── _default_template.yaml │ │ │ ├── gpt_utils.py │ │ │ ├── utils.py │ │ │ ├── videott_all.yaml │ │ │ ├── videott_all_audio.yaml │ │ │ ├── videott_correct_leading_oe.yaml │ │ │ ├── videott_no_leading_oe.yaml │ │ │ ├── videott_paraphrase_oe.yaml │ │ │ ├── videott_single_mc.yaml │ │ │ ├── videott_single_mc_description.yaml │ │ │ └── videott_wrong_leading_oe.yaml │ │ ├── video_detail_description │ │ │ ├── README.md │ │ │ ├── _default_template_yaml │ │ │ ├── utils.py │ │ │ └── video_detail_description.yaml │ │ ├── videochatgpt │ │ │ ├── _default_template_yaml │ │ │ ├── _videochatgpt.yaml │ │ │ ├── utils.py │ │ │ ├── videochatgpt_consistency.yaml │ │ │ ├── videochatgpt_generic.yaml │ │ │ └── videochatgpt_temporal.yaml │ │ ├── videoevalpro │ │ │ ├── utils.py │ │ │ └── videoevalpro.yaml │ │ ├── videomathqa │ │ │ ├── README.md │ │ │ ├── cot_postprocess.py │ │ │ ├── cot_step_evaluation.py │ │ │ ├── utils.py │ │ │ ├── videomathqa_mbin.yaml │ │ │ ├── videomathqa_mbin_cot.yaml │ │ │ ├── videomathqa_mbin_cot_w_subtitle.yaml │ │ │ ├── videomathqa_mbin_w_subtitle.yaml │ │ │ ├── videomathqa_mcq.yaml │ │ │ ├── videomathqa_mcq_cot.yaml │ │ │ ├── videomathqa_mcq_cot_w_subtitle.yaml │ │ │ └── videomathqa_mcq_w_subtitle.yaml │ │ ├── videomme │ │ │ ├── utils.py │ │ │ ├── videomme.yaml │ │ │ └── videomme_w_subtitle.yaml │ │ ├── videommmu │ │ │ ├── _default_template_yaml │ │ │ ├── adaptation.yaml │ │ │ ├── adaptation_question_only.yaml │ │ │ ├── comprehension.yaml │ │ │ ├── perception.yaml │ │ │ ├── utils.py │ │ │ └── video_mmmu.yaml │ │ ├── vinoground │ │ │ ├── utils.py │ │ │ └── vinoground.yaml │ │ ├── visualwebbench │ │ │ ├── prompts.py │ │ │ ├── utils.py │ │ │ ├── visualwebbench_action_ground.yaml │ │ │ ├── visualwebbench_action_prediction.yaml │ │ │ ├── visualwebbench_element_ground.yaml │ │ │ ├── visualwebbench_element_ocr.yaml │ │ │ ├── visualwebbench_heading_ocr.yaml │ │ │ ├── visualwebbench_web_caption.yaml │ │ │ └── visualwebbench_webqa.yaml │ │ ├── vitatecs │ │ │ ├── _default_template_yaml │ │ │ ├── _vitatecs.yaml │ │ │ ├── utils.py │ │ │ ├── vitatecs_compositionality.yaml │ │ │ ├── vitatecs_direction.yaml │ │ │ ├── vitatecs_intensity.yaml │ │ │ ├── vitatecs_localization.yaml │ │ │ ├── vitatecs_sequence.yaml │ │ │ └── vitatecs_type.yaml │ │ ├── vizwiz_vqa │ │ │ ├── _default_template_vqa_yaml │ │ │ ├── _generate_config.py │ │ │ ├── _vizwiz_vqa.yaml │ │ │ ├── utils.py │ │ │ ├── vizwiz_vqa_test.yaml │ │ │ ├── vizwiz_vqa_val.yaml │ │ │ └── vizwiz_vqa_val_lite.yaml │ │ ├── vl_rewardbench │ │ │ ├── utils.py │ │ │ └── vl_rewardbench.yaml │ │ ├── vlmsareblind │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── utils.py │ │ │ ├── vlmsareblind.yaml │ │ │ └── vlmsareblind_lite.yaml │ │ ├── vmcbench │ │ │ ├── utils.py │ │ │ └── vmcbench.yaml │ │ ├── vocalsound │ │ │ ├── _default_template_yaml │ │ │ ├── utils.py │ │ │ ├── vocalsound_test.yaml │ │ │ └── vocalsound_val.yaml │ │ ├── vqav2 │ │ │ ├── _default_template_vqav2_yaml │ │ │ ├── _vqav2.yaml │ │ │ ├── utils.py │ │ │ ├── vqav2_test.yaml │ │ │ ├── vqav2_val.yaml │ │ │ └── vqav2_val_lite.yaml │ │ ├── vsibench │ │ │ ├── utils.py │ │ │ └── vsibench.yaml │ │ ├── vstar_bench │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── _default_template_yaml │ │ │ ├── utils.py │ │ │ ├── vstar_bench.yaml │ │ │ ├── vstar_bench_direct_attributes.yaml │ │ │ └── vstar_bench_relative_position.yaml │ │ ├── wavcaps │ │ │ ├── utils.py │ │ │ └── wavcaps.yaml │ │ ├── websrc │ │ │ ├── README.md │ │ │ ├── utils.py │ │ │ ├── websrc.yaml │ │ │ ├── websrc_test.yaml │ │ │ └── websrc_val.yaml │ │ ├── wild_vision_bench │ │ │ ├── _default_template_yaml │ │ │ ├── utils.py │ │ │ ├── wild_vision_bench0617.yaml │ │ │ ├── wild_vision_bench0630.yaml │ │ │ └── wildvision_bench.yaml │ │ ├── worldqa │ │ │ ├── _default_template_yaml │ │ │ ├── utils.py │ │ │ ├── worldqa.yaml │ │ │ ├── worldqa_generation.yaml │ │ │ ├── worldqa_mc.yaml │ │ │ ├── worldqa_mc_evaluator.py │ │ │ └── worldqa_mcppl.yaml │ │ ├── worldsense │ │ │ ├── utils.py │ │ │ ├── worldsense.yaml │ │ │ └── worldsense_w_subtitle.yaml │ │ ├── xlrs │ │ │ ├── XLRS-lite.yaml │ │ │ └── mcq_utils.py │ │ └── youcook2 │ │ │ ├── _default_template_yaml │ │ │ ├── utils.py │ │ │ └── youcook2_val.yaml │ └── utils.py ├── miscs │ ├── example_eval.yaml │ ├── llava_repr_requirements.txt │ ├── llava_result_check.md │ ├── llava_sglang_result_check.md │ ├── repr_torch_envs.txt │ ├── scienceqa_id.txt │ ├── script.sh │ ├── test_llava.py │ ├── test_scienceqa.py │ └── tinyllava_repr_requirements.txt ├── plotly.min.js ├── pyproject.toml ├── setup.py ├── tools │ ├── get_split_zip.py │ ├── get_video_avg_time.py │ ├── lite │ │ ├── embed.py │ │ ├── embedder │ │ │ ├── BaseEmbedder.py │ │ │ ├── ClipBgeEmbedder.py │ │ │ └── __init__.py │ │ ├── shrink.py │ │ └── shrinker │ │ │ ├── BaseShrinker.py │ │ │ ├── EmbedShrinker.py │ │ │ ├── __init__.py │ │ │ └── sampling_methods │ │ │ ├── __init__.py │ │ │ ├── kcenter_greedy.py │ │ │ └── sampling_def.py │ ├── live_bench │ │ ├── create_dataset.py │ │ ├── data_summary.ipynb │ │ ├── example.ipynb │ │ ├── filter.ipynb │ │ ├── live_bench │ │ │ ├── __init__.py │ │ │ ├── api │ │ │ │ └── live_bench.py │ │ │ ├── data_generator │ │ │ │ ├── __init__.py │ │ │ │ ├── check_prompt.md │ │ │ │ ├── default_criteria.md │ │ │ │ ├── example │ │ │ │ │ ├── example_output.json │ │ │ │ │ └── example_website.png │ │ │ │ ├── live_bench.py │ │ │ │ ├── live_bench_data.py │ │ │ │ ├── prompt.md │ │ │ │ ├── qa_generator.py │ │ │ │ ├── question_finalizer.py │ │ │ │ ├── response.py │ │ │ │ ├── score_getter.py │ │ │ │ ├── score_prompt.md │ │ │ │ └── utils │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── claude.py │ │ │ │ │ ├── extract_information.py │ │ │ │ │ ├── gemini.py │ │ │ │ │ └── gpt4v.py │ │ │ ├── driver │ │ │ │ ├── .gitignore │ │ │ │ ├── __init__.py │ │ │ │ └── load_driver.py │ │ │ ├── screen_shoter │ │ │ │ ├── __init__.py │ │ │ │ ├── screen.py │ │ │ │ └── screen_shoter.py │ │ │ ├── view.ipynb │ │ │ └── websites │ │ │ │ ├── __init__.py │ │ │ │ ├── load_website.py │ │ │ │ ├── website.py │ │ │ │ └── website_list.yaml │ │ ├── pyproject.toml │ │ ├── refine_all_results.py │ │ ├── script │ │ │ ├── README.md │ │ │ ├── change.ipynb │ │ │ ├── compare.ipynb │ │ │ ├── modify.ipynb │ │ │ ├── refractor.py │ │ │ ├── select.ipynb │ │ │ ├── update_banchmark.ipynb │ │ │ └── upload_results.py │ │ ├── setup.py │ │ └── summerize.ipynb │ ├── make_audio_hf_dataset.ipynb │ ├── make_image_hf_dataset.ipynb │ ├── make_vatex.py │ ├── make_video_hf_dataset.ipynb │ ├── make_video_hf_dataset_from_json.py │ ├── makecvrr.ipynb │ └── regression.py └── uv.lock ├── ms-swift ├── .dev_scripts │ ├── build_docs.sh │ ├── ci_container_test.sh │ └── dockerci.sh ├── .github │ ├── ISSUE_TEMPLATE │ │ ├── bug_report.md │ │ ├── custom.md │ │ └── feature_request.md │ ├── PULL_REQUEST_TEMPLATE.md │ ├── SECURITY.md │ └── workflows │ │ ├── citest.yaml │ │ ├── close_tale_issue.yaml │ │ ├── lint.yaml │ │ └── publish.yaml ├── .gitignore ├── .pre-commit-config.yaml ├── .pre-commit-config_local.yaml ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── CONTRIBUTING_CN.md ├── LICENSE ├── MANIFEST.in ├── Makefile ├── README.md ├── README_CN.md ├── asset │ ├── banner.png │ ├── ding.png │ ├── discord_qr.jpg │ ├── wechat.png │ ├── wechat_grpo.png │ └── wechat_megatron.png ├── docs │ ├── Makefile │ ├── README.md │ ├── make.bat │ ├── resources │ │ ├── asyncengine.png │ │ ├── deepeyes.png │ │ ├── dpo_data.png │ │ ├── grpo.png │ │ ├── grpo_clevr_count.png │ │ ├── grpo_code.png │ │ ├── grpo_countdown.png │ │ ├── grpo_countdown_1.png │ │ ├── grpo_geoqa.png │ │ ├── grpo_openr1_multimodal.png │ │ ├── gym_env.png │ │ ├── kto_data.png │ │ ├── multiturn_pipeline.png │ │ ├── web-ui-en.jpg │ │ └── web-ui.jpg │ ├── source │ │ ├── .readthedocs.yaml │ │ ├── BestPractices │ │ │ ├── Embedding训练.md │ │ │ ├── GRPO代码训练.md │ │ │ ├── GRPO多模态训练.md │ │ │ ├── GRPO完整流程.md │ │ │ ├── NPU支持.md │ │ │ ├── Qwen3最佳实践.md │ │ │ ├── Reranker训练.md │ │ │ ├── 快速训练VL模型.md │ │ │ └── 更多最佳实践.md │ │ ├── Customization │ │ │ ├── 插件化.md │ │ │ ├── 自定义数据集.md │ │ │ └── 自定义模型.md │ │ ├── GetStarted │ │ │ ├── SWIFT安装.md │ │ │ ├── Web-UI.md │ │ │ └── 快速开始.md │ │ ├── Instruction │ │ │ ├── Agent支持.md │ │ │ ├── GRPO │ │ │ │ ├── AdvancedResearch │ │ │ │ │ ├── DAPO.md │ │ │ │ │ ├── GSPO.md │ │ │ │ │ ├── deepeyes.md │ │ │ │ │ ├── entropy_mask.md │ │ │ │ │ └── index.rst │ │ │ │ ├── DeveloperGuide │ │ │ │ │ ├── GYM环境训练.md │ │ │ │ │ ├── index.rst │ │ │ │ │ ├── 多任务.md │ │ │ │ │ ├── 多轮训练.md │ │ │ │ │ ├── 奖励函数.md │ │ │ │ │ └── 奖励模型.md │ │ │ │ ├── GetStarted │ │ │ │ │ ├── GRPO.md │ │ │ │ │ └── index.rst │ │ │ │ └── index.rst │ │ │ ├── Megatron-SWIFT训练.md │ │ │ ├── ReleaseNote3.0.md │ │ │ ├── 人类对齐.md │ │ │ ├── 使用tuners.md │ │ │ ├── 命令行参数.md │ │ │ ├── 导出与推送.md │ │ │ ├── 常见问题整理.md │ │ │ ├── 强化微调.md │ │ │ ├── 推理和部署.md │ │ │ ├── 支持的模型和数据集.md │ │ │ ├── 评测.md │ │ │ ├── 采样.md │ │ │ └── 预训练与微调.md │ │ ├── _templates │ │ │ ├── autosummary │ │ │ │ └── class.rst │ │ │ ├── classtemplate.rst │ │ │ └── sobolengine.rst │ │ ├── conf.py │ │ └── index.rst │ └── source_en │ │ ├── .readthedocs.yaml │ │ ├── BestPractices │ │ ├── Embedding.md │ │ ├── GRPO-Code-Training.md │ │ ├── GRPO-Multi-Modal-Training.md │ │ ├── GRPO.md │ │ ├── More-Best-Practices.md │ │ ├── NPU-support.md │ │ ├── Qwen3-Best-Practice.md │ │ ├── Rapidly-Training-VL-model.md │ │ └── Reranker.md │ │ ├── Customization │ │ ├── Custom-dataset.md │ │ ├── Custom-model.md │ │ └── Pluginization.md │ │ ├── GetStarted │ │ ├── Quick-start.md │ │ ├── SWIFT-installation.md │ │ └── Web-UI.md │ │ ├── Instruction │ │ ├── Agent-support.md │ │ ├── Command-line-parameters.md │ │ ├── Evaluation.md │ │ ├── Export-and-push.md │ │ ├── Frequently-asked-questions.md │ │ ├── GRPO │ │ │ ├── AdvancedResearch │ │ │ │ ├── DAPO.md │ │ │ │ ├── GSPO.md │ │ │ │ ├── deepeyes.md │ │ │ │ ├── entropy_mask.md │ │ │ │ └── index.rst │ │ │ ├── DeveloperGuide │ │ │ │ ├── gym_env.md │ │ │ │ ├── index.rst │ │ │ │ ├── multi_task.md │ │ │ │ ├── multi_turn.md │ │ │ │ ├── reward_function.md │ │ │ │ └── reward_model.md │ │ │ ├── GetStarted │ │ │ │ ├── GRPO.md │ │ │ │ └── index.rst │ │ │ └── index.rst │ │ ├── Inference-and-deployment.md │ │ ├── Megatron-SWIFT-Training.md │ │ ├── Pre-training-and-Fine-tuning.md │ │ ├── RLHF.md │ │ ├── Reinforced-Fine-tuning.md │ │ ├── ReleaseNote3.0.md │ │ ├── Sample.md │ │ ├── Supported-models-and-datasets.md │ │ └── Use-tuners.md │ │ ├── _templates │ │ ├── autosummary │ │ │ └── class.rst │ │ ├── classtemplate.rst │ │ └── sobolengine.rst │ │ ├── conf.py │ │ └── index.rst ├── examples │ ├── README.md │ ├── app │ │ ├── base_url │ │ │ ├── demo.py │ │ │ └── demo.sh │ │ ├── llm │ │ │ ├── sglang.sh │ │ │ └── vllm.sh │ │ └── mllm.sh │ ├── custom │ │ ├── dataset.py │ │ ├── infer.sh │ │ ├── model.py │ │ ├── model_hf.py │ │ └── sft.sh │ ├── deploy │ │ ├── agent │ │ │ ├── client.py │ │ │ └── server.sh │ │ ├── bert │ │ │ ├── client.py │ │ │ └── server.sh │ │ ├── client │ │ │ ├── llm │ │ │ │ ├── base │ │ │ │ │ ├── openai_client.py │ │ │ │ │ └── swift_client.py │ │ │ │ └── chat │ │ │ │ │ ├── openai_client.py │ │ │ │ │ └── swift_client.py │ │ │ └── mllm │ │ │ │ ├── openai_client.py │ │ │ │ └── swift_client.py │ │ ├── embedding │ │ │ ├── client.py │ │ │ └── server.sh │ │ ├── lora │ │ │ ├── client.py │ │ │ └── server.sh │ │ ├── reward_model │ │ │ ├── client.py │ │ │ └── server.sh │ │ └── server │ │ │ ├── README.md │ │ │ ├── sglang.sh │ │ │ └── vllm.sh │ ├── eval │ │ ├── eval_url │ │ │ ├── demo.py │ │ │ └── eval.sh │ │ ├── llm │ │ │ ├── sglang.sh │ │ │ └── vllm.sh │ │ ├── train_eval │ │ │ └── train.sh │ │ └── vlm │ │ │ └── eval.sh │ ├── export │ │ ├── cached_dataset │ │ │ ├── mcore.sh │ │ │ ├── pretrained.sh │ │ │ └── sft.sh │ │ ├── merge_lora.sh │ │ ├── ollama.sh │ │ ├── push_to_hub.sh │ │ └── quantize │ │ │ ├── awq.sh │ │ │ ├── bert │ │ │ ├── bnb.sh │ │ │ └── gptq.sh │ │ │ ├── bnb.sh │ │ │ ├── fp8.sh │ │ │ ├── gptq.sh │ │ │ ├── mllm │ │ │ ├── awq.sh │ │ │ ├── bnb.sh │ │ │ ├── fp8.sh │ │ │ └── gptq.sh │ │ │ ├── moe │ │ │ ├── awq.sh │ │ │ ├── bnb.sh │ │ │ ├── fp8.sh │ │ │ └── gptq.sh │ │ │ ├── omni │ │ │ └── gptq.sh │ │ │ └── reward_model │ │ │ ├── bnb.sh │ │ │ └── gptq.sh │ ├── infer │ │ ├── cli_demo.sh │ │ ├── demo.py │ │ ├── demo_agent.py │ │ ├── demo_bert.py │ │ ├── demo_grounding.py │ │ ├── demo_hf.py │ │ ├── demo_lora.py │ │ ├── demo_mllm.py │ │ ├── demo_reward_model.py │ │ ├── lmdeploy │ │ │ └── mllm_tp.sh │ │ ├── pt │ │ │ ├── batch_ddp.sh │ │ │ ├── bert.sh │ │ │ ├── lora.sh │ │ │ ├── mllm_device_map.sh │ │ │ ├── prm.sh │ │ │ └── reward_model.sh │ │ ├── sglang │ │ │ ├── demo.sh │ │ │ ├── distill_qwen3_235b.sh │ │ │ └── tp.sh │ │ └── vllm │ │ │ ├── dp_tp.sh │ │ │ ├── mllm_ddp.sh │ │ │ └── mllm_tp.sh │ ├── models │ │ ├── deepseek_vl2 │ │ │ └── train.sh │ │ ├── gpt_oss │ │ │ └── train.sh │ │ ├── internvl3 │ │ │ └── train.sh │ │ ├── minicpmv │ │ │ └── train.sh │ │ └── ovis2 │ │ │ └── train.sh │ ├── notebook │ │ ├── qwen2_5-self-cognition │ │ │ ├── infer.ipynb │ │ │ ├── infer.sh │ │ │ ├── self-cognition-sft.ipynb │ │ │ └── sft.sh │ │ ├── qwen2_5-vl-grounding │ │ │ └── zh.ipynb │ │ └── qwen2vl-ocr │ │ │ ├── infer.ipynb │ │ │ └── ocr-sft.ipynb │ ├── sampler │ │ ├── distill │ │ │ └── distill.sh │ │ └── mcts │ │ │ ├── mcts.py │ │ │ ├── mcts.sh │ │ │ └── system_prompt.txt │ └── train │ │ ├── agent │ │ ├── deepseek_r1.sh │ │ ├── glm4.sh │ │ ├── loss_scale │ │ │ ├── infer_lora.py │ │ │ └── train.sh │ │ └── qwen2_5.sh │ │ ├── all_to_all │ │ ├── infer.sh │ │ └── train.sh │ │ ├── base_to_chat │ │ ├── full.sh │ │ ├── lora.sh │ │ └── lora2.sh │ │ ├── embedding │ │ ├── train_emb.sh │ │ └── train_gme.sh │ │ ├── flash_attention_3 │ │ ├── mcore.sh │ │ └── transformers.sh │ │ ├── full │ │ ├── infer.sh │ │ ├── qwen2_5_32b.sh │ │ └── train.sh │ │ ├── grpo │ │ ├── external │ │ │ ├── README.md │ │ │ ├── agent.sh │ │ │ ├── grpo_32b_full.sh │ │ │ ├── grpo_7b.sh │ │ │ ├── vllm_gym.sh │ │ │ └── vllm_multi_turn.sh │ │ ├── internal │ │ │ ├── README.md │ │ │ ├── full_lmdeploy.sh │ │ │ ├── pt.sh │ │ │ ├── vllm_72b_4gpu.sh │ │ │ ├── vllm_lora_qwenvl72b.sh │ │ │ ├── vllm_multi_turn.sh │ │ │ └── vllm_vl7b.sh │ │ ├── multi_node │ │ │ ├── Qwen2_5_32B_full.sh │ │ │ ├── colocate_multi_node1.sh │ │ │ ├── colocate_multi_node2.sh │ │ │ ├── server_multi_node.sh │ │ │ └── train_dlc.sh │ │ ├── plugin │ │ │ ├── deepeyes │ │ │ │ ├── deepeyes.sh │ │ │ │ └── deepeyes_plugin.py │ │ │ ├── plugin.py │ │ │ ├── run_external_reward_func.sh │ │ │ └── run_external_reward_model.sh │ │ ├── prompt.txt │ │ └── qwen2_5_omni │ │ │ ├── grpo.sh │ │ │ └── infer.sh │ │ ├── infer.sh │ │ ├── liger │ │ └── sft.sh │ │ ├── lora_sft.sh │ │ ├── megatron │ │ ├── base_to_chat.sh │ │ ├── benchmark │ │ │ └── deepspeed.sh │ │ ├── dense │ │ │ ├── 72b_offload.sh │ │ │ └── qwen3_32b.sh │ │ ├── fp8.sh │ │ ├── long_text.sh │ │ ├── lora │ │ │ ├── dense.sh │ │ │ ├── dpo.sh │ │ │ ├── glm4_5_106b.sh │ │ │ ├── loss_scale.sh │ │ │ ├── moe.sh │ │ │ ├── new_special_tokens.sh │ │ │ └── qwen3_235b.sh │ │ ├── moe │ │ │ ├── deepseek_v3.sh │ │ │ ├── moe.sh │ │ │ ├── qwen3_moe.sh │ │ │ └── qwen3_moe_offload.sh │ │ ├── multi-node │ │ │ ├── node1.sh │ │ │ └── node2.sh │ │ ├── pretrain.sh │ │ ├── rlhf │ │ │ └── dpo │ │ │ │ ├── dense.sh │ │ │ │ └── moe.sh │ │ └── sft.sh │ │ ├── moe │ │ ├── llama4.sh │ │ └── qwen3_moe.sh │ │ ├── multi-gpu │ │ ├── ddp │ │ │ └── train.sh │ │ ├── ddp_device_map │ │ │ └── train.sh │ │ ├── deepspeed │ │ │ ├── train_zero2.sh │ │ │ └── train_zero3.sh │ │ ├── device_map │ │ │ └── train.sh │ │ └── fsdp_qlora │ │ │ ├── fsdp_offload.json │ │ │ └── train.sh │ │ ├── multi-node │ │ ├── accelerate │ │ │ ├── multi_node.yaml │ │ │ ├── train_node1.sh │ │ │ └── train_node2.sh │ │ ├── deepspeed │ │ │ ├── README.md │ │ │ ├── host.txt │ │ │ └── train.sh │ │ ├── dlc │ │ │ └── train.sh │ │ ├── swift │ │ │ ├── train_node1.sh │ │ │ └── train_node2.sh │ │ └── torchrun │ │ │ ├── train_node1.sh │ │ │ └── train_node2.sh │ │ ├── multimodal │ │ ├── audio.sh │ │ ├── caption.sh │ │ ├── grounding.sh │ │ ├── infer.sh │ │ ├── lora_llm_full_vit │ │ │ ├── custom_plugin.py │ │ │ ├── infer.sh │ │ │ ├── merge_lora.sh │ │ │ ├── seq_cls.sh │ │ │ └── sft.sh │ │ ├── ocr.sh │ │ ├── omni │ │ │ ├── infer.sh │ │ │ └── sft.sh │ │ ├── rlhf │ │ │ ├── dpo │ │ │ │ ├── full.sh │ │ │ │ └── lora.sh │ │ │ ├── gkd │ │ │ │ ├── fast.sh │ │ │ │ └── full.sh │ │ │ └── kto.sh │ │ ├── video.sh │ │ └── vit_gradient_checkpointing.sh │ │ ├── new_special_tokens │ │ ├── infer.sh │ │ ├── merge_lora.sh │ │ ├── tokens.txt │ │ └── train.sh │ │ ├── optimizer │ │ └── muon.sh │ │ ├── packing │ │ ├── liger_kernel.sh │ │ ├── llm.sh │ │ ├── qwen2_5_omni.sh │ │ ├── qwen2_5_vl.sh │ │ └── streaming.sh │ │ ├── padding_free │ │ ├── dpo.sh │ │ ├── dpo_vlm.sh │ │ └── sft.sh │ │ ├── plugins │ │ ├── channel_loss.sh │ │ ├── loss_scale.sh │ │ └── tuner_phi4_mm.sh │ │ ├── predict_with_generate │ │ └── train.sh │ │ ├── pretrain │ │ └── train.sh │ │ ├── qlora │ │ ├── awq │ │ │ ├── merge_lora.sh │ │ │ └── train.sh │ │ ├── bnb │ │ │ ├── merge_lora.sh │ │ │ └── train.sh │ │ ├── gptq.sh │ │ └── hqq.sh │ │ ├── reranker │ │ ├── train_generative_reranker.sh │ │ ├── train_generative_reranker_listwise.sh │ │ ├── train_reranker.sh │ │ └── train_reranker_listwise.sh │ │ ├── rft │ │ ├── math.json │ │ └── rft.py │ │ ├── rlhf │ │ ├── README.md │ │ ├── cpo.sh │ │ ├── dpo │ │ │ ├── full.sh │ │ │ └── lora.sh │ │ ├── gkd │ │ │ ├── fast.sh │ │ │ ├── full.sh │ │ │ └── think_model.sh │ │ ├── kto.sh │ │ ├── mpo.sh │ │ ├── orpo.sh │ │ ├── ppo │ │ │ ├── full.sh │ │ │ └── lora.sh │ │ ├── rm.sh │ │ └── simpo.sh │ │ ├── seq_cls │ │ ├── bert │ │ │ ├── deploy.sh │ │ │ ├── infer.sh │ │ │ └── sft.sh │ │ ├── multi_label │ │ │ └── sft.sh │ │ ├── qwen2_5 │ │ │ ├── deploy.sh │ │ │ ├── infer.sh │ │ │ └── sft.sh │ │ ├── qwen2_vl │ │ │ ├── infer.py │ │ │ ├── infer.sh │ │ │ └── sft.sh │ │ └── regression │ │ │ ├── deploy.sh │ │ │ ├── infer.sh │ │ │ └── sft.sh │ │ ├── sequence_parallel │ │ ├── ring_attention │ │ │ ├── sequence_parallel.sh │ │ │ ├── sequence_parallel_256k.sh │ │ │ ├── sequence_parallel_dpo.sh │ │ │ └── sequence_parallel_grpo.sh │ │ └── ulysses │ │ │ ├── sequence_parallel.sh │ │ │ ├── sequence_parallel_512k.sh │ │ │ ├── sequence_parallel_dpo.sh │ │ │ └── sequence_parallel_grpo.sh │ │ ├── streaming │ │ ├── lazy_tokenize.sh │ │ └── streaming.sh │ │ ├── think_model │ │ ├── deepseek_r1.sh │ │ ├── qwen3_demo1.sh │ │ └── qwen3_demo2.sh │ │ └── tuners │ │ ├── adalora │ │ └── train.sh │ │ ├── adapter │ │ └── train.sh │ │ ├── boft │ │ └── train.sh │ │ ├── bone │ │ └── train.sh │ │ ├── dora │ │ └── train.sh │ │ ├── galore │ │ ├── train_galore.sh │ │ └── train_qgalore.sh │ │ ├── lisa │ │ └── train.sh │ │ ├── llamapro │ │ └── train.sh │ │ ├── longlora │ │ └── train.sh │ │ ├── lora-ga │ │ └── train.sh │ │ ├── lora │ │ └── train.sh │ │ ├── neftune │ │ └── train.sh │ │ ├── olora │ │ └── train.sh │ │ ├── pissa │ │ └── train.sh │ │ ├── qlora │ │ └── train.sh │ │ ├── reft │ │ └── train.sh │ │ └── unsloth │ │ └── train.sh ├── fla │ ├── __init__.py │ ├── layers │ │ ├── __init__.py │ │ ├── abc.py │ │ ├── attn.py │ │ ├── based.py │ │ ├── bitattn.py │ │ ├── comba.py │ │ ├── delta_net.py │ │ ├── forgetting_attn.py │ │ ├── gated_deltanet.py │ │ ├── gated_deltaproduct.py │ │ ├── gla.py │ │ ├── gsa.py │ │ ├── hgrn.py │ │ ├── hgrn2.py │ │ ├── lightnet.py │ │ ├── linear_attn.py │ │ ├── mamba.py │ │ ├── mamba2.py │ │ ├── mesa_net.py │ │ ├── mla.py │ │ ├── multiscale_retention.py │ │ ├── nsa.py │ │ ├── path_attn.py │ │ ├── rebased.py │ │ ├── rodimus.py │ │ ├── rwkv6.py │ │ ├── rwkv7.py │ │ ├── simple_gla.py │ │ └── utils.py │ ├── models │ │ ├── __init__.py │ │ ├── abc │ │ │ ├── __init__.py │ │ │ ├── configuration_abc.py │ │ │ └── modeling_abc.py │ │ ├── bitnet │ │ │ ├── __init__.py │ │ │ ├── configuration_bitnet.py │ │ │ └── modeling_bitnet.py │ │ ├── comba │ │ │ ├── __init__.py │ │ │ ├── configuration_comba.py │ │ │ └── modeling_comba.py │ │ ├── delta_net │ │ │ ├── __init__.py │ │ │ ├── configuration_delta_net.py │ │ │ └── modeling_delta_net.py │ │ ├── forgetting_transformer │ │ │ ├── __init__.py │ │ │ ├── configuration_forgetting_transformer.py │ │ │ └── modeling_forgetting_transformer.py │ │ ├── gated_deltanet │ │ │ ├── __init__.py │ │ │ ├── configuration_gated_deltanet.py │ │ │ └── modeling_gated_deltanet.py │ │ ├── gated_deltaproduct │ │ │ ├── __init__.py │ │ │ ├── configuration_gated_deltaproduct.py │ │ │ └── modeling_gated_deltaproduct.py │ │ ├── gla │ │ │ ├── __init__.py │ │ │ ├── configuration_gla.py │ │ │ └── modeling_gla.py │ │ ├── gsa │ │ │ ├── __init__.py │ │ │ ├── configuration_gsa.py │ │ │ └── modeling_gsa.py │ │ ├── hgrn │ │ │ ├── __init__.py │ │ │ ├── configuration_hgrn.py │ │ │ └── modeling_hgrn.py │ │ ├── hgrn2 │ │ │ ├── __init__.py │ │ │ ├── configuration_hgrn2.py │ │ │ └── modeling_hgrn2.py │ │ ├── lightnet │ │ │ ├── __init__.py │ │ │ ├── configuration_lightnet.py │ │ │ └── modeling_lightnet.py │ │ ├── linear_attn │ │ │ ├── __init__.py │ │ │ ├── configuration_linear_attn.py │ │ │ └── modeling_linear_attn.py │ │ ├── mamba │ │ │ ├── __init__.py │ │ │ ├── configuration_mamba.py │ │ │ └── modeling_mamba.py │ │ ├── mamba2 │ │ │ ├── __init__.py │ │ │ ├── configuration_mamba2.py │ │ │ └── modeling_mamba2.py │ │ ├── mesa_net │ │ │ ├── __init__.py │ │ │ ├── configuration_mesa_net.py │ │ │ └── modeling_mesa_net.py │ │ ├── mla │ │ │ ├── __init__.py │ │ │ ├── configuration_mla.py │ │ │ └── modeling_mla.py │ │ ├── nsa │ │ │ ├── __init__.py │ │ │ ├── configuration_nsa.py │ │ │ └── modeling_nsa.py │ │ ├── path_attn │ │ │ ├── __init__.py │ │ │ ├── configuration_path_attention.py │ │ │ └── modeling_path_attention.py │ │ ├── retnet │ │ │ ├── __init__.py │ │ │ ├── configuration_retnet.py │ │ │ └── modeling_retnet.py │ │ ├── rodimus │ │ │ ├── __init__.py │ │ │ ├── configuration_rodimus.py │ │ │ └── modeling_rodimus.py │ │ ├── rwkv6 │ │ │ ├── __init__.py │ │ │ ├── configuration_rwkv6.py │ │ │ └── modeling_rwkv6.py │ │ ├── rwkv7 │ │ │ ├── __init__.py │ │ │ ├── configuration_rwkv7.py │ │ │ └── modeling_rwkv7.py │ │ ├── samba │ │ │ ├── __init__.py │ │ │ ├── configuration_samba.py │ │ │ └── modeling_samba.py │ │ ├── transformer │ │ │ ├── __init__.py │ │ │ ├── configuration_transformer.py │ │ │ └── modeling_transformer.py │ │ └── utils.py │ ├── modules │ │ ├── __init__.py │ │ ├── activations.py │ │ ├── convolution.py │ │ ├── feature_map.py │ │ ├── fused_bitlinear.py │ │ ├── fused_cross_entropy.py │ │ ├── fused_kl_div.py │ │ ├── fused_linear_cross_entropy.py │ │ ├── fused_norm_gate.py │ │ ├── grpo.py │ │ ├── l2norm.py │ │ ├── l2warp.py │ │ ├── layernorm.py │ │ ├── layernorm_gated.py │ │ ├── mlp.py │ │ ├── parallel.py │ │ ├── rotary.py │ │ └── token_shift.py │ ├── ops │ │ ├── __init__.py │ │ ├── abc │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ └── naive.py │ │ ├── attn │ │ │ ├── __init__.py │ │ │ ├── decoding.py │ │ │ └── parallel.py │ │ ├── based │ │ │ ├── __init__.py │ │ │ ├── fused_chunk.py │ │ │ ├── naive.py │ │ │ └── parallel.py │ │ ├── comba │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── utils.py │ │ │ └── wy_fast.py │ │ ├── common │ │ │ ├── __init__.py │ │ │ ├── chunk_delta_h.py │ │ │ ├── chunk_h.py │ │ │ ├── chunk_h_parallel.py │ │ │ ├── chunk_h_split.py │ │ │ ├── chunk_o.py │ │ │ ├── chunk_scaled_dot_kkt.py │ │ │ ├── fused_chunk.py │ │ │ └── fused_recurrent.py │ │ ├── delta_rule │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── naive.py │ │ │ ├── parallel.py │ │ │ └── wy_fast.py │ │ ├── forgetting_attn │ │ │ ├── __init__.py │ │ │ └── parallel.py │ │ ├── gated_delta_product │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── chunk_deltaproduct_h.py │ │ │ ├── chunk_deltaproduct_o.py │ │ │ ├── chunk_ref.py │ │ │ └── naive.py │ │ ├── gated_delta_rule │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_recurrent.py │ │ │ └── wy_fast.py │ │ ├── generalized_delta_rule │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── dplr │ │ │ │ ├── __init__.py │ │ │ │ ├── chunk.py │ │ │ │ ├── chunk_A_bwd.py │ │ │ │ ├── chunk_A_fwd.py │ │ │ │ ├── chunk_h_bwd.py │ │ │ │ ├── chunk_h_fwd.py │ │ │ │ ├── chunk_o_bwd.py │ │ │ │ ├── chunk_o_fwd.py │ │ │ │ ├── fused_recurrent.py │ │ │ │ ├── naive.py │ │ │ │ ├── wy_fast_bwd.py │ │ │ │ └── wy_fast_fwd.py │ │ │ └── iplr │ │ │ │ ├── __init__.py │ │ │ │ ├── chunk.py │ │ │ │ ├── fused_recurrent.py │ │ │ │ ├── naive.py │ │ │ │ └── wy_fast.py │ │ ├── gla │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ └── naive.py │ │ ├── gsa │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_recurrent.py │ │ │ └── naive.py │ │ ├── hgrn │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_recurrent.py │ │ │ └── naive.py │ │ ├── lightning_attn │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ └── fused_recurrent.py │ │ ├── linear_attn │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── naive.py │ │ │ └── utils.py │ │ ├── mesa_net │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── chunk_cg_solver_bwd.py │ │ │ ├── chunk_cg_solver_fwd.py │ │ │ ├── chunk_h_fwd.py │ │ │ ├── chunk_h_kk_intra_bwd.py │ │ │ ├── chunk_h_kv_intra_bwd.py │ │ │ ├── chunk_h_kv_intra_bwd_separate.py │ │ │ ├── decoding_one_step.py │ │ │ └── naive.py │ │ ├── nsa │ │ │ ├── __init__.py │ │ │ ├── compression.py │ │ │ ├── naive.py │ │ │ ├── parallel.py │ │ │ └── utils.py │ │ ├── path_attn │ │ │ ├── __init__.py │ │ │ ├── cumprod_householder_bwd.py │ │ │ ├── cumprod_householder_fwd.py │ │ │ ├── intra_chunk_preprocess_bwd.py │ │ │ ├── intra_chunk_preprocess_bwd_prepare.py │ │ │ ├── intra_chunk_preprocess_fwd.py │ │ │ ├── parallel.py │ │ │ ├── parallel_path_bwd_inter_dkv.py │ │ │ ├── parallel_path_bwd_inter_dqh.py │ │ │ ├── parallel_path_bwd_intra.py │ │ │ ├── parallel_path_fwd.py │ │ │ ├── prepare_k_cache.py │ │ │ └── transform_q.py │ │ ├── rebased │ │ │ ├── __init__.py │ │ │ ├── naive.py │ │ │ └── parallel.py │ │ ├── retention │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── naive.py │ │ │ └── parallel.py │ │ ├── rwkv4 │ │ │ ├── __init__.py │ │ │ └── fused_recurrent.py │ │ ├── rwkv6 │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── chunk_naive.py │ │ │ ├── fused_recurrent.py │ │ │ └── recurrent_naive.py │ │ ├── rwkv7 │ │ │ ├── RWKV7(Goose).md │ │ │ ├── __init__.py │ │ │ ├── channel_mixing.py │ │ │ ├── chunk.py │ │ │ ├── fused_addcmul.py │ │ │ ├── fused_k_update.py │ │ │ ├── fused_recurrent.py │ │ │ └── gate_output_correction.py │ │ ├── simple_gla │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ ├── fused_recurrent.py │ │ │ ├── naive.py │ │ │ └── parallel.py │ │ ├── titans │ │ │ ├── __init__.py │ │ │ ├── log_impl.py │ │ │ └── naive.py │ │ ├── ttt │ │ │ ├── __init__.py │ │ │ ├── chunk.py │ │ │ ├── fused_chunk.py │ │ │ └── naive.py │ │ └── utils │ │ │ ├── __init__.py │ │ │ ├── asm.py │ │ │ ├── constant.py │ │ │ ├── cumsum.py │ │ │ ├── index.py │ │ │ ├── logcumsumexp.py │ │ │ ├── logsumexp.py │ │ │ ├── matmul.py │ │ │ ├── op.py │ │ │ ├── pack.py │ │ │ ├── pooling.py │ │ │ ├── softmax.py │ │ │ └── solve_tril.py │ └── utils.py ├── kubectl ├── nsa │ ├── compression.py │ ├── nsa.py │ ├── ops │ │ ├── __init__.py │ │ ├── naive.py │ │ ├── parallel.py │ │ └── utils.py │ └── selection.py ├── requirements.txt ├── requirements │ ├── docs.txt │ ├── eval.txt │ ├── framework.txt │ ├── install_all.sh │ ├── swanlab.txt │ └── tests.txt ├── scripts │ ├── benchmark │ │ ├── config │ │ │ └── tuner.json │ │ ├── exp.py │ │ ├── exp_utils.py │ │ └── generate_report.py │ ├── inference │ │ └── keye.py │ └── utils │ │ ├── plot_loss.py │ │ ├── run_dataset_info.py │ │ ├── run_model_info.py │ │ ├── run_template.py │ │ └── test_link_valid.py ├── setup.cfg ├── setup.py ├── swift │ ├── __init__.py │ ├── cli │ │ ├── __init__.py │ │ ├── _megatron │ │ │ ├── __init__.py │ │ │ ├── main.py │ │ │ ├── pt.py │ │ │ ├── rlhf.py │ │ │ └── sft.py │ │ ├── app.py │ │ ├── deploy.py │ │ ├── eval.py │ │ ├── export.py │ │ ├── infer.py │ │ ├── main.py │ │ ├── merge_lora.py │ │ ├── pt.py │ │ ├── rlhf.py │ │ ├── rollout.py │ │ ├── sample.py │ │ ├── sft.py │ │ └── web_ui.py │ ├── hub │ │ ├── __init__.py │ │ ├── constant.py │ │ └── hub.py │ ├── llm │ │ ├── __init__.py │ │ ├── app │ │ │ ├── __init__.py │ │ │ ├── app.py │ │ │ ├── build_ui.py │ │ │ └── locale.py │ │ ├── argument │ │ │ ├── __init__.py │ │ │ ├── app_args.py │ │ │ ├── base_args │ │ │ │ ├── __init__.py │ │ │ │ ├── base_args.py │ │ │ │ ├── data_args.py │ │ │ │ ├── generation_args.py │ │ │ │ ├── model_args.py │ │ │ │ ├── quant_args.py │ │ │ │ ├── template_args.py │ │ │ │ └── utils.py │ │ │ ├── deploy_args.py │ │ │ ├── eval_args.py │ │ │ ├── export_args.py │ │ │ ├── infer_args.py │ │ │ ├── merge_args.py │ │ │ ├── rlhf_args.py │ │ │ ├── sampling_args.py │ │ │ ├── train_args.py │ │ │ ├── tuner_args.py │ │ │ └── webui_args.py │ │ ├── base.py │ │ ├── data_loader.py │ │ ├── dataset │ │ │ ├── __init__.py │ │ │ ├── data │ │ │ │ └── dataset_info.json │ │ │ ├── dataset │ │ │ │ ├── __init__.py │ │ │ │ ├── llm.py │ │ │ │ └── mllm.py │ │ │ ├── indexed_dataset.py │ │ │ ├── loader.py │ │ │ ├── media.py │ │ │ ├── preprocessor │ │ │ │ ├── __init__.py │ │ │ │ ├── core.py │ │ │ │ └── extra.py │ │ │ ├── register.py │ │ │ └── utils.py │ │ ├── ds_config │ │ │ ├── zero0.json │ │ │ ├── zero1.json │ │ │ ├── zero2.json │ │ │ ├── zero2_offload.json │ │ │ ├── zero3.json │ │ │ └── zero3_offload.json │ │ ├── eval │ │ │ ├── __init__.py │ │ │ ├── eval.py │ │ │ └── utils.py │ │ ├── export │ │ │ ├── __init__.py │ │ │ ├── cached_dataset.py │ │ │ ├── export.py │ │ │ ├── merge_lora.py │ │ │ ├── ollama.py │ │ │ └── quant.py │ │ ├── infer │ │ │ ├── __init__.py │ │ │ ├── deploy.py │ │ │ ├── infer.py │ │ │ ├── infer_engine │ │ │ │ ├── __init__.py │ │ │ │ ├── base.py │ │ │ │ ├── grpo_vllm_engine.py │ │ │ │ ├── infer_client.py │ │ │ │ ├── infer_engine.py │ │ │ │ ├── lmdeploy_engine.py │ │ │ │ ├── patch.py │ │ │ │ ├── pt_engine.py │ │ │ │ ├── sglang_engine.py │ │ │ │ ├── utils.py │ │ │ │ └── vllm_engine.py │ │ │ ├── protocol.py │ │ │ ├── rollout.py │ │ │ └── utils.py │ │ ├── model │ │ │ ├── __init__.py │ │ │ ├── constant.py │ │ │ ├── model │ │ │ │ ├── __init__.py │ │ │ │ ├── baai.py │ │ │ │ ├── baichuan.py │ │ │ │ ├── baidu.py │ │ │ │ ├── bert.py │ │ │ │ ├── codefuse.py │ │ │ │ ├── deepseek.py │ │ │ │ ├── gemma.py │ │ │ │ ├── glm.py │ │ │ │ ├── internlm.py │ │ │ │ ├── llama.py │ │ │ │ ├── llava.py │ │ │ │ ├── llm.py │ │ │ │ ├── mamba.py │ │ │ │ ├── microsoft.py │ │ │ │ ├── minicpm.py │ │ │ │ ├── minimax.py │ │ │ │ ├── mistral.py │ │ │ │ ├── mllm.py │ │ │ │ ├── moonshot.py │ │ │ │ ├── mplug.py │ │ │ │ ├── openbuddy.py │ │ │ │ ├── qwen.py │ │ │ │ ├── qwen25_vl │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── configuration_qwen2_5_vl.py │ │ │ │ │ ├── modeling │ │ │ │ │ │ ├── flex_attention.py │ │ │ │ │ │ ├── initial.py │ │ │ │ │ │ ├── last_layer.py │ │ │ │ │ │ ├── modeling_flash_attention_utils.py │ │ │ │ │ │ ├── modeling_rope_utils.py │ │ │ │ │ │ ├── npu_flash_attention.py │ │ │ │ │ │ └── utils │ │ │ │ │ │ │ ├── args_doc.py │ │ │ │ │ │ │ ├── doc.py │ │ │ │ │ │ │ ├── generic.py │ │ │ │ │ │ │ ├── import_utils.py │ │ │ │ │ │ │ └── logging.py │ │ │ │ │ ├── modeling_qwen2_5_vl.py │ │ │ │ │ └── processing_qwen2_5_vl.py │ │ │ │ ├── skywork.py │ │ │ │ ├── stepfun.py │ │ │ │ ├── telechat.py │ │ │ │ ├── valley.py │ │ │ │ ├── videonsa.py │ │ │ │ └── yi.py │ │ │ ├── model_arch.py │ │ │ ├── patcher.py │ │ │ ├── register.py │ │ │ └── utils.py │ │ ├── sampling │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ ├── distill_sampler.py │ │ │ ├── mcts.py │ │ │ ├── sampling.py │ │ │ ├── utils.py │ │ │ └── vanilla_sampler.py │ │ ├── template │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ ├── constant.py │ │ │ ├── grounding.py │ │ │ ├── register.py │ │ │ ├── template │ │ │ │ ├── __init__.py │ │ │ │ ├── baidu.py │ │ │ │ ├── bert.py │ │ │ │ ├── deepseek.py │ │ │ │ ├── emu3.py │ │ │ │ ├── gemma.py │ │ │ │ ├── glm.py │ │ │ │ ├── idefics3.py │ │ │ │ ├── internlm.py │ │ │ │ ├── internvl.py │ │ │ │ ├── kwai.py │ │ │ │ ├── llama.py │ │ │ │ ├── llava.py │ │ │ │ ├── llm.py │ │ │ │ ├── megrez.py │ │ │ │ ├── microsoft.py │ │ │ │ ├── minicpm.py │ │ │ │ ├── minimax.py │ │ │ │ ├── mistral.py │ │ │ │ ├── molmo.py │ │ │ │ ├── moonshot.py │ │ │ │ ├── mplug.py │ │ │ │ ├── openbuddy.py │ │ │ │ ├── pixtral.py │ │ │ │ ├── qwen.py │ │ │ │ ├── stepfun.py │ │ │ │ ├── utils.py │ │ │ │ ├── valley.py │ │ │ │ └── yi.py │ │ │ ├── template_inputs.py │ │ │ ├── template_meta.py │ │ │ ├── utils.py │ │ │ └── vision_utils.py │ │ ├── train │ │ │ ├── __init__.py │ │ │ ├── callback.py │ │ │ ├── kto.py │ │ │ ├── pt.py │ │ │ ├── rlhf.py │ │ │ ├── sft.py │ │ │ └── tuner.py │ │ └── utils.py │ ├── megatron │ │ ├── __init__.py │ │ ├── argument │ │ │ ├── __init__.py │ │ │ ├── megatron_args.py │ │ │ ├── rlhf_args.py │ │ │ └── train_args.py │ │ ├── init.py │ │ ├── model │ │ │ ├── __init__.py │ │ │ ├── config.py │ │ │ ├── constant.py │ │ │ ├── gpt │ │ │ │ ├── __init__.py │ │ │ │ ├── config.py │ │ │ │ ├── hf2mcore.py │ │ │ │ ├── mcore2hf.py │ │ │ │ └── model.py │ │ │ ├── gpt_model.py │ │ │ ├── register.py │ │ │ └── rope.py │ │ ├── train │ │ │ ├── __init__.py │ │ │ ├── pt.py │ │ │ ├── rlhf.py │ │ │ ├── sft.py │ │ │ └── utils.py │ │ ├── trainers │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ ├── dpo_trainer.py │ │ │ ├── trainer.py │ │ │ └── utils.py │ │ ├── tuners │ │ │ ├── __init__.py │ │ │ └── lora.py │ │ └── utils │ │ │ ├── __init__.py │ │ │ ├── convert.py │ │ │ ├── patcher.py │ │ │ └── utils.py │ ├── plugin │ │ ├── __init__.py │ │ ├── agent_template │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ ├── extra.py │ │ │ ├── glm4.py │ │ │ ├── hermes.py │ │ │ ├── llama.py │ │ │ ├── mistral.py │ │ │ ├── qwen.py │ │ │ ├── react.py │ │ │ └── toolbench.py │ │ ├── callback.py │ │ ├── context_manager.py │ │ ├── env.py │ │ ├── loss.py │ │ ├── loss_scale │ │ │ ├── __init__.py │ │ │ ├── config │ │ │ │ ├── agentflan.json │ │ │ │ ├── alpha_umi.json │ │ │ │ ├── hermes.json │ │ │ │ ├── ignore_empty_think.json │ │ │ │ ├── qwen.json │ │ │ │ └── react.json │ │ │ ├── loss_scale.py │ │ │ └── utils.py │ │ ├── metric.py │ │ ├── multi_turn.py │ │ ├── optimizer.py │ │ ├── orm.py │ │ ├── prm.py │ │ ├── rm_plugin.py │ │ └── tuner.py │ ├── trainers │ │ ├── __init__.py │ │ ├── arguments.py │ │ ├── callback.py │ │ ├── mixin.py │ │ ├── optimizers │ │ │ ├── __init__.py │ │ │ └── galore │ │ │ │ ├── __init__.py │ │ │ │ ├── adafactor.py │ │ │ │ ├── adamw.py │ │ │ │ ├── adamw8bit.py │ │ │ │ ├── galore_projector.py │ │ │ │ └── utils.py │ │ ├── rlhf_arguments.py │ │ ├── rlhf_trainer │ │ │ ├── __init__.py │ │ │ ├── cpo_trainer.py │ │ │ ├── dpo_trainer.py │ │ │ ├── gkd_trainer.py │ │ │ ├── grpo_trainer.py │ │ │ ├── kto_trainer.py │ │ │ ├── orpo_trainer.py │ │ │ ├── ppo_trainer.py │ │ │ ├── reward_trainer.py │ │ │ ├── rlhf_mixin.py │ │ │ ├── utils.py │ │ │ └── vllm_client.py │ │ ├── sequence_parallel │ │ │ ├── __init__.py │ │ │ ├── base.py │ │ │ ├── ring_attention.py │ │ │ ├── ulysses.py │ │ │ └── utils.py │ │ ├── trainer_factory.py │ │ ├── trainers.py │ │ └── utils.py │ ├── tuners │ │ ├── __init__.py │ │ ├── adapter.py │ │ ├── base.py │ │ ├── llamapro.py │ │ ├── longlora │ │ │ ├── __init__.py │ │ │ ├── llama.py │ │ │ └── longlora.py │ │ ├── lora.py │ │ ├── lora_layers.py │ │ ├── mapping.py │ │ ├── neftune.py │ │ ├── part.py │ │ ├── peft.py │ │ ├── prompt.py │ │ ├── reft.py │ │ ├── restuning.py │ │ ├── restuning_components.py │ │ ├── scetuning │ │ │ ├── __init__.py │ │ │ ├── scetuning.py │ │ │ └── scetuning_components.py │ │ ├── side.py │ │ └── utils.py │ ├── ui │ │ ├── __init__.py │ │ ├── app.py │ │ ├── base.py │ │ ├── llm_eval │ │ │ ├── __init__.py │ │ │ ├── eval.py │ │ │ ├── llm_eval.py │ │ │ ├── model.py │ │ │ └── runtime.py │ │ ├── llm_export │ │ │ ├── __init__.py │ │ │ ├── export.py │ │ │ ├── llm_export.py │ │ │ ├── model.py │ │ │ └── runtime.py │ │ ├── llm_grpo │ │ │ ├── __init__.py │ │ │ ├── advanced.py │ │ │ ├── dataset.py │ │ │ ├── external_rollout.py │ │ │ ├── external_runtime.py │ │ │ ├── grpo_advanced.py │ │ │ ├── hyper.py │ │ │ ├── llm_grpo.py │ │ │ ├── lora.py │ │ │ ├── model.py │ │ │ ├── optimizer.py │ │ │ ├── quantization.py │ │ │ ├── report_to.py │ │ │ ├── reward.py │ │ │ ├── rollout.py │ │ │ ├── runtime.py │ │ │ ├── save.py │ │ │ ├── target.py │ │ │ └── tuner.py │ │ ├── llm_infer │ │ │ ├── __init__.py │ │ │ ├── generate.py │ │ │ ├── llm_infer.py │ │ │ ├── model.py │ │ │ └── runtime.py │ │ ├── llm_rlhf │ │ │ ├── __init__.py │ │ │ ├── advanced.py │ │ │ ├── dataset.py │ │ │ ├── hyper.py │ │ │ ├── llm_rlhf.py │ │ │ ├── lora.py │ │ │ ├── model.py │ │ │ ├── optimizer.py │ │ │ ├── quantization.py │ │ │ ├── report_to.py │ │ │ ├── rlhf.py │ │ │ ├── runtime.py │ │ │ ├── save.py │ │ │ ├── target.py │ │ │ └── tuner.py │ │ ├── llm_sample │ │ │ ├── __init__.py │ │ │ ├── llm_sample.py │ │ │ ├── model.py │ │ │ ├── runtime.py │ │ │ └── sample.py │ │ └── llm_train │ │ │ ├── __init__.py │ │ │ ├── advanced.py │ │ │ ├── dataset.py │ │ │ ├── hyper.py │ │ │ ├── llm_train.py │ │ │ ├── lora.py │ │ │ ├── model.py │ │ │ ├── optimizer.py │ │ │ ├── quantization.py │ │ │ ├── report_to.py │ │ │ ├── runtime.py │ │ │ ├── save.py │ │ │ ├── self_cog.py │ │ │ ├── target.py │ │ │ ├── task.py │ │ │ ├── tuner.py │ │ │ └── utils.py │ ├── utils │ │ ├── __init__.py │ │ ├── constants.py │ │ ├── env.py │ │ ├── import_utils.py │ │ ├── io_utils.py │ │ ├── logger.py │ │ ├── np_utils.py │ │ ├── tb_utils.py │ │ ├── torch_utils.py │ │ └── utils.py │ └── version.py └── tests │ ├── __init__.py │ ├── app │ └── test_app.py │ ├── deploy │ ├── test_dataset.py │ └── test_logprobs.py │ ├── eval │ └── test_eval.py │ ├── export │ └── test_quant.py │ ├── general │ ├── test_arch.py │ ├── test_dataset.py │ ├── test_model.py │ ├── test_stream.py │ └── test_template.py │ ├── hub │ ├── __init__.py │ └── test_check_model.py │ ├── infer │ ├── test_agent.py │ ├── test_infer.py │ ├── test_logprobs.py │ ├── test_main.py │ ├── test_max_memory.py │ ├── test_mllm.py │ └── test_sglang.py │ ├── llm │ ├── __init__.py │ ├── config │ │ ├── infer.json │ │ └── sft.json │ ├── data │ │ ├── alpaca.csv │ │ ├── alpaca.jsonl │ │ ├── alpaca2.csv │ │ ├── chatml.jsonl │ │ ├── conversations.jsonl │ │ ├── multi_modal_1.jsonl │ │ ├── multi_modal_2.jsonl │ │ ├── multi_modal_3.jsonl │ │ ├── sharegpt.jsonl │ │ ├── swift_multi.json │ │ ├── swift_multi.jsonl │ │ ├── swift_pre.csv │ │ ├── swift_pre.jsonl │ │ ├── swift_single.csv │ │ └── swift_single.jsonl │ ├── load_model.py │ ├── load_template.py │ ├── test_custom.py │ ├── test_dataset.py │ ├── test_ollama_export.py │ ├── test_run.py │ ├── test_run3.py │ ├── test_template.py │ ├── test_utils.py │ └── test_web_ui.py │ ├── megatron │ ├── test_align │ │ └── test_llm.py │ ├── test_export.py │ ├── test_lora.py │ ├── test_model.py │ ├── test_rlhf.py │ ├── test_save.py │ └── test_train.py │ ├── model_tag.py │ ├── models │ ├── test_flash_attn.py │ ├── test_llm.py │ └── test_mllm.py │ ├── run.py │ ├── run_config.yaml │ ├── sample │ └── test_client.py │ ├── test_align │ ├── test_cls.py │ ├── test_lmdeploy_vlm.py │ ├── test_padding_side.py │ ├── test_rlhf_loss.py │ ├── test_template │ │ ├── test_agent.py │ │ ├── test_audio.py │ │ ├── test_gene.py │ │ ├── test_llm.py │ │ ├── test_template.py │ │ ├── test_tool.py │ │ ├── test_video.py │ │ └── test_vision.py │ └── test_vllm_vlm.py │ ├── test_utils.py │ ├── train │ ├── test_channel.py │ ├── test_cls.py │ ├── test_embedding.py │ ├── test_export_cached_dataset.py │ ├── test_freeze.py │ ├── test_gkd.py │ ├── test_grounding.py │ ├── test_grpo.py │ ├── test_kto.py │ ├── test_liger.py │ ├── test_multilabel.py │ ├── test_packing.py │ ├── test_ppo.py │ ├── test_pt.py │ ├── test_resume_from_checkpoint.py │ ├── test_rlhf.py │ ├── test_sample.py │ ├── test_sft.py │ ├── test_train_eval.py │ └── test_vit_lr.py │ ├── tuners │ ├── __init__.py │ ├── test_extra_state_dict.py │ ├── test_merged_linear.py │ ├── test_neft.py │ ├── test_peft.py │ ├── test_scetuning.py │ ├── test_swift_base.py │ ├── test_swift_device_map.py │ └── test_swift_restuning.py │ └── utils │ ├── __init__.py │ ├── test_file_utils.py │ ├── test_io_utils.py │ ├── test_split_str_parts_by.py │ └── test_torch_utils.py └── scrips ├── baselines.sh ├── eval.sh └── train.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/README.md -------------------------------------------------------------------------------- /assets/teaser.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/assets/teaser.png -------------------------------------------------------------------------------- /lmms-eval/CLAUDE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/CLAUDE.md -------------------------------------------------------------------------------- /lmms-eval/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/LICENSE -------------------------------------------------------------------------------- /lmms-eval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/README.md -------------------------------------------------------------------------------- /lmms-eval/docs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/README.md -------------------------------------------------------------------------------- /lmms-eval/docs/commands.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/commands.md -------------------------------------------------------------------------------- /lmms-eval/docs/current_tasks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/current_tasks.md -------------------------------------------------------------------------------- /lmms-eval/docs/lmms-eval-0.3.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/lmms-eval-0.3.md -------------------------------------------------------------------------------- /lmms-eval/docs/lmms-eval-0.4.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/lmms-eval-0.4.md -------------------------------------------------------------------------------- /lmms-eval/docs/model_guide.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/model_guide.md -------------------------------------------------------------------------------- /lmms-eval/docs/run_examples.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/run_examples.md -------------------------------------------------------------------------------- /lmms-eval/docs/task_guide.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/task_guide.md -------------------------------------------------------------------------------- /lmms-eval/docs/throughput_metrics.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/docs/throughput_metrics.md -------------------------------------------------------------------------------- /lmms-eval/examples/models/aero_1_audio.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/aero_1_audio.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/aria.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/aria.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/auroracap.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/auroracap.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/claude.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/claude.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/idefics2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/idefics2.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/instructblip.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/instructblip.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/internvl1.5.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/internvl1.5.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/internvl2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/internvl2.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/llama_vid.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/llama_vid.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/llama_vision.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/llama_vision.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/llava_1_5.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/llava_1_5.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/llava_next.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/llava_next.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/llava_video.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/llava_video.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/movie_chat.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/movie_chat.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/mplug_owl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/mplug_owl.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/plm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/plm.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/qwen25vl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/qwen25vl.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/qwen2vl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/qwen2vl.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/sglang.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/sglang.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/slime.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/slime.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/tinyllava.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/tinyllava.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/video_llava.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/video_llava.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/vllm_qwen2vl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/vllm_qwen2vl.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/xai_grok.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/xai_grok.sh -------------------------------------------------------------------------------- /lmms-eval/examples/models/xcomposer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/examples/models/xcomposer.sh -------------------------------------------------------------------------------- /lmms-eval/fla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/abc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/abc.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/attn.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/based.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/based.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/bitattn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/bitattn.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/comba.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/comba.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/delta_net.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/delta_net.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/forgetting_attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/forgetting_attn.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/gated_deltanet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/gated_deltanet.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/gla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/gla.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/gsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/gsa.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/hgrn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/hgrn.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/hgrn2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/hgrn2.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/lightnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/lightnet.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/linear_attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/linear_attn.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/mamba.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/mamba.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/mamba2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/mamba2.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/mesa_net.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/mesa_net.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/mla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/mla.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/nsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/nsa.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/path_attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/path_attn.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/rebased.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/rebased.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/rodimus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/rodimus.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/rwkv6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/rwkv6.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/rwkv7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/rwkv7.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/simple_gla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/simple_gla.py -------------------------------------------------------------------------------- /lmms-eval/fla/layers/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/layers/utils.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/abc/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/abc/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/abc/modeling_abc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/abc/modeling_abc.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/bitnet/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/bitnet/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/comba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/comba/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/gla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/gla/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/gla/modeling_gla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/gla/modeling_gla.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/gsa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/gsa/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/gsa/modeling_gsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/gsa/modeling_gsa.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/hgrn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/hgrn/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/hgrn2/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/hgrn2/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/lightnet/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/lightnet/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/mamba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/mamba/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/mamba2/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/mamba2/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/mesa_net/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/mesa_net/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/mla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/mla/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/mla/modeling_mla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/mla/modeling_mla.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/nsa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/nsa/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/nsa/modeling_nsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/nsa/modeling_nsa.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/retnet/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/retnet/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/rodimus/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/rodimus/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/rwkv6/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/rwkv6/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/rwkv7/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/rwkv7/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/samba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/samba/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/models/utils.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/activations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/activations.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/convolution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/convolution.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/feature_map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/feature_map.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/fused_bitlinear.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/fused_bitlinear.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/fused_kl_div.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/fused_kl_div.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/fused_norm_gate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/fused_norm_gate.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/grpo.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/l2norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/l2norm.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/l2warp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/l2warp.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/layernorm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/layernorm.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/layernorm_gated.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/layernorm_gated.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/mlp.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/rotary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/rotary.py -------------------------------------------------------------------------------- /lmms-eval/fla/modules/token_shift.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/modules/token_shift.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/abc/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/abc/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/abc/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/abc/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/abc/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/abc/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/attn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/attn/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/attn/decoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/attn/decoding.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/attn/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/attn/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/based/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/based/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/based/fused_chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/based/fused_chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/based/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/based/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/based/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/based/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/comba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/comba/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/comba/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/comba/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/comba/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/comba/utils.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/comba/wy_fast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/comba/wy_fast.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/common/__init__.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | -------------------------------------------------------------------------------- /lmms-eval/fla/ops/common/chunk_delta_h.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/common/chunk_delta_h.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/common/chunk_h.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/common/chunk_h.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/common/chunk_h_split.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/common/chunk_h_split.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/common/chunk_o.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/common/chunk_o.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/common/fused_chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/common/fused_chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/delta_rule/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/delta_rule/README.md -------------------------------------------------------------------------------- /lmms-eval/fla/ops/delta_rule/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/delta_rule/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/delta_rule/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/delta_rule/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/delta_rule/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/delta_rule/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/delta_rule/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/delta_rule/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/delta_rule/wy_fast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/delta_rule/wy_fast.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gla/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gla/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gla/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gla/fused_chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gla/fused_chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gla/fused_recurrent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gla/fused_recurrent.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gla/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gla/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gsa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gsa/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gsa/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gsa/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gsa/fused_recurrent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gsa/fused_recurrent.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/gsa/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/gsa/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/hgrn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/hgrn/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/hgrn/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/hgrn/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/hgrn/fused_recurrent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/hgrn/fused_recurrent.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/hgrn/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/hgrn/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/lightning_attn/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/lightning_attn/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/linear_attn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/linear_attn/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/linear_attn/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/linear_attn/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/linear_attn/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/linear_attn/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/linear_attn/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/linear_attn/utils.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/mesa_net/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/mesa_net/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/mesa_net/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/mesa_net/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/mesa_net/chunk_h_fwd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/mesa_net/chunk_h_fwd.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/mesa_net/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/mesa_net/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/nsa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/nsa/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/nsa/compression.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/nsa/compression.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/nsa/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/nsa/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/nsa/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/nsa/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/nsa/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/nsa/utils.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/path_attn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/path_attn/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/path_attn/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/path_attn/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rebased/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rebased/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rebased/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rebased/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rebased/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rebased/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/retention/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/retention/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/retention/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/retention/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/retention/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/retention/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/retention/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/retention/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv4/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv4/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv6/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv6/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv6/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv6/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv6/chunk_naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv6/chunk_naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv7/RWKV7(Goose).md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv7/RWKV7(Goose).md -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv7/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv7/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv7/channel_mixing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv7/channel_mixing.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv7/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv7/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv7/fused_addcmul.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv7/fused_addcmul.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/rwkv7/fused_k_update.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/rwkv7/fused_k_update.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/simple_gla/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/simple_gla/README.md -------------------------------------------------------------------------------- /lmms-eval/fla/ops/simple_gla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/simple_gla/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/simple_gla/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/simple_gla/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/simple_gla/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/simple_gla/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/simple_gla/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/simple_gla/parallel.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/titans/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/titans/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/titans/log_impl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/titans/log_impl.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/titans/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/titans/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/ttt/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/ttt/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/ttt/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/ttt/chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/ttt/fused_chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/ttt/fused_chunk.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/ttt/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/ttt/naive.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/__init__.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/asm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/asm.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/constant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/constant.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/cumsum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/cumsum.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/index.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/logcumsumexp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/logcumsumexp.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/logsumexp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/logsumexp.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/matmul.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/matmul.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/op.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/op.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/pack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/pack.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/pooling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/pooling.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/softmax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/softmax.py -------------------------------------------------------------------------------- /lmms-eval/fla/ops/utils/solve_tril.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/ops/utils/solve_tril.py -------------------------------------------------------------------------------- /lmms-eval/fla/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/fla/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/__main__.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/filter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/api/filter.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/group.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/api/group.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/instance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/api/instance.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/api/metrics.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/api/model.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/api/registry.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/samplers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/api/samplers.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/api/task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/api/task.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/caching/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/caching/cache.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/caching/cache.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/evaluator.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/evaluator_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/evaluator_utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/filters/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/filters/__init__.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/filters/extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/filters/extraction.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/filters/selection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/filters/selection.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/llm_judge/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/llm_judge/__init__.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/llm_judge/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/llm_judge/base.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/llm_judge/factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/llm_judge/factory.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/llm_judge/prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/llm_judge/prompt.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/llm_judge/protocol.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/llm_judge/protocol.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/llm_judge/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/llm_judge/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/loggers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/loggers/__init__.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/loggers/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/loggers/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/logging_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/logging_utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/mcp/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/mcp/__init__.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/mcp/client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/mcp/client.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/__init__.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/chat/sglang.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/chat/sglang.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/chat/vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/chat/vllm.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/model_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/aero.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/aero.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/aria.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/aria.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/fuyu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/fuyu.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/ola.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/ola.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/oryx.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/oryx.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/plm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/plm.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/reka.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/reka.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/ross.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/ross.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/vila.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/vila.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/vita.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/vita.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/vllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/vllm.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/models/simple/vora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/models/simple/vora.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/protocol.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/protocol.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/__init__.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/_task_utils/gpt_eval_utils.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/ai2d/ai2d.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/ai2d/ai2d.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/ai2d/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/ai2d/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/aime/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/aime/README.md -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/aime/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/aime/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/arc/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/arc/README.md -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/cmmmu/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/cmmmu/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/cuva/cuva.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/cuva/cuva.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/cuva/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/cuva/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/cvrr/_cvrr.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/cvrr/_cvrr.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/cvrr/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/cvrr/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/docvqa/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/docvqa/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/emma/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/emma/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/ferret/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/ferret/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/fleurs/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/fleurs/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/funqa/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/funqa/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/gpqa/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/gpqa/README.md -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/gqa/gqa.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/gqa/gqa.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/gqa/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/gqa/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/gqa_ru/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/gqa_ru/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/gsm8k/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/gsm8k/README.md -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/iconqa/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/iconqa/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/ifeval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/ifeval/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/jmmmu/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/jmmmu/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/k12/k12.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/k12/k12.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/k12/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/k12/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mirb/mirb.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mirb/mirb.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mirb/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mirb/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mlvu/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mlvu/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmau/mmau.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mmau/mmau.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmau/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mmau/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mme/mme.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mme/mme.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mme/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mme/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmmu/arial.ttf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mmmu/arial.ttf -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmmu/mmmu.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mmmu/mmmu.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmmu/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mmmu/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmsearch/retrieve_content/tokenization/__init__.py: -------------------------------------------------------------------------------- 1 | # Implement your code here. 2 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmstar/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mmstar/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmt/mmt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mmt/mmt.yaml -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/mmt/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/mmt/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/multilingual-llava-bench-in-the-wild/README.md: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/ocrbench_v2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/ocrbench_v2/spotting_eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/vdc/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/tasks/vdc/utils.py -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/tasks/vstar_bench/__init__.py: -------------------------------------------------------------------------------- 1 | # V* Benchmark: Guided Visual Search as a Core Mechanism in Multimodal LLMs 2 | -------------------------------------------------------------------------------- /lmms-eval/lmms_eval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/lmms_eval/utils.py -------------------------------------------------------------------------------- /lmms-eval/miscs/example_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/miscs/example_eval.yaml -------------------------------------------------------------------------------- /lmms-eval/miscs/llava_result_check.md: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/miscs/llava_sglang_result_check.md: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/miscs/repr_torch_envs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/miscs/repr_torch_envs.txt -------------------------------------------------------------------------------- /lmms-eval/miscs/scienceqa_id.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/miscs/scienceqa_id.txt -------------------------------------------------------------------------------- /lmms-eval/miscs/script.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/miscs/script.sh -------------------------------------------------------------------------------- /lmms-eval/miscs/test_llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/miscs/test_llava.py -------------------------------------------------------------------------------- /lmms-eval/miscs/test_scienceqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/miscs/test_scienceqa.py -------------------------------------------------------------------------------- /lmms-eval/plotly.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/plotly.min.js -------------------------------------------------------------------------------- /lmms-eval/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/pyproject.toml -------------------------------------------------------------------------------- /lmms-eval/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/setup.py -------------------------------------------------------------------------------- /lmms-eval/tools/get_split_zip.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/tools/get_split_zip.py -------------------------------------------------------------------------------- /lmms-eval/tools/get_video_avg_time.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/tools/get_video_avg_time.py -------------------------------------------------------------------------------- /lmms-eval/tools/lite/embed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/tools/lite/embed.py -------------------------------------------------------------------------------- /lmms-eval/tools/lite/shrink.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/tools/lite/shrink.py -------------------------------------------------------------------------------- /lmms-eval/tools/live_bench/live_bench/data_generator/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /lmms-eval/tools/live_bench/live_bench/driver/.gitignore: -------------------------------------------------------------------------------- 1 | extensions/ 2 | -------------------------------------------------------------------------------- /lmms-eval/tools/live_bench/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/tools/live_bench/setup.py -------------------------------------------------------------------------------- /lmms-eval/tools/make_vatex.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/tools/make_vatex.py -------------------------------------------------------------------------------- /lmms-eval/tools/makecvrr.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/tools/makecvrr.ipynb -------------------------------------------------------------------------------- /lmms-eval/tools/regression.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/tools/regression.py -------------------------------------------------------------------------------- /lmms-eval/uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/lmms-eval/uv.lock -------------------------------------------------------------------------------- /ms-swift/.dev_scripts/build_docs.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/.dev_scripts/build_docs.sh -------------------------------------------------------------------------------- /ms-swift/.dev_scripts/dockerci.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/.dev_scripts/dockerci.sh -------------------------------------------------------------------------------- /ms-swift/.github/SECURITY.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/.github/SECURITY.md -------------------------------------------------------------------------------- /ms-swift/.github/workflows/citest.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/.github/workflows/citest.yaml -------------------------------------------------------------------------------- /ms-swift/.github/workflows/lint.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/.github/workflows/lint.yaml -------------------------------------------------------------------------------- /ms-swift/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/.gitignore -------------------------------------------------------------------------------- /ms-swift/.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/.pre-commit-config.yaml -------------------------------------------------------------------------------- /ms-swift/.pre-commit-config_local.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/.pre-commit-config_local.yaml -------------------------------------------------------------------------------- /ms-swift/CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /ms-swift/CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/CONTRIBUTING.md -------------------------------------------------------------------------------- /ms-swift/CONTRIBUTING_CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/CONTRIBUTING_CN.md -------------------------------------------------------------------------------- /ms-swift/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/LICENSE -------------------------------------------------------------------------------- /ms-swift/MANIFEST.in: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/MANIFEST.in -------------------------------------------------------------------------------- /ms-swift/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/Makefile -------------------------------------------------------------------------------- /ms-swift/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/README.md -------------------------------------------------------------------------------- /ms-swift/README_CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/README_CN.md -------------------------------------------------------------------------------- /ms-swift/asset/banner.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/asset/banner.png -------------------------------------------------------------------------------- /ms-swift/asset/ding.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/asset/ding.png -------------------------------------------------------------------------------- /ms-swift/asset/discord_qr.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/asset/discord_qr.jpg -------------------------------------------------------------------------------- /ms-swift/asset/wechat.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/asset/wechat.png -------------------------------------------------------------------------------- /ms-swift/asset/wechat_grpo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/asset/wechat_grpo.png -------------------------------------------------------------------------------- /ms-swift/asset/wechat_megatron.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/asset/wechat_megatron.png -------------------------------------------------------------------------------- /ms-swift/docs/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/Makefile -------------------------------------------------------------------------------- /ms-swift/docs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/README.md -------------------------------------------------------------------------------- /ms-swift/docs/make.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/make.bat -------------------------------------------------------------------------------- /ms-swift/docs/resources/deepeyes.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/deepeyes.png -------------------------------------------------------------------------------- /ms-swift/docs/resources/dpo_data.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/dpo_data.png -------------------------------------------------------------------------------- /ms-swift/docs/resources/grpo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/grpo.png -------------------------------------------------------------------------------- /ms-swift/docs/resources/grpo_code.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/grpo_code.png -------------------------------------------------------------------------------- /ms-swift/docs/resources/grpo_geoqa.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/grpo_geoqa.png -------------------------------------------------------------------------------- /ms-swift/docs/resources/gym_env.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/gym_env.png -------------------------------------------------------------------------------- /ms-swift/docs/resources/kto_data.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/kto_data.png -------------------------------------------------------------------------------- /ms-swift/docs/resources/web-ui-en.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/web-ui-en.jpg -------------------------------------------------------------------------------- /ms-swift/docs/resources/web-ui.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/resources/web-ui.jpg -------------------------------------------------------------------------------- /ms-swift/docs/source/.readthedocs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/source/.readthedocs.yaml -------------------------------------------------------------------------------- /ms-swift/docs/source/Instruction/评测.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/source/Instruction/评测.md -------------------------------------------------------------------------------- /ms-swift/docs/source/Instruction/采样.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/source/Instruction/采样.md -------------------------------------------------------------------------------- /ms-swift/docs/source/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/source/conf.py -------------------------------------------------------------------------------- /ms-swift/docs/source/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/source/index.rst -------------------------------------------------------------------------------- /ms-swift/docs/source_en/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/source_en/conf.py -------------------------------------------------------------------------------- /ms-swift/docs/source_en/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/docs/source_en/index.rst -------------------------------------------------------------------------------- /ms-swift/examples/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/README.md -------------------------------------------------------------------------------- /ms-swift/examples/app/base_url/demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/app/base_url/demo.py -------------------------------------------------------------------------------- /ms-swift/examples/app/base_url/demo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/app/base_url/demo.sh -------------------------------------------------------------------------------- /ms-swift/examples/app/llm/sglang.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/app/llm/sglang.sh -------------------------------------------------------------------------------- /ms-swift/examples/app/llm/vllm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/app/llm/vllm.sh -------------------------------------------------------------------------------- /ms-swift/examples/app/mllm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/app/mllm.sh -------------------------------------------------------------------------------- /ms-swift/examples/custom/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/custom/dataset.py -------------------------------------------------------------------------------- /ms-swift/examples/custom/infer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/custom/infer.sh -------------------------------------------------------------------------------- /ms-swift/examples/custom/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/custom/model.py -------------------------------------------------------------------------------- /ms-swift/examples/custom/model_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/custom/model_hf.py -------------------------------------------------------------------------------- /ms-swift/examples/custom/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/custom/sft.sh -------------------------------------------------------------------------------- /ms-swift/examples/eval/llm/sglang.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/eval/llm/sglang.sh -------------------------------------------------------------------------------- /ms-swift/examples/eval/llm/vllm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/eval/llm/vllm.sh -------------------------------------------------------------------------------- /ms-swift/examples/eval/vlm/eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/eval/vlm/eval.sh -------------------------------------------------------------------------------- /ms-swift/examples/export/merge_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/export/merge_lora.sh -------------------------------------------------------------------------------- /ms-swift/examples/export/ollama.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/export/ollama.sh -------------------------------------------------------------------------------- /ms-swift/examples/infer/cli_demo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/cli_demo.sh -------------------------------------------------------------------------------- /ms-swift/examples/infer/demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/demo.py -------------------------------------------------------------------------------- /ms-swift/examples/infer/demo_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/demo_agent.py -------------------------------------------------------------------------------- /ms-swift/examples/infer/demo_bert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/demo_bert.py -------------------------------------------------------------------------------- /ms-swift/examples/infer/demo_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/demo_hf.py -------------------------------------------------------------------------------- /ms-swift/examples/infer/demo_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/demo_lora.py -------------------------------------------------------------------------------- /ms-swift/examples/infer/demo_mllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/demo_mllm.py -------------------------------------------------------------------------------- /ms-swift/examples/infer/pt/bert.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/pt/bert.sh -------------------------------------------------------------------------------- /ms-swift/examples/infer/pt/lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/pt/lora.sh -------------------------------------------------------------------------------- /ms-swift/examples/infer/pt/prm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/pt/prm.sh -------------------------------------------------------------------------------- /ms-swift/examples/infer/sglang/demo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/sglang/demo.sh -------------------------------------------------------------------------------- /ms-swift/examples/infer/sglang/tp.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/sglang/tp.sh -------------------------------------------------------------------------------- /ms-swift/examples/infer/vllm/dp_tp.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/infer/vllm/dp_tp.sh -------------------------------------------------------------------------------- /ms-swift/examples/sampler/mcts/mcts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/sampler/mcts/mcts.py -------------------------------------------------------------------------------- /ms-swift/examples/sampler/mcts/mcts.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/sampler/mcts/mcts.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/agent/glm4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/agent/glm4.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/full/infer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/full/infer.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/full/train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/full/train.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/infer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/infer.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/liger/sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/liger/sft.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/lora_sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/lora_sft.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/moe/llama4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/moe/llama4.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/packing/llm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/packing/llm.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/qlora/gptq.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/qlora/gptq.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/qlora/hqq.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/qlora/hqq.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/rft/math.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rft/math.json -------------------------------------------------------------------------------- /ms-swift/examples/train/rft/rft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rft/rft.py -------------------------------------------------------------------------------- /ms-swift/examples/train/rlhf/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rlhf/README.md -------------------------------------------------------------------------------- /ms-swift/examples/train/rlhf/cpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rlhf/cpo.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/rlhf/kto.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rlhf/kto.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/rlhf/mpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rlhf/mpo.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/rlhf/orpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rlhf/orpo.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/rlhf/rm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rlhf/rm.sh -------------------------------------------------------------------------------- /ms-swift/examples/train/rlhf/simpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/examples/train/rlhf/simpo.sh -------------------------------------------------------------------------------- /ms-swift/fla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/abc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/abc.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/attn.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/based.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/based.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/bitattn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/bitattn.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/comba.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/comba.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/delta_net.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/delta_net.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/forgetting_attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/forgetting_attn.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/gated_deltanet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/gated_deltanet.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/gla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/gla.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/gsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/gsa.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/hgrn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/hgrn.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/hgrn2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/hgrn2.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/lightnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/lightnet.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/linear_attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/linear_attn.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/mamba.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/mamba.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/mamba2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/mamba2.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/mesa_net.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/mesa_net.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/mla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/mla.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/nsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/nsa.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/path_attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/path_attn.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/rebased.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/rebased.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/rodimus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/rodimus.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/rwkv6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/rwkv6.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/rwkv7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/rwkv7.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/simple_gla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/simple_gla.py -------------------------------------------------------------------------------- /ms-swift/fla/layers/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/layers/utils.py -------------------------------------------------------------------------------- /ms-swift/fla/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/abc/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/abc/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/bitnet/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/bitnet/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/comba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/comba/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/gla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/gla/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/gsa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/gsa/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/hgrn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/hgrn/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/hgrn2/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/hgrn2/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/mamba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/mamba/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/mamba2/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/mamba2/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/mla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/mla/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/nsa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/nsa/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/retnet/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/retnet/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/rwkv6/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/rwkv6/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/rwkv7/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/rwkv7/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/samba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/samba/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/models/utils.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/activations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/activations.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/convolution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/convolution.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/feature_map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/feature_map.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/fused_kl_div.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/fused_kl_div.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/grpo.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/l2norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/l2norm.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/l2warp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/l2warp.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/layernorm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/layernorm.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/mlp.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/parallel.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/rotary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/rotary.py -------------------------------------------------------------------------------- /ms-swift/fla/modules/token_shift.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/modules/token_shift.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/abc/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/abc/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/abc/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/abc/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/abc/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/abc/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/attn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/attn/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/attn/decoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/attn/decoding.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/attn/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/attn/parallel.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/based/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/based/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/based/fused_chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/based/fused_chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/based/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/based/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/based/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/based/parallel.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/comba/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/comba/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/comba/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/comba/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/comba/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/comba/utils.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/comba/wy_fast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/comba/wy_fast.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/common/__init__.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | -------------------------------------------------------------------------------- /ms-swift/fla/ops/common/chunk_h.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/common/chunk_h.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/common/chunk_o.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/common/chunk_o.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/common/fused_chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/common/fused_chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/delta_rule/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/delta_rule/README.md -------------------------------------------------------------------------------- /ms-swift/fla/ops/delta_rule/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/delta_rule/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/delta_rule/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/delta_rule/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/delta_rule/wy_fast.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/delta_rule/wy_fast.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/gla/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/gla/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/gla/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/gla/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/gla/fused_chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/gla/fused_chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/gla/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/gla/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/gsa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/gsa/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/gsa/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/gsa/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/gsa/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/gsa/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/hgrn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/hgrn/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/hgrn/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/hgrn/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/hgrn/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/hgrn/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/linear_attn/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/linear_attn/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/linear_attn/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/linear_attn/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/linear_attn/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/linear_attn/utils.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/mesa_net/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/mesa_net/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/mesa_net/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/mesa_net/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/mesa_net/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/mesa_net/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/nsa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/nsa/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/nsa/compression.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/nsa/compression.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/nsa/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/nsa/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/nsa/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/nsa/parallel.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/nsa/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/nsa/utils.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/path_attn/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/path_attn/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/path_attn/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/path_attn/parallel.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rebased/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rebased/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rebased/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rebased/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rebased/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rebased/parallel.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/retention/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/retention/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/retention/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/retention/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/retention/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/retention/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/retention/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/retention/parallel.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rwkv4/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rwkv4/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rwkv6/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rwkv6/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rwkv6/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rwkv6/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rwkv6/chunk_naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rwkv6/chunk_naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rwkv7/RWKV7(Goose).md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rwkv7/RWKV7(Goose).md -------------------------------------------------------------------------------- /ms-swift/fla/ops/rwkv7/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rwkv7/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/rwkv7/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/rwkv7/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/simple_gla/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/simple_gla/README.md -------------------------------------------------------------------------------- /ms-swift/fla/ops/simple_gla/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/simple_gla/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/simple_gla/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/simple_gla/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/titans/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/titans/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/titans/log_impl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/titans/log_impl.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/titans/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/titans/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/ttt/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/ttt/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/ttt/chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/ttt/chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/ttt/fused_chunk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/ttt/fused_chunk.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/ttt/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/ttt/naive.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/__init__.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/asm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/asm.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/constant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/constant.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/cumsum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/cumsum.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/index.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/index.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/logcumsumexp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/logcumsumexp.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/logsumexp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/logsumexp.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/matmul.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/matmul.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/op.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/op.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/pack.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/pack.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/pooling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/pooling.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/softmax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/softmax.py -------------------------------------------------------------------------------- /ms-swift/fla/ops/utils/solve_tril.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/ops/utils/solve_tril.py -------------------------------------------------------------------------------- /ms-swift/fla/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/fla/utils.py -------------------------------------------------------------------------------- /ms-swift/kubectl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/kubectl -------------------------------------------------------------------------------- /ms-swift/nsa/compression.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/nsa/compression.py -------------------------------------------------------------------------------- /ms-swift/nsa/nsa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/nsa/nsa.py -------------------------------------------------------------------------------- /ms-swift/nsa/ops/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/nsa/ops/__init__.py -------------------------------------------------------------------------------- /ms-swift/nsa/ops/naive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/nsa/ops/naive.py -------------------------------------------------------------------------------- /ms-swift/nsa/ops/parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/nsa/ops/parallel.py -------------------------------------------------------------------------------- /ms-swift/nsa/ops/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/nsa/ops/utils.py -------------------------------------------------------------------------------- /ms-swift/nsa/selection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/nsa/selection.py -------------------------------------------------------------------------------- /ms-swift/requirements.txt: -------------------------------------------------------------------------------- 1 | -r requirements/framework.txt 2 | -------------------------------------------------------------------------------- /ms-swift/requirements/docs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/requirements/docs.txt -------------------------------------------------------------------------------- /ms-swift/requirements/eval.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/requirements/eval.txt -------------------------------------------------------------------------------- /ms-swift/requirements/framework.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/requirements/framework.txt -------------------------------------------------------------------------------- /ms-swift/requirements/install_all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/requirements/install_all.sh -------------------------------------------------------------------------------- /ms-swift/requirements/swanlab.txt: -------------------------------------------------------------------------------- 1 | swanlab 2 | -------------------------------------------------------------------------------- /ms-swift/requirements/tests.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/requirements/tests.txt -------------------------------------------------------------------------------- /ms-swift/scripts/benchmark/exp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/scripts/benchmark/exp.py -------------------------------------------------------------------------------- /ms-swift/scripts/inference/keye.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/scripts/inference/keye.py -------------------------------------------------------------------------------- /ms-swift/scripts/utils/plot_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/scripts/utils/plot_loss.py -------------------------------------------------------------------------------- /ms-swift/scripts/utils/run_template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/scripts/utils/run_template.py -------------------------------------------------------------------------------- /ms-swift/setup.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/setup.cfg -------------------------------------------------------------------------------- /ms-swift/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/setup.py -------------------------------------------------------------------------------- /ms-swift/swift/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ms-swift/swift/cli/_megatron/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ms-swift/swift/cli/_megatron/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/_megatron/main.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/_megatron/pt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/_megatron/pt.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/_megatron/rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/_megatron/rlhf.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/_megatron/sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/_megatron/sft.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/app.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/deploy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/deploy.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/eval.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/export.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/export.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/infer.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/main.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/merge_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/merge_lora.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/pt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/pt.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/rlhf.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/rollout.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/sample.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/sft.py -------------------------------------------------------------------------------- /ms-swift/swift/cli/web_ui.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/cli/web_ui.py -------------------------------------------------------------------------------- /ms-swift/swift/hub/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/hub/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/hub/constant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/hub/constant.py -------------------------------------------------------------------------------- /ms-swift/swift/hub/hub.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/hub/hub.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/app/__init__.py: -------------------------------------------------------------------------------- 1 | from .app import SwiftApp, app_main 2 | -------------------------------------------------------------------------------- /ms-swift/swift/llm/app/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/app/app.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/app/build_ui.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/app/build_ui.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/app/locale.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/app/locale.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/base.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/data_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/data_loader.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/dataset/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/dataset/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/dataset/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/dataset/loader.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/dataset/media.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/dataset/media.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/dataset/register.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/dataset/register.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/dataset/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/dataset/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/eval/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/eval/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/eval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/eval/eval.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/eval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/eval/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/export/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/export/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/export/export.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/export/export.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/export/ollama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/export/ollama.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/export/quant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/export/quant.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/infer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/infer/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/infer/deploy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/infer/deploy.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/infer/infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/infer/infer.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/infer/protocol.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/infer/protocol.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/infer/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/infer/rollout.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/infer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/infer/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/constant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/constant.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/model/baai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/model/baai.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/model/bert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/model/bert.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/model/glm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/model/glm.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/model/llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/model/llm.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/model/mllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/model/mllm.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/model/qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/model/qwen.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/model/yi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/model/yi.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/model_arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/model_arch.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/patcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/patcher.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/register.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/register.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/model/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/model/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/sampling/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/sampling/base.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/sampling/mcts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/sampling/mcts.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/sampling/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/sampling/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/template/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/template/base.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/template/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/template/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/train/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/train/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/train/callback.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/train/callback.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/train/kto.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/train/kto.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/train/pt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/train/pt.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/train/rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/train/rlhf.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/train/sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/train/sft.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/train/tuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/train/tuner.py -------------------------------------------------------------------------------- /ms-swift/swift/llm/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/llm/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/init.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/init.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/model/rope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/model/rope.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/train/pt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/train/pt.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/train/rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/train/rlhf.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/train/sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/train/sft.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/train/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/train/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/tuners/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | from . import lora 3 | -------------------------------------------------------------------------------- /ms-swift/swift/megatron/tuners/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/tuners/lora.py -------------------------------------------------------------------------------- /ms-swift/swift/megatron/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/megatron/utils/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/callback.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/callback.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/env.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/loss.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/metric.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/multi_turn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/multi_turn.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/optimizer.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/orm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/orm.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/prm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/prm.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/rm_plugin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/rm_plugin.py -------------------------------------------------------------------------------- /ms-swift/swift/plugin/tuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/plugin/tuner.py -------------------------------------------------------------------------------- /ms-swift/swift/trainers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/trainers/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/trainers/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/trainers/arguments.py -------------------------------------------------------------------------------- /ms-swift/swift/trainers/callback.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/trainers/callback.py -------------------------------------------------------------------------------- /ms-swift/swift/trainers/mixin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/trainers/mixin.py -------------------------------------------------------------------------------- /ms-swift/swift/trainers/optimizers/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/trainers/trainers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/trainers/trainers.py -------------------------------------------------------------------------------- /ms-swift/swift/trainers/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/trainers/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/adapter.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/base.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/llamapro.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/llamapro.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/longlora/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/tuners/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/lora.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/lora_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/lora_layers.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/mapping.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/mapping.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/neftune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/neftune.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/part.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/part.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/peft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/peft.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/prompt.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/reft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/reft.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/restuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/restuning.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/side.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/side.py -------------------------------------------------------------------------------- /ms-swift/swift/tuners/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/tuners/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/app.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/base.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_eval/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_eval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_eval/eval.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_eval/llm_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_eval/llm_eval.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_eval/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_eval/model.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_eval/runtime.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_eval/runtime.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_export/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_export/export.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_export/export.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_export/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_export/model.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/advanced.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/advanced.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/dataset.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/hyper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/hyper.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/llm_grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/llm_grpo.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/lora.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/model.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/reward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/reward.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/rollout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/rollout.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/runtime.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/runtime.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/save.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/save.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/target.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/target.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_grpo/tuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_grpo/tuner.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_infer/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_infer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_infer/model.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_infer/runtime.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_infer/runtime.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/advanced.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/advanced.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/dataset.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/hyper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/hyper.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/llm_rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/llm_rlhf.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/lora.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/model.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/rlhf.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/runtime.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/runtime.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/save.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/save.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/target.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/target.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_rlhf/tuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_rlhf/tuner.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_sample/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_sample/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_sample/model.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_sample/sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_sample/sample.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Alibaba, Inc. and its affiliates. 2 | -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/dataset.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/hyper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/hyper.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/lora.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/model.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/runtime.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/runtime.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/save.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/save.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/target.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/target.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/task.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/tuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/tuner.py -------------------------------------------------------------------------------- /ms-swift/swift/ui/llm_train/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/ui/llm_train/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/__init__.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/constants.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/env.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/import_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/import_utils.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/io_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/io_utils.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/logger.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/np_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/np_utils.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/tb_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/tb_utils.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/torch_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/torch_utils.py -------------------------------------------------------------------------------- /ms-swift/swift/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/utils/utils.py -------------------------------------------------------------------------------- /ms-swift/swift/version.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/swift/version.py -------------------------------------------------------------------------------- /ms-swift/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ms-swift/tests/app/test_app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/app/test_app.py -------------------------------------------------------------------------------- /ms-swift/tests/deploy/test_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/deploy/test_dataset.py -------------------------------------------------------------------------------- /ms-swift/tests/deploy/test_logprobs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/deploy/test_logprobs.py -------------------------------------------------------------------------------- /ms-swift/tests/eval/test_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/eval/test_eval.py -------------------------------------------------------------------------------- /ms-swift/tests/export/test_quant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/export/test_quant.py -------------------------------------------------------------------------------- /ms-swift/tests/general/test_arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/general/test_arch.py -------------------------------------------------------------------------------- /ms-swift/tests/general/test_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/general/test_dataset.py -------------------------------------------------------------------------------- /ms-swift/tests/general/test_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/general/test_model.py -------------------------------------------------------------------------------- /ms-swift/tests/general/test_stream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/general/test_stream.py -------------------------------------------------------------------------------- /ms-swift/tests/hub/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ms-swift/tests/hub/test_check_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/hub/test_check_model.py -------------------------------------------------------------------------------- /ms-swift/tests/infer/test_agent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/infer/test_agent.py -------------------------------------------------------------------------------- /ms-swift/tests/infer/test_infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/infer/test_infer.py -------------------------------------------------------------------------------- /ms-swift/tests/infer/test_logprobs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/infer/test_logprobs.py -------------------------------------------------------------------------------- /ms-swift/tests/infer/test_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/infer/test_main.py -------------------------------------------------------------------------------- /ms-swift/tests/infer/test_mllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/infer/test_mllm.py -------------------------------------------------------------------------------- /ms-swift/tests/infer/test_sglang.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/infer/test_sglang.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ms-swift/tests/llm/config/infer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/config/infer.json -------------------------------------------------------------------------------- /ms-swift/tests/llm/config/sft.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/config/sft.json -------------------------------------------------------------------------------- /ms-swift/tests/llm/data/alpaca.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/data/alpaca.csv -------------------------------------------------------------------------------- /ms-swift/tests/llm/data/alpaca.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/data/alpaca.jsonl -------------------------------------------------------------------------------- /ms-swift/tests/llm/data/alpaca2.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/data/alpaca2.csv -------------------------------------------------------------------------------- /ms-swift/tests/llm/data/chatml.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/data/chatml.jsonl -------------------------------------------------------------------------------- /ms-swift/tests/llm/data/sharegpt.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/data/sharegpt.jsonl -------------------------------------------------------------------------------- /ms-swift/tests/llm/data/swift_pre.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/data/swift_pre.csv -------------------------------------------------------------------------------- /ms-swift/tests/llm/load_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/load_model.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/load_template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/load_template.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/test_custom.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/test_custom.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/test_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/test_dataset.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/test_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/test_run.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/test_run3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/test_run3.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/test_template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/test_template.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/test_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/test_utils.py -------------------------------------------------------------------------------- /ms-swift/tests/llm/test_web_ui.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/llm/test_web_ui.py -------------------------------------------------------------------------------- /ms-swift/tests/megatron/test_export.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/megatron/test_export.py -------------------------------------------------------------------------------- /ms-swift/tests/megatron/test_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/megatron/test_lora.py -------------------------------------------------------------------------------- /ms-swift/tests/megatron/test_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/megatron/test_model.py -------------------------------------------------------------------------------- /ms-swift/tests/megatron/test_rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/megatron/test_rlhf.py -------------------------------------------------------------------------------- /ms-swift/tests/megatron/test_save.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/megatron/test_save.py -------------------------------------------------------------------------------- /ms-swift/tests/megatron/test_train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/megatron/test_train.py -------------------------------------------------------------------------------- /ms-swift/tests/model_tag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/model_tag.py -------------------------------------------------------------------------------- /ms-swift/tests/models/test_llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/models/test_llm.py -------------------------------------------------------------------------------- /ms-swift/tests/models/test_mllm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/models/test_mllm.py -------------------------------------------------------------------------------- /ms-swift/tests/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/run.py -------------------------------------------------------------------------------- /ms-swift/tests/run_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/run_config.yaml -------------------------------------------------------------------------------- /ms-swift/tests/sample/test_client.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/sample/test_client.py -------------------------------------------------------------------------------- /ms-swift/tests/test_align/test_cls.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/test_align/test_cls.py -------------------------------------------------------------------------------- /ms-swift/tests/test_align/test_rlhf_loss.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ms-swift/tests/test_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/test_utils.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_channel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_channel.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_cls.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_cls.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_embedding.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_freeze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_freeze.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_gkd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_gkd.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_grounding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_grounding.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_grpo.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_kto.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_kto.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_liger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_liger.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_packing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_packing.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_ppo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_ppo.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_pt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_pt.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_rlhf.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_sample.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_sft.py -------------------------------------------------------------------------------- /ms-swift/tests/train/test_vit_lr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/train/test_vit_lr.py -------------------------------------------------------------------------------- /ms-swift/tests/tuners/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ms-swift/tests/tuners/test_neft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/tuners/test_neft.py -------------------------------------------------------------------------------- /ms-swift/tests/tuners/test_peft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/tuners/test_peft.py -------------------------------------------------------------------------------- /ms-swift/tests/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /ms-swift/tests/utils/test_io_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/ms-swift/tests/utils/test_io_utils.py -------------------------------------------------------------------------------- /scrips/baselines.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/scrips/baselines.sh -------------------------------------------------------------------------------- /scrips/eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/scrips/eval.sh -------------------------------------------------------------------------------- /scrips/train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Espere-1119-Song/VideoNSA/HEAD/scrips/train.sh --------------------------------------------------------------------------------