├── .gitignore ├── Inference.md ├── LICENSE ├── README.md ├── Train.md ├── backward.mermaid ├── configs ├── ARWKV-0.5B │ ├── config.json │ ├── generation_config.json │ ├── tokenizer.json │ ├── tokenizer_config.json │ └── vocab.json ├── ARWKV-1.5B │ ├── config.json │ ├── generation_config.json │ ├── tokenizer.json │ ├── tokenizer_config.json │ └── vocab.json ├── ARWKV-14B │ ├── config.json │ ├── generation_config.json │ ├── tokenizer.json │ ├── tokenizer_config.json │ └── vocab.json ├── ARWKV-32B │ ├── config.json │ ├── generation_config.json │ ├── tokenizer.json │ ├── tokenizer_config.json │ └── vocab.json ├── ARWKV-3B │ ├── config.json │ ├── generation_config.json │ ├── tokenizer.json │ ├── tokenizer_config.json │ └── vocab.json ├── ARWKV-72B │ ├── config.json │ ├── generation_config.json │ ├── tokenizer.json │ ├── tokenizer_config.json │ └── vocab.json ├── ARWKV-7B │ ├── config.json │ ├── generation_config.json │ ├── tokenizer.json │ ├── tokenizer_config.json │ └── vocab.json ├── qwen_0.5b.yaml └── qwen_7b.yaml ├── convert_pt_and_hf.sh ├── data ├── multi_source_datasets.py └── raw_dataset.py ├── forward.mermaid ├── image-1.png ├── image.png ├── rl ├── data_producer.py ├── deepspeed_rl_train.py ├── grpo_config.py ├── grpo_trainer.py ├── profiler.py ├── rl_trainer.py ├── train.mermaid ├── train_rl.py ├── train_rl_model.py └── utilities.py ├── rwkv_inside ├── TimeMixer.py ├── __init__.py ├── cuda │ ├── wkv6_cuda.cu │ ├── wkv6_op.cpp │ ├── wkv7_cuda.cu │ └── wkv7_op.cpp ├── hip │ ├── wkv6_hip.hip │ ├── wkv6_op.cpp │ ├── wkv7_hip.hip │ └── wkv7_op.cpp ├── hybrid_model.py ├── modeling_arwkv.py ├── rwkv_cuda_wind │ ├── backstepping_f32.cpp │ ├── backstepping_f32_1.cu │ ├── backstepping_f32_2.cu │ ├── tile.cuh │ ├── wind_rwkv7.cpp │ └── wind_rwkv7.cu ├── test_mask.py └── utilities.py ├── test ├── chinese_conv.jsonl ├── codes_python.jsonl ├── convert_2_hf.py ├── evaluate_distribution.py ├── hybrid_model_run_rwkv7.py ├── news_test.jsonl ├── test_chat_cli.py ├── test_hf.py ├── test_hf_gradio.py ├── test_hf_gradio_thinking.py ├── test_hf_thinking.py ├── test_hf_webui.py ├── test_samples.jsonl └── utilities.py ├── train.sh ├── train_memo.txt └── train_scripts ├── convert_pt.py ├── profiler.py ├── save_checkpoint.py ├── split_model_params.py ├── train_functions.py └── train_hybrid_deepspeed.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/.gitignore -------------------------------------------------------------------------------- /Inference.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/Inference.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/README.md -------------------------------------------------------------------------------- /Train.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/Train.md -------------------------------------------------------------------------------- /backward.mermaid: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/backward.mermaid -------------------------------------------------------------------------------- /configs/ARWKV-0.5B/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-0.5B/config.json -------------------------------------------------------------------------------- /configs/ARWKV-0.5B/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-0.5B/generation_config.json -------------------------------------------------------------------------------- /configs/ARWKV-0.5B/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-0.5B/tokenizer.json -------------------------------------------------------------------------------- /configs/ARWKV-0.5B/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-0.5B/tokenizer_config.json -------------------------------------------------------------------------------- /configs/ARWKV-0.5B/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-0.5B/vocab.json -------------------------------------------------------------------------------- /configs/ARWKV-1.5B/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-1.5B/config.json -------------------------------------------------------------------------------- /configs/ARWKV-1.5B/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-1.5B/generation_config.json -------------------------------------------------------------------------------- /configs/ARWKV-1.5B/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-1.5B/tokenizer.json -------------------------------------------------------------------------------- /configs/ARWKV-1.5B/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-1.5B/tokenizer_config.json -------------------------------------------------------------------------------- /configs/ARWKV-1.5B/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-1.5B/vocab.json -------------------------------------------------------------------------------- /configs/ARWKV-14B/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-14B/config.json -------------------------------------------------------------------------------- /configs/ARWKV-14B/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-14B/generation_config.json -------------------------------------------------------------------------------- /configs/ARWKV-14B/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-14B/tokenizer.json -------------------------------------------------------------------------------- /configs/ARWKV-14B/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-14B/tokenizer_config.json -------------------------------------------------------------------------------- /configs/ARWKV-14B/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-14B/vocab.json -------------------------------------------------------------------------------- /configs/ARWKV-32B/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-32B/config.json -------------------------------------------------------------------------------- /configs/ARWKV-32B/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-32B/generation_config.json -------------------------------------------------------------------------------- /configs/ARWKV-32B/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-32B/tokenizer.json -------------------------------------------------------------------------------- /configs/ARWKV-32B/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-32B/tokenizer_config.json -------------------------------------------------------------------------------- /configs/ARWKV-32B/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-32B/vocab.json -------------------------------------------------------------------------------- /configs/ARWKV-3B/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-3B/config.json -------------------------------------------------------------------------------- /configs/ARWKV-3B/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-3B/generation_config.json -------------------------------------------------------------------------------- /configs/ARWKV-3B/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-3B/tokenizer.json -------------------------------------------------------------------------------- /configs/ARWKV-3B/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-3B/tokenizer_config.json -------------------------------------------------------------------------------- /configs/ARWKV-3B/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-3B/vocab.json -------------------------------------------------------------------------------- /configs/ARWKV-72B/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-72B/config.json -------------------------------------------------------------------------------- /configs/ARWKV-72B/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-72B/generation_config.json -------------------------------------------------------------------------------- /configs/ARWKV-72B/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-72B/tokenizer.json -------------------------------------------------------------------------------- /configs/ARWKV-72B/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-72B/tokenizer_config.json -------------------------------------------------------------------------------- /configs/ARWKV-72B/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-72B/vocab.json -------------------------------------------------------------------------------- /configs/ARWKV-7B/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-7B/config.json -------------------------------------------------------------------------------- /configs/ARWKV-7B/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-7B/generation_config.json -------------------------------------------------------------------------------- /configs/ARWKV-7B/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-7B/tokenizer.json -------------------------------------------------------------------------------- /configs/ARWKV-7B/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-7B/tokenizer_config.json -------------------------------------------------------------------------------- /configs/ARWKV-7B/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/ARWKV-7B/vocab.json -------------------------------------------------------------------------------- /configs/qwen_0.5b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/qwen_0.5b.yaml -------------------------------------------------------------------------------- /configs/qwen_7b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/configs/qwen_7b.yaml -------------------------------------------------------------------------------- /convert_pt_and_hf.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/convert_pt_and_hf.sh -------------------------------------------------------------------------------- /data/multi_source_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/data/multi_source_datasets.py -------------------------------------------------------------------------------- /data/raw_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/data/raw_dataset.py -------------------------------------------------------------------------------- /forward.mermaid: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/forward.mermaid -------------------------------------------------------------------------------- /image-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/image-1.png -------------------------------------------------------------------------------- /image.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/image.png -------------------------------------------------------------------------------- /rl/data_producer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/data_producer.py -------------------------------------------------------------------------------- /rl/deepspeed_rl_train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/deepspeed_rl_train.py -------------------------------------------------------------------------------- /rl/grpo_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/grpo_config.py -------------------------------------------------------------------------------- /rl/grpo_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/grpo_trainer.py -------------------------------------------------------------------------------- /rl/profiler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/profiler.py -------------------------------------------------------------------------------- /rl/rl_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/rl_trainer.py -------------------------------------------------------------------------------- /rl/train.mermaid: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/train.mermaid -------------------------------------------------------------------------------- /rl/train_rl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/train_rl.py -------------------------------------------------------------------------------- /rl/train_rl_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/train_rl_model.py -------------------------------------------------------------------------------- /rl/utilities.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rl/utilities.py -------------------------------------------------------------------------------- /rwkv_inside/TimeMixer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/TimeMixer.py -------------------------------------------------------------------------------- /rwkv_inside/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /rwkv_inside/cuda/wkv6_cuda.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/cuda/wkv6_cuda.cu -------------------------------------------------------------------------------- /rwkv_inside/cuda/wkv6_op.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/cuda/wkv6_op.cpp -------------------------------------------------------------------------------- /rwkv_inside/cuda/wkv7_cuda.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/cuda/wkv7_cuda.cu -------------------------------------------------------------------------------- /rwkv_inside/cuda/wkv7_op.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/cuda/wkv7_op.cpp -------------------------------------------------------------------------------- /rwkv_inside/hip/wkv6_hip.hip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/hip/wkv6_hip.hip -------------------------------------------------------------------------------- /rwkv_inside/hip/wkv6_op.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/hip/wkv6_op.cpp -------------------------------------------------------------------------------- /rwkv_inside/hip/wkv7_hip.hip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/hip/wkv7_hip.hip -------------------------------------------------------------------------------- /rwkv_inside/hip/wkv7_op.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/hip/wkv7_op.cpp -------------------------------------------------------------------------------- /rwkv_inside/hybrid_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/hybrid_model.py -------------------------------------------------------------------------------- /rwkv_inside/modeling_arwkv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/modeling_arwkv.py -------------------------------------------------------------------------------- /rwkv_inside/rwkv_cuda_wind/backstepping_f32.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/rwkv_cuda_wind/backstepping_f32.cpp -------------------------------------------------------------------------------- /rwkv_inside/rwkv_cuda_wind/backstepping_f32_1.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/rwkv_cuda_wind/backstepping_f32_1.cu -------------------------------------------------------------------------------- /rwkv_inside/rwkv_cuda_wind/backstepping_f32_2.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/rwkv_cuda_wind/backstepping_f32_2.cu -------------------------------------------------------------------------------- /rwkv_inside/rwkv_cuda_wind/tile.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/rwkv_cuda_wind/tile.cuh -------------------------------------------------------------------------------- /rwkv_inside/rwkv_cuda_wind/wind_rwkv7.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/rwkv_cuda_wind/wind_rwkv7.cpp -------------------------------------------------------------------------------- /rwkv_inside/rwkv_cuda_wind/wind_rwkv7.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/rwkv_cuda_wind/wind_rwkv7.cu -------------------------------------------------------------------------------- /rwkv_inside/test_mask.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/test_mask.py -------------------------------------------------------------------------------- /rwkv_inside/utilities.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/rwkv_inside/utilities.py -------------------------------------------------------------------------------- /test/chinese_conv.jsonl: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /test/codes_python.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/codes_python.jsonl -------------------------------------------------------------------------------- /test/convert_2_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/convert_2_hf.py -------------------------------------------------------------------------------- /test/evaluate_distribution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/evaluate_distribution.py -------------------------------------------------------------------------------- /test/hybrid_model_run_rwkv7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/hybrid_model_run_rwkv7.py -------------------------------------------------------------------------------- /test/news_test.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/news_test.jsonl -------------------------------------------------------------------------------- /test/test_chat_cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/test_chat_cli.py -------------------------------------------------------------------------------- /test/test_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/test_hf.py -------------------------------------------------------------------------------- /test/test_hf_gradio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/test_hf_gradio.py -------------------------------------------------------------------------------- /test/test_hf_gradio_thinking.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/test_hf_gradio_thinking.py -------------------------------------------------------------------------------- /test/test_hf_thinking.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/test_hf_thinking.py -------------------------------------------------------------------------------- /test/test_hf_webui.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/test_hf_webui.py -------------------------------------------------------------------------------- /test/test_samples.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/test_samples.jsonl -------------------------------------------------------------------------------- /test/utilities.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/test/utilities.py -------------------------------------------------------------------------------- /train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/train.sh -------------------------------------------------------------------------------- /train_memo.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/train_memo.txt -------------------------------------------------------------------------------- /train_scripts/convert_pt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/train_scripts/convert_pt.py -------------------------------------------------------------------------------- /train_scripts/profiler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/train_scripts/profiler.py -------------------------------------------------------------------------------- /train_scripts/save_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/train_scripts/save_checkpoint.py -------------------------------------------------------------------------------- /train_scripts/split_model_params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/train_scripts/split_model_params.py -------------------------------------------------------------------------------- /train_scripts/train_functions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/train_scripts/train_functions.py -------------------------------------------------------------------------------- /train_scripts/train_hybrid_deepspeed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/yynil/RWKVInside/HEAD/train_scripts/train_hybrid_deepspeed.py --------------------------------------------------------------------------------