├── .vscode ├── launch.json └── task.json ├── README.md ├── flashattention └── flash.cu ├── image ├── CPU&GPU arch.drawio ├── CPU&GPU arch.jpg ├── GPU memory hierarchy.drawio ├── GPU memory hierarchy.jpg ├── LoRA.drawio ├── LoRA.jpg ├── LoRA_record.jpeg ├── MindSpore框架下注意力正向反向计算时延.jpeg ├── MindSpore框架下注意力正向计算时延.jpeg ├── MindSpore框架下注意力正向计算时延z(续).jpeg ├── README │ └── 1712827717331.png ├── SPDA&MHA.drawio ├── SPDA&MHA.jpg ├── falcon_rw_1b模型架构图.drawio ├── falcon_rw_1b模型架构图.jpg ├── flash_attn CUDA.drawio ├── flash_attn CUDA.jpg ├── flash_attn分块算法示意图.drawio ├── flash_attn分块算法示意图.jpg ├── triton compile process.drawio ├── triton compile process.jpg ├── 工作路线图.drawio └── 工作路线图.jpg ├── peft_model └── falcon │ └── mrpc_lora │ ├── adapter_config.json │ └── adapter_model.ckpt ├── src └── falcon │ ├── __init__.py │ ├── configuration_falcon.py │ ├── convert_custom_code_checkpoint.py │ └── modeling_falcon.py ├── test ├── test_falcon │ ├── __init__.py │ └── test_modeling_falcon.py └── test_flashattention │ ├── debug_flash_2_kernel.cu │ ├── output │ ├── draw.py │ ├── draw_training_process.py │ ├── extract.py │ ├── forward+backward │ │ ├── flash_attn_1_fwdbwd_seqlen1024.csv │ │ ├── flash_attn_1_fwdbwd_seqlen128.csv │ │ ├── flash_attn_1_fwdbwd_seqlen2048.csv │ │ ├── flash_attn_1_fwdbwd_seqlen256.csv │ │ ├── flash_attn_1_fwdbwd_seqlen32.csv │ │ ├── flash_attn_1_fwdbwd_seqlen512.csv │ │ ├── flash_attn_1_fwdbwd_seqlen64.csv │ │ ├── flash_attn_2_fwdbwd_seqlen1024.csv │ │ ├── flash_attn_2_fwdbwd_seqlen128.csv │ │ ├── flash_attn_2_fwdbwd_seqlen2048.csv │ │ ├── flash_attn_2_fwdbwd_seqlen256.csv │ │ ├── flash_attn_2_fwdbwd_seqlen32.csv │ │ ├── flash_attn_2_fwdbwd_seqlen512.csv │ │ ├── flash_attn_2_fwdbwd_seqlen64.csv │ │ ├── manul_attn_fwdbwd_seqlen1024.csv │ │ ├── manul_attn_fwdbwd_seqlen128.csv │ │ ├── manul_attn_fwdbwd_seqlen2048.csv │ │ ├── manul_attn_fwdbwd_seqlen256.csv │ │ ├── manul_attn_fwdbwd_seqlen32.csv │ │ ├── manul_attn_fwdbwd_seqlen512.csv │ │ └── manul_attn_fwdbwd_seqlen64.csv │ ├── forward │ │ ├── flash_attn_1_fwd_seqlen1.csv │ │ ├── flash_attn_1_fwd_seqlen1024.csv │ │ ├── flash_attn_1_fwd_seqlen128.csv │ │ ├── flash_attn_1_fwd_seqlen2048.csv │ │ ├── flash_attn_1_fwd_seqlen256.csv │ │ ├── flash_attn_1_fwd_seqlen32.csv │ │ ├── flash_attn_1_fwd_seqlen512.csv │ │ ├── flash_attn_1_fwd_seqlen64.csv │ │ ├── flash_attn_2_fwd_seqlen1.csv │ │ ├── flash_attn_2_fwd_seqlen1024.csv │ │ ├── flash_attn_2_fwd_seqlen128.csv │ │ ├── flash_attn_2_fwd_seqlen2048.csv │ │ ├── flash_attn_2_fwd_seqlen256.csv │ │ ├── flash_attn_2_fwd_seqlen32.csv │ │ ├── flash_attn_2_fwd_seqlen512.csv │ │ ├── flash_attn_2_fwd_seqlen64.csv │ │ ├── manul_attn_fwd_seqlen1.csv │ │ ├── manul_attn_fwd_seqlen1024.csv │ │ ├── manul_attn_fwd_seqlen128.csv │ │ ├── manul_attn_fwd_seqlen2048.csv │ │ ├── manul_attn_fwd_seqlen256.csv │ │ ├── manul_attn_fwd_seqlen32.csv │ │ ├── manul_attn_fwd_seqlen512.csv │ │ └── manul_attn_fwd_seqlen64.csv │ └── test.py │ ├── profile │ ├── forward+backward │ │ ├── test_flash_attn_1_fwdbwd.py │ │ ├── test_flash_attn_2_fwdbwd.py │ │ └── test_manual_attn_fwdbwd.py │ └── forward │ │ ├── test_flash_attn_1_fwd.py │ │ ├── test_flash_attn_2_fwd.py │ │ └── test_manual_attn_fwd.py │ └── test_flashattention.py ├── train_falcon ├── alpaca_dataset.py ├── data │ └── alpaca │ │ ├── alpaca_data_cleaned_archive.json │ │ ├── test.ms │ │ ├── test.ms.db │ │ ├── train.ms │ │ └── train.ms.db ├── mrpc_dataset.py ├── prepare_alpaca.py ├── readme.md ├── train_alpaca.py └── train_mrpc.py └── 周记 ├── BiLLM.pptx ├── Deep into Intel CPU Inference.pptx ├── Intel CPU Inference.pptx ├── Intel SparseLib.pptx ├── Llama.cpp RISC-V Support.pptx ├── Llama.cpp RISC-V Support(2).pptx ├── RISC-V-Extension-for-1bit.pptx ├── Week-1 生成模型初探.pptx ├── Week-10 分布式并行.pptx ├── Week-11 tokenizer.pptx ├── Week-12 finetune logs.pptx ├── Week-13 MindSpore分布式并行.pptx ├── Week-14 flash attention & triton.pptx ├── Week-15 flash attention v2.pptx ├── Week-16 Triton&Polyheral Model.pptx ├── Week-17 Triton&OneBit.pptx ├── Week-18 1bit.pptx ├── Week-2 Falcon模型迁移.pptx ├── Week-3 MindSpore模型迁移细节.pptx ├── Week-4 RoPE.pptx ├── Week-5 MQA&ALiBi&FlashAttention.pptx ├── Week-6 PEFT.pptx ├── Week-7 迁移进展.pptx ├── Week-8 模型迁移完成.pptx ├── Week-9 Alpaca_dataset.pptx ├── ~$Deep into Intel CPU Inference.pptx ├── ~$Intel CPU Inference.pptx └── ~$Week-5 MQA&ALiBi&FlashAttention.pptx /.vscode/launch.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/.vscode/launch.json -------------------------------------------------------------------------------- /.vscode/task.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/.vscode/task.json -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/README.md -------------------------------------------------------------------------------- /flashattention/flash.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/flashattention/flash.cu -------------------------------------------------------------------------------- /image/CPU&GPU arch.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/CPU&GPU arch.drawio -------------------------------------------------------------------------------- /image/CPU&GPU arch.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/CPU&GPU arch.jpg -------------------------------------------------------------------------------- /image/GPU memory hierarchy.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/GPU memory hierarchy.drawio -------------------------------------------------------------------------------- /image/GPU memory hierarchy.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/GPU memory hierarchy.jpg -------------------------------------------------------------------------------- /image/LoRA.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/LoRA.drawio -------------------------------------------------------------------------------- /image/LoRA.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/LoRA.jpg -------------------------------------------------------------------------------- /image/LoRA_record.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/LoRA_record.jpeg -------------------------------------------------------------------------------- /image/MindSpore框架下注意力正向反向计算时延.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/MindSpore框架下注意力正向反向计算时延.jpeg -------------------------------------------------------------------------------- /image/MindSpore框架下注意力正向计算时延.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/MindSpore框架下注意力正向计算时延.jpeg -------------------------------------------------------------------------------- /image/MindSpore框架下注意力正向计算时延z(续).jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/MindSpore框架下注意力正向计算时延z(续).jpeg -------------------------------------------------------------------------------- /image/README/1712827717331.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/README/1712827717331.png -------------------------------------------------------------------------------- /image/SPDA&MHA.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/SPDA&MHA.drawio -------------------------------------------------------------------------------- /image/SPDA&MHA.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/SPDA&MHA.jpg -------------------------------------------------------------------------------- /image/falcon_rw_1b模型架构图.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/falcon_rw_1b模型架构图.drawio -------------------------------------------------------------------------------- /image/falcon_rw_1b模型架构图.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/falcon_rw_1b模型架构图.jpg -------------------------------------------------------------------------------- /image/flash_attn CUDA.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/flash_attn CUDA.drawio -------------------------------------------------------------------------------- /image/flash_attn CUDA.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/flash_attn CUDA.jpg -------------------------------------------------------------------------------- /image/flash_attn分块算法示意图.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/flash_attn分块算法示意图.drawio -------------------------------------------------------------------------------- /image/flash_attn分块算法示意图.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/flash_attn分块算法示意图.jpg -------------------------------------------------------------------------------- /image/triton compile process.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/triton compile process.drawio -------------------------------------------------------------------------------- /image/triton compile process.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/triton compile process.jpg -------------------------------------------------------------------------------- /image/工作路线图.drawio: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/工作路线图.drawio -------------------------------------------------------------------------------- /image/工作路线图.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/image/工作路线图.jpg -------------------------------------------------------------------------------- /peft_model/falcon/mrpc_lora/adapter_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/peft_model/falcon/mrpc_lora/adapter_config.json -------------------------------------------------------------------------------- /peft_model/falcon/mrpc_lora/adapter_model.ckpt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/peft_model/falcon/mrpc_lora/adapter_model.ckpt -------------------------------------------------------------------------------- /src/falcon/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/src/falcon/__init__.py -------------------------------------------------------------------------------- /src/falcon/configuration_falcon.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/src/falcon/configuration_falcon.py -------------------------------------------------------------------------------- /src/falcon/convert_custom_code_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/src/falcon/convert_custom_code_checkpoint.py -------------------------------------------------------------------------------- /src/falcon/modeling_falcon.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/src/falcon/modeling_falcon.py -------------------------------------------------------------------------------- /test/test_falcon/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /test/test_falcon/test_modeling_falcon.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_falcon/test_modeling_falcon.py -------------------------------------------------------------------------------- /test/test_flashattention/debug_flash_2_kernel.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/debug_flash_2_kernel.cu -------------------------------------------------------------------------------- /test/test_flashattention/output/draw.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/draw.py -------------------------------------------------------------------------------- /test/test_flashattention/output/draw_training_process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/draw_training_process.py -------------------------------------------------------------------------------- /test/test_flashattention/output/extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/extract.py -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen1024.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen1024.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen128.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen128.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen2048.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen2048.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen256.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen256.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen32.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen32.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen512.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen512.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen64.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_1_fwdbwd_seqlen64.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen1024.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen1024.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen128.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen128.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen2048.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen2048.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen256.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen256.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen32.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen32.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen512.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen512.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen64.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/flash_attn_2_fwdbwd_seqlen64.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen1024.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen1024.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen128.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen128.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen2048.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen2048.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen256.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen256.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen32.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen32.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen512.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen512.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen64.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward+backward/manul_attn_fwdbwd_seqlen64.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen1.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen1.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen1024.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen1024.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen128.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen128.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen2048.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen2048.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen256.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen256.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen32.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen32.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen512.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen512.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen64.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_1_fwd_seqlen64.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen1.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen1.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen1024.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen1024.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen128.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen128.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen2048.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen2048.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen256.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen256.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen32.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen32.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen512.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen512.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen64.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/flash_attn_2_fwd_seqlen64.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/manul_attn_fwd_seqlen1.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/manul_attn_fwd_seqlen1.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/manul_attn_fwd_seqlen1024.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/manul_attn_fwd_seqlen1024.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/manul_attn_fwd_seqlen128.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/manul_attn_fwd_seqlen128.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/manul_attn_fwd_seqlen2048.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/manul_attn_fwd_seqlen2048.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/manul_attn_fwd_seqlen256.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/manul_attn_fwd_seqlen256.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/manul_attn_fwd_seqlen32.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/manul_attn_fwd_seqlen32.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/manul_attn_fwd_seqlen512.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/manul_attn_fwd_seqlen512.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/forward/manul_attn_fwd_seqlen64.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/forward/manul_attn_fwd_seqlen64.csv -------------------------------------------------------------------------------- /test/test_flashattention/output/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/output/test.py -------------------------------------------------------------------------------- /test/test_flashattention/profile/forward+backward/test_flash_attn_1_fwdbwd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/profile/forward+backward/test_flash_attn_1_fwdbwd.py -------------------------------------------------------------------------------- /test/test_flashattention/profile/forward+backward/test_flash_attn_2_fwdbwd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/profile/forward+backward/test_flash_attn_2_fwdbwd.py -------------------------------------------------------------------------------- /test/test_flashattention/profile/forward+backward/test_manual_attn_fwdbwd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/profile/forward+backward/test_manual_attn_fwdbwd.py -------------------------------------------------------------------------------- /test/test_flashattention/profile/forward/test_flash_attn_1_fwd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/profile/forward/test_flash_attn_1_fwd.py -------------------------------------------------------------------------------- /test/test_flashattention/profile/forward/test_flash_attn_2_fwd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/profile/forward/test_flash_attn_2_fwd.py -------------------------------------------------------------------------------- /test/test_flashattention/profile/forward/test_manual_attn_fwd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/profile/forward/test_manual_attn_fwd.py -------------------------------------------------------------------------------- /test/test_flashattention/test_flashattention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/test/test_flashattention/test_flashattention.py -------------------------------------------------------------------------------- /train_falcon/alpaca_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/alpaca_dataset.py -------------------------------------------------------------------------------- /train_falcon/data/alpaca/alpaca_data_cleaned_archive.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/data/alpaca/alpaca_data_cleaned_archive.json -------------------------------------------------------------------------------- /train_falcon/data/alpaca/test.ms: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/data/alpaca/test.ms -------------------------------------------------------------------------------- /train_falcon/data/alpaca/test.ms.db: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/data/alpaca/test.ms.db -------------------------------------------------------------------------------- /train_falcon/data/alpaca/train.ms: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/data/alpaca/train.ms -------------------------------------------------------------------------------- /train_falcon/data/alpaca/train.ms.db: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/data/alpaca/train.ms.db -------------------------------------------------------------------------------- /train_falcon/mrpc_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/mrpc_dataset.py -------------------------------------------------------------------------------- /train_falcon/prepare_alpaca.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/prepare_alpaca.py -------------------------------------------------------------------------------- /train_falcon/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/readme.md -------------------------------------------------------------------------------- /train_falcon/train_alpaca.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/train_alpaca.py -------------------------------------------------------------------------------- /train_falcon/train_mrpc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/train_falcon/train_mrpc.py -------------------------------------------------------------------------------- /周记/BiLLM.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/BiLLM.pptx -------------------------------------------------------------------------------- /周记/Deep into Intel CPU Inference.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Deep into Intel CPU Inference.pptx -------------------------------------------------------------------------------- /周记/Intel CPU Inference.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Intel CPU Inference.pptx -------------------------------------------------------------------------------- /周记/Intel SparseLib.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Intel SparseLib.pptx -------------------------------------------------------------------------------- /周记/Llama.cpp RISC-V Support.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Llama.cpp RISC-V Support.pptx -------------------------------------------------------------------------------- /周记/Llama.cpp RISC-V Support(2).pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Llama.cpp RISC-V Support(2).pptx -------------------------------------------------------------------------------- /周记/RISC-V-Extension-for-1bit.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/RISC-V-Extension-for-1bit.pptx -------------------------------------------------------------------------------- /周记/Week-1 生成模型初探.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-1 生成模型初探.pptx -------------------------------------------------------------------------------- /周记/Week-10 分布式并行.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-10 分布式并行.pptx -------------------------------------------------------------------------------- /周记/Week-11 tokenizer.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-11 tokenizer.pptx -------------------------------------------------------------------------------- /周记/Week-12 finetune logs.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-12 finetune logs.pptx -------------------------------------------------------------------------------- /周记/Week-13 MindSpore分布式并行.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-13 MindSpore分布式并行.pptx -------------------------------------------------------------------------------- /周记/Week-14 flash attention & triton.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-14 flash attention & triton.pptx -------------------------------------------------------------------------------- /周记/Week-15 flash attention v2.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-15 flash attention v2.pptx -------------------------------------------------------------------------------- /周记/Week-16 Triton&Polyheral Model.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-16 Triton&Polyheral Model.pptx -------------------------------------------------------------------------------- /周记/Week-17 Triton&OneBit.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-17 Triton&OneBit.pptx -------------------------------------------------------------------------------- /周记/Week-18 1bit.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-18 1bit.pptx -------------------------------------------------------------------------------- /周记/Week-2 Falcon模型迁移.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-2 Falcon模型迁移.pptx -------------------------------------------------------------------------------- /周记/Week-3 MindSpore模型迁移细节.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-3 MindSpore模型迁移细节.pptx -------------------------------------------------------------------------------- /周记/Week-4 RoPE.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-4 RoPE.pptx -------------------------------------------------------------------------------- /周记/Week-5 MQA&ALiBi&FlashAttention.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-5 MQA&ALiBi&FlashAttention.pptx -------------------------------------------------------------------------------- /周记/Week-6 PEFT.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-6 PEFT.pptx -------------------------------------------------------------------------------- /周记/Week-7 迁移进展.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-7 迁移进展.pptx -------------------------------------------------------------------------------- /周记/Week-8 模型迁移完成.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-8 模型迁移完成.pptx -------------------------------------------------------------------------------- /周记/Week-9 Alpaca_dataset.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/Week-9 Alpaca_dataset.pptx -------------------------------------------------------------------------------- /周记/~$Deep into Intel CPU Inference.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/~$Deep into Intel CPU Inference.pptx -------------------------------------------------------------------------------- /周记/~$Intel CPU Inference.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/~$Intel CPU Inference.pptx -------------------------------------------------------------------------------- /周记/~$Week-5 MQA&ALiBi&FlashAttention.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/hypertseng/migration-falcon/HEAD/周记/~$Week-5 MQA&ALiBi&FlashAttention.pptx --------------------------------------------------------------------------------