├── .gitignore
├── INT8_GPT2
    ├── .gitattributes
    ├── .gitignore
    ├── LICENSE
    ├── README.md
    ├── assets
    │   ├── gpt2_124M_loss.png
    │   └── nanogpt.jpg
    ├── bench.py
    ├── config
    │   ├── eval_gpt2.py
    │   ├── eval_gpt2_large.py
    │   ├── eval_gpt2_medium.py
    │   ├── eval_gpt2_xl.py
    │   ├── finetune_shakespeare.py
    │   ├── train_gpt2.py
    │   └── train_shakespeare_char.py
    ├── configurator.py
    ├── data
    │   ├── openwebtext
    │   │   ├── prepare.py
    │   │   └── readme.md
    │   ├── shakespeare
    │   │   ├── prepare.py
    │   │   └── readme.md
    │   └── shakespeare_char
    │   │   ├── prepare.py
    │   │   └── readme.md
    ├── model.py
    ├── qmodel.py
    ├── sample.py
    ├── scaling_laws.ipynb
    ├── train.py
    └── transformer_sizing.ipynb
├── Jetfire
    ├── Linear
    │   ├── __init__.py
    │   ├── linear_bwd.py
    │   └── linear_fwd.py
    ├── Nonlinear
    │   ├── __init__.py
    │   ├── add.py
    │   ├── add_mean_var.py
    │   ├── common.py
    │   ├── dequantize.py
    │   ├── dropout_bwd.py
    │   ├── dropout_fwd.py
    │   ├── gelu_bwd.py
    │   ├── gelu_fwd.py
    │   ├── layernorm.py
    │   ├── quantize.py
    │   ├── quantize_transpose.py
    │   ├── testgelu.py
    │   ├── transpose.py
    │   └── utils.py
    └── __init__.py
├── JetfireGEMMKernel
    ├── BlockQuantize
    │   ├── QBlockLinear.py
    │   ├── __init__.py
    │   └── cpp_extension
    │   │   ├── bindings.cpp
    │   │   ├── hgelu.cu
    │   │   ├── hgemm.cu
    │   │   ├── igemm
    │   │       ├── igemm_BasicInt8Gemm.cu
    │   │       ├── igemm_BlockSquare32OutputFp.cu
    │   │       ├── igemm_BlockSquare32OutputIntQuantize.cu
    │   │       ├── igemm_BlockSquare32OutputIntQuantizeBiasRowCol.cu
    │   │       ├── igemm_BlockSquare32OutputIntQuantizeBiasRowRow.cu
    │   │       ├── igemm_BlockSquare32OutputIntQuantizeStochastic.cu
    │   │       └── igemm_BlockSquare32OutputIntQuantizeTrash.cu
    │   │   └── include
    │   │       ├── common.h
    │   │       ├── hgelu.h
    │   │       ├── hgemm.h
    │   │       ├── igelu.h
    │   │       └── igemm.h
    ├── benchmark
    │   ├── benchmark.ipynb
    │   ├── benchmark_fp.py
    │   ├── benchmark_ours.py
    │   ├── result
    │   │   ├── DQInt8Fp
    │   │   │   └── result.npy
    │   │   ├── torch-16
    │   │   │   └── result.npy
    │   │   └── torch-32
    │   │   │   └── result.npy
    │   └── transpose_speed.ipynb
    ├── cppsrc
    │   └── igemm
    │   │   ├── igemm_BasicInt8Gemm
    │   │       ├── compute
    │   │       ├── compute.cu
    │   │       └── makefile
    │   │   ├── igemm_BasicInt8Gemm_128_128_32
    │   │       ├── A.txt
    │   │       ├── B.txt
    │   │       ├── CPU.txt
    │   │       ├── GPU.txt
    │   │       ├── compute
    │   │       ├── compute.cu
    │   │       └── makefile
    │   │   ├── igemm_BlockSquare32OutputFp
    │   │       ├── CPU.txt
    │   │       ├── GPU.txt
    │   │       ├── compute
    │   │       ├── compute.cu
    │   │       └── makefile
    │   │   ├── igemm_PerBlockRowScaleOutputFp
    │   │       ├── compute
    │   │       ├── compute.cu
    │   │       └── makefile
    │   │   └── igemm_PerBlockRowScaleOutputFp_128_128_32
    │   │       ├── A.txt
    │   │       ├── B.txt
    │   │       ├── CPU.txt
    │   │       ├── GPU.txt
    │   │       ├── compute
    │   │       ├── compute.cu
    │   │       └── makefile
    ├── debug.txt
    ├── setup.py
    └── tests
    │   ├── test_basicint8igemm.py
    │   ├── test_hgemm.py
    │   ├── test_int8igemmOutputFPNoQuantize.py
    │   ├── test_int8igemmoutputIntQuantizeBiasRowCol.py
    │   ├── test_int8igemmoutputIntQuantizeBiasRowRow.py
    │   ├── test_int8igemmoutputIntQuantizeDeterministic.py
    │   └── test_int8igemmoutputIntQuantizeStochastic.py
└── README.md


/.gitignore:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/.gitignore


--------------------------------------------------------------------------------
/INT8_GPT2/.gitattributes:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/.gitattributes


--------------------------------------------------------------------------------
/INT8_GPT2/.gitignore:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/.gitignore


--------------------------------------------------------------------------------
/INT8_GPT2/LICENSE:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/LICENSE


--------------------------------------------------------------------------------
/INT8_GPT2/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/README.md


--------------------------------------------------------------------------------
/INT8_GPT2/assets/gpt2_124M_loss.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/assets/gpt2_124M_loss.png


--------------------------------------------------------------------------------
/INT8_GPT2/assets/nanogpt.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/assets/nanogpt.jpg


--------------------------------------------------------------------------------
/INT8_GPT2/bench.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/bench.py


--------------------------------------------------------------------------------
/INT8_GPT2/config/eval_gpt2.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/config/eval_gpt2.py


--------------------------------------------------------------------------------
/INT8_GPT2/config/eval_gpt2_large.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/config/eval_gpt2_large.py


--------------------------------------------------------------------------------
/INT8_GPT2/config/eval_gpt2_medium.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/config/eval_gpt2_medium.py


--------------------------------------------------------------------------------
/INT8_GPT2/config/eval_gpt2_xl.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/config/eval_gpt2_xl.py


--------------------------------------------------------------------------------
/INT8_GPT2/config/finetune_shakespeare.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/config/finetune_shakespeare.py


--------------------------------------------------------------------------------
/INT8_GPT2/config/train_gpt2.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/config/train_gpt2.py


--------------------------------------------------------------------------------
/INT8_GPT2/config/train_shakespeare_char.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/config/train_shakespeare_char.py


--------------------------------------------------------------------------------
/INT8_GPT2/configurator.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/configurator.py


--------------------------------------------------------------------------------
/INT8_GPT2/data/openwebtext/prepare.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/data/openwebtext/prepare.py


--------------------------------------------------------------------------------
/INT8_GPT2/data/openwebtext/readme.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/data/openwebtext/readme.md


--------------------------------------------------------------------------------
/INT8_GPT2/data/shakespeare/prepare.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/data/shakespeare/prepare.py


--------------------------------------------------------------------------------
/INT8_GPT2/data/shakespeare/readme.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/data/shakespeare/readme.md


--------------------------------------------------------------------------------
/INT8_GPT2/data/shakespeare_char/prepare.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/data/shakespeare_char/prepare.py


--------------------------------------------------------------------------------
/INT8_GPT2/data/shakespeare_char/readme.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/data/shakespeare_char/readme.md


--------------------------------------------------------------------------------
/INT8_GPT2/model.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/model.py


--------------------------------------------------------------------------------
/INT8_GPT2/qmodel.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/qmodel.py


--------------------------------------------------------------------------------
/INT8_GPT2/sample.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/sample.py


--------------------------------------------------------------------------------
/INT8_GPT2/scaling_laws.ipynb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/scaling_laws.ipynb


--------------------------------------------------------------------------------
/INT8_GPT2/train.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/train.py


--------------------------------------------------------------------------------
/INT8_GPT2/transformer_sizing.ipynb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/INT8_GPT2/transformer_sizing.ipynb


--------------------------------------------------------------------------------
/Jetfire/Linear/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Linear/__init__.py


--------------------------------------------------------------------------------
/Jetfire/Linear/linear_bwd.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Linear/linear_bwd.py


--------------------------------------------------------------------------------
/Jetfire/Linear/linear_fwd.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Linear/linear_fwd.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/__init__.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/add.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/add.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/add_mean_var.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/add_mean_var.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/common.py:
--------------------------------------------------------------------------------
1 | import torch
2 | 
3 | SCALE_MIN_THRES = 5e-5


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/dequantize.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/dequantize.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/dropout_bwd.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/dropout_bwd.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/dropout_fwd.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/dropout_fwd.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/gelu_bwd.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/gelu_bwd.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/gelu_fwd.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/gelu_fwd.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/layernorm.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/layernorm.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/quantize.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/quantize.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/quantize_transpose.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/quantize_transpose.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/testgelu.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/testgelu.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/transpose.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/transpose.py


--------------------------------------------------------------------------------
/Jetfire/Nonlinear/utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/Nonlinear/utils.py


--------------------------------------------------------------------------------
/Jetfire/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/Jetfire/__init__.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/QBlockLinear.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/QBlockLinear.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/bindings.cpp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/bindings.cpp


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/hgelu.cu:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/hgemm.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/hgemm.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BasicInt8Gemm.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BasicInt8Gemm.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputFp.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputFp.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantize.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantize.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantizeBiasRowCol.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantizeBiasRowCol.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantizeBiasRowRow.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantizeBiasRowRow.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantizeStochastic.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantizeStochastic.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantizeTrash.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/igemm/igemm_BlockSquare32OutputIntQuantizeTrash.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/include/common.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/include/common.h


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/include/hgelu.h:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/include/hgemm.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/include/hgemm.h


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/include/igelu.h:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/JetfireGEMMKernel/BlockQuantize/cpp_extension/include/igemm.h:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/BlockQuantize/cpp_extension/include/igemm.h


--------------------------------------------------------------------------------
/JetfireGEMMKernel/benchmark/benchmark.ipynb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/benchmark/benchmark.ipynb


--------------------------------------------------------------------------------
/JetfireGEMMKernel/benchmark/benchmark_fp.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/benchmark/benchmark_fp.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/benchmark/benchmark_ours.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/benchmark/benchmark_ours.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/benchmark/result/DQInt8Fp/result.npy:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/benchmark/result/DQInt8Fp/result.npy


--------------------------------------------------------------------------------
/JetfireGEMMKernel/benchmark/result/torch-16/result.npy:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/benchmark/result/torch-16/result.npy


--------------------------------------------------------------------------------
/JetfireGEMMKernel/benchmark/result/torch-32/result.npy:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/benchmark/result/torch-32/result.npy


--------------------------------------------------------------------------------
/JetfireGEMMKernel/benchmark/transpose_speed.ipynb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/benchmark/transpose_speed.ipynb


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm/compute:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm/compute


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm/compute.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm/compute.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm/makefile:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm/makefile


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/A.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/A.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/B.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/B.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/CPU.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/CPU.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/GPU.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/GPU.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/compute:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/compute


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/compute.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/compute.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/makefile:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BasicInt8Gemm_128_128_32/makefile


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/CPU.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/CPU.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/GPU.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/GPU.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/compute:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/compute


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/compute.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/compute.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/makefile:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_BlockSquare32OutputFp/makefile


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp/compute:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp/compute


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp/compute.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp/compute.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp/makefile:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp/makefile


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/A.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/A.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/B.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/B.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/CPU.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/CPU.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/GPU.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/GPU.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/compute:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/compute


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/compute.cu:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/compute.cu


--------------------------------------------------------------------------------
/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/makefile:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/cppsrc/igemm/igemm_PerBlockRowScaleOutputFp_128_128_32/makefile


--------------------------------------------------------------------------------
/JetfireGEMMKernel/debug.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/debug.txt


--------------------------------------------------------------------------------
/JetfireGEMMKernel/setup.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/setup.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/tests/test_basicint8igemm.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/tests/test_basicint8igemm.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/tests/test_hgemm.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/tests/test_hgemm.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/tests/test_int8igemmOutputFPNoQuantize.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/tests/test_int8igemmOutputFPNoQuantize.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/tests/test_int8igemmoutputIntQuantizeBiasRowCol.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/tests/test_int8igemmoutputIntQuantizeBiasRowCol.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/tests/test_int8igemmoutputIntQuantizeBiasRowRow.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/tests/test_int8igemmoutputIntQuantizeBiasRowRow.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/tests/test_int8igemmoutputIntQuantizeDeterministic.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/tests/test_int8igemmoutputIntQuantizeDeterministic.py


--------------------------------------------------------------------------------
/JetfireGEMMKernel/tests/test_int8igemmoutputIntQuantizeStochastic.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/JetfireGEMMKernel/tests/test_int8igemmoutputIntQuantizeStochastic.py


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/thu-ml/Jetfire-INT8Training/HEAD/README.md


--------------------------------------------------------------------------------