├── LICENSE ├── README.md ├── doc ├── CONTRIBUTING.md ├── README.md ├── fig │ ├── flashNorm_fig1.pdf │ ├── flashNorm_fig1.svg │ ├── flashNorm_fig2.pdf │ ├── flashNorm_fig3.pdf │ ├── flashNorm_fig4.pdf │ ├── flashNorm_fig5.pdf │ ├── flashNorm_fig6.pdf │ ├── flashNorm_fig7.pdf │ ├── flashNorm_fig8.pdf │ ├── flashNorm_figA.pdf │ ├── flashNorm_figB.pdf │ ├── matShrink_fig1.pdf │ ├── matShrink_fig2.pdf │ ├── matShrink_fig3.pdf │ ├── precomp1stLayer_fig1.pdf │ ├── precomp1stLayer_fig2.pdf │ ├── removeWeights_fig1.pdf │ ├── removeWeights_fig2.pdf │ ├── removeWeights_fig3.pdf │ ├── removeWeights_fig4.pdf │ ├── slimAttn_fig1.pdf │ ├── slimAttn_fig1.svg │ ├── slimAttn_fig2.pdf │ ├── slimAttn_fig3.pdf │ ├── slimAttn_fig4.pdf │ ├── slimAttn_fig5.pdf │ ├── slimAttn_fig6.pdf │ └── slimAttn_fig7.pdf ├── flashNorm.md ├── flashNorm.pdf ├── matShrink.pdf ├── precomp1stLayer.pdf ├── removeWeights.pdf ├── slimAttn.md └── slimAttn.pdf ├── flashNorm_example.py ├── flashNorm_modeling_llama.py ├── flashNorm_test.py ├── notebooks ├── README.md ├── flashNorm_example.ipynb ├── flashNorm_paper.ipynb ├── removeWeights_paper.ipynb ├── slimAttn_paper.ipynb └── update_packages.ipynb ├── pyproject.toml ├── requirements.txt ├── slimAttn_paper.py ├── tex ├── README.md ├── arxiv.sty ├── clean ├── flashNorm.tex ├── matShrink.tex ├── matShrink_Sid.tex ├── neurips_2025.sty ├── neurips_2025_mods.sty ├── precomp1stLayer.tex ├── references.bib ├── removeWeights.tex ├── run ├── slimAttn.tex └── submit ├── transformer_tricks.py └── util ├── .aspell ├── clean_all ├── gen_notebooks ├── gen_pdf ├── push_pypi └── spell_check /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/README.md -------------------------------------------------------------------------------- /doc/CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/CONTRIBUTING.md -------------------------------------------------------------------------------- /doc/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/README.md -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig1.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig1.svg -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig2.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig3.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig3.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig4.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig4.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig5.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig5.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig6.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig6.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig7.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig7.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_fig8.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_fig8.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_figA.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_figA.pdf -------------------------------------------------------------------------------- /doc/fig/flashNorm_figB.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/flashNorm_figB.pdf -------------------------------------------------------------------------------- /doc/fig/matShrink_fig1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/matShrink_fig1.pdf -------------------------------------------------------------------------------- /doc/fig/matShrink_fig2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/matShrink_fig2.pdf -------------------------------------------------------------------------------- /doc/fig/matShrink_fig3.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/matShrink_fig3.pdf -------------------------------------------------------------------------------- /doc/fig/precomp1stLayer_fig1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/precomp1stLayer_fig1.pdf -------------------------------------------------------------------------------- /doc/fig/precomp1stLayer_fig2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/precomp1stLayer_fig2.pdf -------------------------------------------------------------------------------- /doc/fig/removeWeights_fig1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/removeWeights_fig1.pdf -------------------------------------------------------------------------------- /doc/fig/removeWeights_fig2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/removeWeights_fig2.pdf -------------------------------------------------------------------------------- /doc/fig/removeWeights_fig3.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/removeWeights_fig3.pdf -------------------------------------------------------------------------------- /doc/fig/removeWeights_fig4.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/removeWeights_fig4.pdf -------------------------------------------------------------------------------- /doc/fig/slimAttn_fig1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/slimAttn_fig1.pdf -------------------------------------------------------------------------------- /doc/fig/slimAttn_fig1.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/slimAttn_fig1.svg -------------------------------------------------------------------------------- /doc/fig/slimAttn_fig2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/slimAttn_fig2.pdf -------------------------------------------------------------------------------- /doc/fig/slimAttn_fig3.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/slimAttn_fig3.pdf -------------------------------------------------------------------------------- /doc/fig/slimAttn_fig4.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/slimAttn_fig4.pdf -------------------------------------------------------------------------------- /doc/fig/slimAttn_fig5.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/slimAttn_fig5.pdf -------------------------------------------------------------------------------- /doc/fig/slimAttn_fig6.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/slimAttn_fig6.pdf -------------------------------------------------------------------------------- /doc/fig/slimAttn_fig7.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/fig/slimAttn_fig7.pdf -------------------------------------------------------------------------------- /doc/flashNorm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/flashNorm.md -------------------------------------------------------------------------------- /doc/flashNorm.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/flashNorm.pdf -------------------------------------------------------------------------------- /doc/matShrink.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/matShrink.pdf -------------------------------------------------------------------------------- /doc/precomp1stLayer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/precomp1stLayer.pdf -------------------------------------------------------------------------------- /doc/removeWeights.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/removeWeights.pdf -------------------------------------------------------------------------------- /doc/slimAttn.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/slimAttn.md -------------------------------------------------------------------------------- /doc/slimAttn.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/doc/slimAttn.pdf -------------------------------------------------------------------------------- /flashNorm_example.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/flashNorm_example.py -------------------------------------------------------------------------------- /flashNorm_modeling_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/flashNorm_modeling_llama.py -------------------------------------------------------------------------------- /flashNorm_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/flashNorm_test.py -------------------------------------------------------------------------------- /notebooks/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/notebooks/README.md -------------------------------------------------------------------------------- /notebooks/flashNorm_example.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/notebooks/flashNorm_example.ipynb -------------------------------------------------------------------------------- /notebooks/flashNorm_paper.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/notebooks/flashNorm_paper.ipynb -------------------------------------------------------------------------------- /notebooks/removeWeights_paper.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/notebooks/removeWeights_paper.ipynb -------------------------------------------------------------------------------- /notebooks/slimAttn_paper.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/notebooks/slimAttn_paper.ipynb -------------------------------------------------------------------------------- /notebooks/update_packages.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/notebooks/update_packages.ipynb -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/pyproject.toml -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/requirements.txt -------------------------------------------------------------------------------- /slimAttn_paper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/slimAttn_paper.py -------------------------------------------------------------------------------- /tex/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/README.md -------------------------------------------------------------------------------- /tex/arxiv.sty: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/arxiv.sty -------------------------------------------------------------------------------- /tex/clean: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/clean -------------------------------------------------------------------------------- /tex/flashNorm.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/flashNorm.tex -------------------------------------------------------------------------------- /tex/matShrink.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/matShrink.tex -------------------------------------------------------------------------------- /tex/matShrink_Sid.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/matShrink_Sid.tex -------------------------------------------------------------------------------- /tex/neurips_2025.sty: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/neurips_2025.sty -------------------------------------------------------------------------------- /tex/neurips_2025_mods.sty: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/neurips_2025_mods.sty -------------------------------------------------------------------------------- /tex/precomp1stLayer.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/precomp1stLayer.tex -------------------------------------------------------------------------------- /tex/references.bib: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/references.bib -------------------------------------------------------------------------------- /tex/removeWeights.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/removeWeights.tex -------------------------------------------------------------------------------- /tex/run: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/run -------------------------------------------------------------------------------- /tex/slimAttn.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/slimAttn.tex -------------------------------------------------------------------------------- /tex/submit: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/tex/submit -------------------------------------------------------------------------------- /transformer_tricks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/transformer_tricks.py -------------------------------------------------------------------------------- /util/.aspell: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/util/.aspell -------------------------------------------------------------------------------- /util/clean_all: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/util/clean_all -------------------------------------------------------------------------------- /util/gen_notebooks: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/util/gen_notebooks -------------------------------------------------------------------------------- /util/gen_pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/util/gen_pdf -------------------------------------------------------------------------------- /util/push_pypi: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/util/push_pypi -------------------------------------------------------------------------------- /util/spell_check: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenMachine-ai/transformer-tricks/HEAD/util/spell_check --------------------------------------------------------------------------------