├── .gitignore ├── README.md ├── llama.py ├── llama_model.py ├── llama_tokenizer.py ├── modelutils.py ├── opt.py ├── pythia.py ├── quant.py ├── retrain ├── prune_utils.py └── train.py ├── rwkv.py └── smart_compressors.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/README.md -------------------------------------------------------------------------------- /llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/llama.py -------------------------------------------------------------------------------- /llama_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/llama_model.py -------------------------------------------------------------------------------- /llama_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/llama_tokenizer.py -------------------------------------------------------------------------------- /modelutils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/modelutils.py -------------------------------------------------------------------------------- /opt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/opt.py -------------------------------------------------------------------------------- /pythia.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/pythia.py -------------------------------------------------------------------------------- /quant.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/quant.py -------------------------------------------------------------------------------- /retrain/prune_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/retrain/prune_utils.py -------------------------------------------------------------------------------- /retrain/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/retrain/train.py -------------------------------------------------------------------------------- /rwkv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/rwkv.py -------------------------------------------------------------------------------- /smart_compressors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NolanoOrg/sparse_quant_llms/HEAD/smart_compressors.py --------------------------------------------------------------------------------