├── .gitignore ├── LICENSE ├── README.md ├── examples └── transformers │ ├── language-modeling │ ├── README.md │ ├── config │ │ ├── iterative_unstructured_magnitude_85_config.json │ │ └── iterative_unstructured_magnitude_90_config.json │ ├── dataset_processing.py │ ├── detokenizer.py │ ├── requirements.txt │ └── run_mlm.py │ ├── question-answering │ ├── README.md │ ├── config │ │ ├── iterative_unstructured_magnitude_85_config.json │ │ ├── lock_config.json │ │ └── quantization_config.json │ ├── requirements.txt │ ├── run_qa.py │ ├── trainer_qa.py │ └── utils_qa.py │ └── text-classification │ ├── README.md │ ├── config │ ├── iterative_unstructured_magnitude_85_config.json │ ├── lock_config.json │ └── quantization_config.json │ ├── requirements.txt │ └── run_glue.py ├── model_compression_research ├── __init__.py ├── api_utils.py ├── distiller.py ├── pruning │ ├── __init__.py │ ├── methods │ │ ├── __init__.py │ │ ├── custom_method.py │ │ ├── magnitude_method.py │ │ ├── method.py │ │ ├── methods_utils.py │ │ ├── neural_wiring_method.py │ │ └── pattern_lock.py │ ├── registry.py │ └── schedulers │ │ ├── __init__.py │ │ ├── iterative_scheduler.py │ │ ├── one_shot_scheduler.py │ │ ├── scheduler.py │ │ └── schedulers_utils.py ├── quantization │ ├── __init__.py │ ├── qat.py │ └── quantizer.py └── utils.py ├── requirements.txt ├── research ├── dynamic-tinybert │ ├── README.md │ ├── length_adaptive_transformer │ │ ├── __init__.py │ │ ├── drop_and_restore_utils.py │ │ ├── evolution.py │ │ ├── modeling_bert.py │ │ ├── modeling_distilbert.py │ │ ├── modeling_roberta.py │ │ ├── modeling_utils.py │ │ ├── trainer.py │ │ └── training_args.py │ ├── requirements.txt │ ├── run-sigopt-search.sh │ └── run_squad.py └── prune-once-for-all │ ├── README.md │ ├── student_pruning.sh │ └── teacher_preparation.sh ├── run_tests.sh ├── setup.py └── tests ├── test_custom_method.py ├── test_iterative_scheduler.py ├── test_magnitude_method.py ├── test_methods_utils.py ├── test_neural_wiring_method.py ├── test_one_shot_scheduler.py ├── test_qat.py └── test_quantizer.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/README.md -------------------------------------------------------------------------------- /examples/transformers/language-modeling/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/language-modeling/README.md -------------------------------------------------------------------------------- /examples/transformers/language-modeling/config/iterative_unstructured_magnitude_85_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/language-modeling/config/iterative_unstructured_magnitude_85_config.json -------------------------------------------------------------------------------- /examples/transformers/language-modeling/config/iterative_unstructured_magnitude_90_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/language-modeling/config/iterative_unstructured_magnitude_90_config.json -------------------------------------------------------------------------------- /examples/transformers/language-modeling/dataset_processing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/language-modeling/dataset_processing.py -------------------------------------------------------------------------------- /examples/transformers/language-modeling/detokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/language-modeling/detokenizer.py -------------------------------------------------------------------------------- /examples/transformers/language-modeling/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers 2 | datasets 3 | nltk 4 | -------------------------------------------------------------------------------- /examples/transformers/language-modeling/run_mlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/language-modeling/run_mlm.py -------------------------------------------------------------------------------- /examples/transformers/question-answering/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/question-answering/README.md -------------------------------------------------------------------------------- /examples/transformers/question-answering/config/iterative_unstructured_magnitude_85_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/question-answering/config/iterative_unstructured_magnitude_85_config.json -------------------------------------------------------------------------------- /examples/transformers/question-answering/config/lock_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/question-answering/config/lock_config.json -------------------------------------------------------------------------------- /examples/transformers/question-answering/config/quantization_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/question-answering/config/quantization_config.json -------------------------------------------------------------------------------- /examples/transformers/question-answering/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers 2 | tqdm 3 | scikit-learn 4 | datasets 5 | -------------------------------------------------------------------------------- /examples/transformers/question-answering/run_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/question-answering/run_qa.py -------------------------------------------------------------------------------- /examples/transformers/question-answering/trainer_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/question-answering/trainer_qa.py -------------------------------------------------------------------------------- /examples/transformers/question-answering/utils_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/question-answering/utils_qa.py -------------------------------------------------------------------------------- /examples/transformers/text-classification/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/text-classification/README.md -------------------------------------------------------------------------------- /examples/transformers/text-classification/config/iterative_unstructured_magnitude_85_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/text-classification/config/iterative_unstructured_magnitude_85_config.json -------------------------------------------------------------------------------- /examples/transformers/text-classification/config/lock_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/text-classification/config/lock_config.json -------------------------------------------------------------------------------- /examples/transformers/text-classification/config/quantization_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/text-classification/config/quantization_config.json -------------------------------------------------------------------------------- /examples/transformers/text-classification/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers 2 | tqdm 3 | scikit-learn 4 | datasets 5 | 6 | -------------------------------------------------------------------------------- /examples/transformers/text-classification/run_glue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/examples/transformers/text-classification/run_glue.py -------------------------------------------------------------------------------- /model_compression_research/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/__init__.py -------------------------------------------------------------------------------- /model_compression_research/api_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/api_utils.py -------------------------------------------------------------------------------- /model_compression_research/distiller.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/distiller.py -------------------------------------------------------------------------------- /model_compression_research/pruning/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/__init__.py -------------------------------------------------------------------------------- /model_compression_research/pruning/methods/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/methods/__init__.py -------------------------------------------------------------------------------- /model_compression_research/pruning/methods/custom_method.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/methods/custom_method.py -------------------------------------------------------------------------------- /model_compression_research/pruning/methods/magnitude_method.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/methods/magnitude_method.py -------------------------------------------------------------------------------- /model_compression_research/pruning/methods/method.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/methods/method.py -------------------------------------------------------------------------------- /model_compression_research/pruning/methods/methods_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/methods/methods_utils.py -------------------------------------------------------------------------------- /model_compression_research/pruning/methods/neural_wiring_method.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/methods/neural_wiring_method.py -------------------------------------------------------------------------------- /model_compression_research/pruning/methods/pattern_lock.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/methods/pattern_lock.py -------------------------------------------------------------------------------- /model_compression_research/pruning/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/registry.py -------------------------------------------------------------------------------- /model_compression_research/pruning/schedulers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/schedulers/__init__.py -------------------------------------------------------------------------------- /model_compression_research/pruning/schedulers/iterative_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/schedulers/iterative_scheduler.py -------------------------------------------------------------------------------- /model_compression_research/pruning/schedulers/one_shot_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/schedulers/one_shot_scheduler.py -------------------------------------------------------------------------------- /model_compression_research/pruning/schedulers/scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/schedulers/scheduler.py -------------------------------------------------------------------------------- /model_compression_research/pruning/schedulers/schedulers_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/pruning/schedulers/schedulers_utils.py -------------------------------------------------------------------------------- /model_compression_research/quantization/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/quantization/__init__.py -------------------------------------------------------------------------------- /model_compression_research/quantization/qat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/quantization/qat.py -------------------------------------------------------------------------------- /model_compression_research/quantization/quantizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/quantization/quantizer.py -------------------------------------------------------------------------------- /model_compression_research/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/model_compression_research/utils.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | torch 2 | numpy 3 | -------------------------------------------------------------------------------- /research/dynamic-tinybert/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/README.md -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/__init__.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/drop_and_restore_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/drop_and_restore_utils.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/evolution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/evolution.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/modeling_bert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/modeling_bert.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/modeling_distilbert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/modeling_distilbert.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/modeling_roberta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/modeling_roberta.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/modeling_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/modeling_utils.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/trainer.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/length_adaptive_transformer/training_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/length_adaptive_transformer/training_args.py -------------------------------------------------------------------------------- /research/dynamic-tinybert/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/requirements.txt -------------------------------------------------------------------------------- /research/dynamic-tinybert/run-sigopt-search.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/run-sigopt-search.sh -------------------------------------------------------------------------------- /research/dynamic-tinybert/run_squad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/dynamic-tinybert/run_squad.py -------------------------------------------------------------------------------- /research/prune-once-for-all/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/prune-once-for-all/README.md -------------------------------------------------------------------------------- /research/prune-once-for-all/student_pruning.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/prune-once-for-all/student_pruning.sh -------------------------------------------------------------------------------- /research/prune-once-for-all/teacher_preparation.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/research/prune-once-for-all/teacher_preparation.sh -------------------------------------------------------------------------------- /run_tests.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/run_tests.sh -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/setup.py -------------------------------------------------------------------------------- /tests/test_custom_method.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/tests/test_custom_method.py -------------------------------------------------------------------------------- /tests/test_iterative_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/tests/test_iterative_scheduler.py -------------------------------------------------------------------------------- /tests/test_magnitude_method.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/tests/test_magnitude_method.py -------------------------------------------------------------------------------- /tests/test_methods_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/tests/test_methods_utils.py -------------------------------------------------------------------------------- /tests/test_neural_wiring_method.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/tests/test_neural_wiring_method.py -------------------------------------------------------------------------------- /tests/test_one_shot_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/tests/test_one_shot_scheduler.py -------------------------------------------------------------------------------- /tests/test_qat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/tests/test_qat.py -------------------------------------------------------------------------------- /tests/test_quantizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/IntelLabs/Model-Compression-Research-Package/HEAD/tests/test_quantizer.py --------------------------------------------------------------------------------