├── .gitignore ├── LICENSE ├── README.md ├── compute_quant_error.py ├── image_net.py ├── models ├── __init__.py ├── mobilenet_v2.py ├── mobilenet_v2_quantized.py └── resnet_quantized.py ├── quantization ├── __init__.py ├── autoquant_utils.py ├── base_quantized_classes.py ├── base_quantized_model.py ├── hijacker.py ├── quant_error_estimator.py ├── quantization_manager.py ├── quantized_folded_bn.py ├── quantizers │ ├── __init__.py │ ├── base_quantizers.py │ ├── fp8_quantizer.py │ ├── rounding_utils.py │ ├── uniform_quantizers.py │ └── utils.py ├── range_estimators.py └── utils.py ├── requirements.txt └── utils ├── __init__.py ├── click_options.py ├── distributions.py ├── grid.py ├── imagenet_dataloaders.py ├── optimizer_utils.py ├── qat_utils.py ├── stopwatch.py ├── supervised_driver.py └── utils.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/README.md -------------------------------------------------------------------------------- /compute_quant_error.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/compute_quant_error.py -------------------------------------------------------------------------------- /image_net.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/image_net.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/models/__init__.py -------------------------------------------------------------------------------- /models/mobilenet_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/models/mobilenet_v2.py -------------------------------------------------------------------------------- /models/mobilenet_v2_quantized.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/models/mobilenet_v2_quantized.py -------------------------------------------------------------------------------- /models/resnet_quantized.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/models/resnet_quantized.py -------------------------------------------------------------------------------- /quantization/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/__init__.py -------------------------------------------------------------------------------- /quantization/autoquant_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/autoquant_utils.py -------------------------------------------------------------------------------- /quantization/base_quantized_classes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/base_quantized_classes.py -------------------------------------------------------------------------------- /quantization/base_quantized_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/base_quantized_model.py -------------------------------------------------------------------------------- /quantization/hijacker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/hijacker.py -------------------------------------------------------------------------------- /quantization/quant_error_estimator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quant_error_estimator.py -------------------------------------------------------------------------------- /quantization/quantization_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quantization_manager.py -------------------------------------------------------------------------------- /quantization/quantized_folded_bn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quantized_folded_bn.py -------------------------------------------------------------------------------- /quantization/quantizers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quantizers/__init__.py -------------------------------------------------------------------------------- /quantization/quantizers/base_quantizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quantizers/base_quantizers.py -------------------------------------------------------------------------------- /quantization/quantizers/fp8_quantizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quantizers/fp8_quantizer.py -------------------------------------------------------------------------------- /quantization/quantizers/rounding_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quantizers/rounding_utils.py -------------------------------------------------------------------------------- /quantization/quantizers/uniform_quantizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quantizers/uniform_quantizers.py -------------------------------------------------------------------------------- /quantization/quantizers/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/quantizers/utils.py -------------------------------------------------------------------------------- /quantization/range_estimators.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/range_estimators.py -------------------------------------------------------------------------------- /quantization/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/quantization/utils.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/requirements.txt -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/__init__.py -------------------------------------------------------------------------------- /utils/click_options.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/click_options.py -------------------------------------------------------------------------------- /utils/distributions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/distributions.py -------------------------------------------------------------------------------- /utils/grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/grid.py -------------------------------------------------------------------------------- /utils/imagenet_dataloaders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/imagenet_dataloaders.py -------------------------------------------------------------------------------- /utils/optimizer_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/optimizer_utils.py -------------------------------------------------------------------------------- /utils/qat_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/qat_utils.py -------------------------------------------------------------------------------- /utils/stopwatch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/stopwatch.py -------------------------------------------------------------------------------- /utils/supervised_driver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/supervised_driver.py -------------------------------------------------------------------------------- /utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Qualcomm-AI-research/FP8-quantization/HEAD/utils/utils.py --------------------------------------------------------------------------------