@comment{
  Conference paper in the ISCAS 2023 proceedings (portal export, cleaned up).
  Conference name, dates and the copyright line live in eventtitle, eventdate
  and copyright instead of a printed note field.
  NOTE(review): address holds a country as exported; BibTeX expects the
  publisher's city here -- confirm and replace.
}
@inproceedings{503ee73d1f834d408f04e50e5a95457f,
  author     = {Chen, {Po Yuan} and Lin, {Hung Che} and Guo, {Jiun In}},
  title      = {Multi-Scale Dynamic Fixed-Point Quantization and Training for Deep Neural Networks},
  booktitle  = {{ISCAS} 2023 - 56th {IEEE} International Symposium on Circuits and Systems, Proceedings},
  series     = {Proceedings - {IEEE} International Symposium on Circuits and Systems},
  publisher  = {Institute of Electrical and Electronics Engineers Inc.},
  address    = {United States},
  year       = {2023},
  doi        = {10.1109/ISCAS46773.2023.10181358},
  language   = {English},
  eventtitle = {56th {IEEE} International Symposium on Circuits and Systems, {ISCAS} 2023},
  eventdate  = {2023-05-21/2023-05-25},
  copyright  = {{\textcopyright} 2023 IEEE},
  keywords   = {Deep Learning, Dynamic Fixed-Point Quantization, Model Quantization, Multi-Scale Dynamic Fixed-Point Quantization, Object Detection},
  abstract   = {State-of-the-art deep neural networks often require extremely high computational power which results in the deployment of deep neural networks on embedded devices being impractical. Therefore, model quantization is important for the deployment of deep neural networks on edge devices. The purpose of this paper is to quantize the deep neural networks from high-precision to low-precision (e.g. INT8) dynamic fixed-point format at the layer-by-layer level quantization. In addition, we further improve the uniform dynamic fixed-point quantization to multi-scale dynamic fixed-point quantization for lower quantization loss. The proposed multi-scale dynamic fixed-point quantization scheme divides the quantization ranges into two regions, and each region is assigned different quantization levels and quantization parameters to better approximate the bell-shaped distributions. The proposed quantization pipeline is composed of post-training quantization followed by model fine-tuning which can keep the accuracy drop of the quantized model within 1\% mean average precision (mAP). Furthermore, the proposed quantization and fine-tuning method can be combined with model pruning to obtain a compact and accurate deep neural network with low bit-width.},
}