% IJCAI-20 conference paper (main track), pp. 868--875; the canonical identifier is the DOI below.
@inproceedings{ijcai2020p121,
  author    = {Xie, Hongwei and Song, Yafei and Cai, Ling and Li, Mingyang},
  title     = {Overflow Aware Quantization: Accelerating Neural Network Inference by Low-bit Multiply-Accumulate Operations},
  booktitle = {Proceedings of the Twenty-Ninth International Joint Conference on Artificial Intelligence, {IJCAI-20}},
  editor    = {Bessiere, Christian},
  publisher = {International Joint Conferences on Artificial Intelligence Organization},
  pages     = {868--875},
  year      = {2020},
  month     = jul,
  note      = {Main track},
  doi       = {10.24963/ijcai.2020/121},
  url       = {https://doi.org/10.24963/ijcai.2020/121},
}