{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,5]],"date-time":"2025-04-05T11:28:08Z","timestamp":1743852488212},"reference-count":46,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,5,19]],"date-time":"2024-05-19T00:00:00Z","timestamp":1716076800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,5,19]],"date-time":"2024-05-19T00:00:00Z","timestamp":1716076800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,5,19]]},"DOI":"10.1109\/iscas58744.2024.10558100","type":"proceedings-article","created":{"date-parts":[[2024,7,2]],"date-time":"2024-07-02T17:22:52Z","timestamp":1719940972000},"page":"1-5","source":"Crossref","is-referenced-by-count":2,"title":["BitPruning: Learning Bitlengths for Aggressive and Accurate Quantization"],"prefix":"10.1109","author":[{"given":"Milo\u0161","family":"Nikoli\u0107","sequence":"first","affiliation":[{"name":"University of Toronto,Toronto,Canada"}]},{"given":"Ghouthi Boukli","family":"Hacene","sequence":"additional","affiliation":[{"name":"MILA,Montreal,Canada"}]},{"given":"Ciaran","family":"Bannon","sequence":"additional","affiliation":[{"name":"University of Toronto,Toronto,Canada"}]},{"given":"Alberto Delmas","family":"Lascorz","sequence":"additional","affiliation":[{"name":"University of Toronto,Toronto,Canada"}]},{"given":"Matthieu","family":"Courbariaux","sequence":"additional","affiliation":[{"name":"MILA,Montreal,Canada"}]},{"given":"Omar Mohamed","family":"Awad","sequence":"additional","affiliation":[{"name":"University of Toronto,Toronto,Canada"}]},{"given":"Isak","family":"Edo Vivancos","sequence":"additional","affiliation":[{"name":"University of Toronto,Toronto,Canada"}]},{"given":"Yoshua","family":"Bengio","sequence":"additional","affiliation":[{"name":"MILA,Montreal,Canada"}]},{"given":"Vincent","family":"Gripon","sequence":"additional","affiliation":[{"name":"IMT Atlantique, Lab-STICC,Brest,France"}]},{"given":"Andreas","family":"Moshovos","sequence":"additional","affiliation":[{"name":"University of Toronto,Toronto,Canada"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Lower numerical precision deep learning inference and training","author":"Rodriguez","year":"2018","journal-title":"Intel, Tech. Rep."},{"key":"ref2","article-title":"Low precision inference on GPU","author":"Wu","year":"2019","journal-title":"Nvidia, Tech. Rep."},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2016.7783722"},{"key":"ref4","article-title":"Bit Fusion: Bit-level dynamically composable architecture for accelerating deep neural networks","author":"Sharma","year":"2017","journal-title":"CoRR"},{"key":"ref5","first-page":"382","article-title":"Bit-pragmatic deep neural network computing","volume-title":"Proceedings of the 50th Annual IEEE\/ACM International Symposium on Microarchitecture","author":"Albericio"},{"key":"ref6","article-title":"DPRed: Making typical activation values matter in deep learning computing","author":"Lascorz","year":"2017","journal-title":"CoRR"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/DAC.2018.8465915"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/2925426.2926294"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ISCAS.2019.8702332"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/FPL.2018.00059"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA.2018.00012"},{"article-title":"BinaryConnect: Training deep neural networks with binary weights during propagations","year":"2015","author":"Courbariaux","key":"ref12"},{"key":"ref13","article-title":"PACT: parameterized clipping activation for quantized neural networks","author":"Choi","year":"2018","journal-title":"CoRR"},{"key":"ref14","article-title":"Trained uniform quantization for accurate and efficient neural network inference on fixed-point hardware","author":"Jain","year":"2019","journal-title":"CoRR"},{"key":"ref15","article-title":"Learned step size quantization","author":"Esser","year":"2019","journal-title":"CoRR"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00038"},{"article-title":"Reduced-precision strategies for bounded memory in deep neural nets, arXiv:1511.05236v4","year":"2015","author":"Judd","key":"ref17"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS.2019.00030"},{"article-title":"Incremental network quantization: Towards lossless CNNs with low-precision weights","volume-title":"International Conference on Learning Representations","author":"Zhou","key":"ref19"},{"key":"ref20","article-title":"Heterogeneous bitwidth binarization in convolutional neural networks","author":"Fromm","year":"2018","journal-title":"CoRR"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01225-0_36"},{"key":"ref22","article-title":"Mixed precision quantization of convnets via differentiable neural architecture search","author":"Wu","year":"2018","journal-title":"CoRR"},{"key":"ref23","article-title":"ReLeQ: A reinforcement learning approach for deep quantization of neural networks","author":"Elthakeb","year":"2018","journal-title":"CoRR"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00881"},{"key":"ref25","article-title":"Bayesian bits: Unifying quantization and pruning","author":"Baalen","year":"2020","journal-title":"Advances in Neural Information Processing Systems 33"},{"article-title":"BSQ: Exploring bit-level sparsity for mixed-precision neural network quantization","volume-title":"International Conference on Learning Representations","author":"Yang","key":"ref26"},{"key":"ref27","article-title":"Differentiable quantization of deep neural networks","author":"Uhlich","year":"2019","journal-title":"CoRR"},{"article-title":"Estimating or propagating gradients through stochastic neurons for conditional computation","year":"2013","author":"Bengio","key":"ref28"},{"key":"ref29","article-title":"Learning multiple layers of features from tiny images","author":"Krizhevsky","year":"2009","journal-title":"Tech. Rep."},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref31","first-page":"1097","article-title":"ImageNet classification with deep CNNs","volume-title":"NIPS 25","author":"Krizhevsky","year":"2012"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"article-title":"Automatic differentiation in PyTorch","year":"2017","author":"Paszke","key":"ref33"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2018.00474"},{"article-title":"Cacti 6.0: A tool to understand large caches","year":"2007","author":"Muralimanohar","key":"ref35"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2018.8573527"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.544"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.660"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1181"},{"key":"ref40","first-page":"142","article-title":"Learning word vectors for sentiment analysis","volume-title":"Annual Meeting of the ACL: Human Language Technologies","author":"Maas"},{"key":"ref41","article-title":"Semi-supervised classification with graph convolutional networks","author":"Kipf","year":"2016","journal-title":"CoRR"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1609\/aimag.v29i3.2157"},{"article-title":"Simple spectral graph convolution","volume-title":"International Conference on Learning Representations","author":"Zhu","key":"ref43"},{"key":"ref44","article-title":"Deep learning recommendation model for personalization and recommendation systems","author":"Naumov","year":"2019","journal-title":"CoRR"},{"key":"ref45","article-title":"Playing Atari with deep reinforcement learning","author":"Mnih","year":"2013","journal-title":"CoRR"},{"article-title":"OpenAI Gym","year":"2016","author":"Brockman","key":"ref46"}],"event":{"name":"2024 IEEE International Symposium on Circuits and Systems (ISCAS)","start":{"date-parts":[[2024,5,19]]},"location":"Singapore, Singapore","end":{"date-parts":[[2024,5,22]]}},"container-title":["2024 IEEE International Symposium on Circuits and Systems (ISCAS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10557746\/10557828\/10558100.pdf?arnumber=10558100","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,7,3]],"date-time":"2024-07-03T06:20:51Z","timestamp":1719987651000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10558100\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,19]]},"references-count":46,"URL":"https:\/\/doi.org\/10.1109\/iscas58744.2024.10558100","relation":{},"subject":[],"published":{"date-parts":[[2024,5,19]]}}}