{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:23:57Z","timestamp":1750220637010,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":17,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,9,28]],"date-time":"2020-09-28T00:00:00Z","timestamp":1601251200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,9,28]]},"DOI":"10.1145\/3422575.3422805","type":"proceedings-article","created":{"date-parts":[[2021,3,22]],"date-time":"2021-03-22T01:43:40Z","timestamp":1616377420000},"page":"335-340","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Neural Network Weight Compression with NNW-BDI"],"prefix":"10.1145","author":[{"given":"Andrei","family":"Bersatti","sequence":"first","affiliation":[{"name":"Georgia Institute of Technology, United States"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nima","family":"Shoghi Ghalehshahi","sequence":"additional","affiliation":[{"name":"Georgia Institute of Technology, United States"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hyesoon","family":"Kim","sequence":"additional","affiliation":[{"name":"Georgia Institute of Technology, United States"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2021,3,21]]},"reference":[{"volume-title":"LATTE-CC: Latency Tolerance Aware Adaptive Cache Compression Management for Energy Efficient GPUs. In 2018 IEEE International Symposium on High Performance Computer Architecture (HPCA). 221\u2013234","author":"Arunkumar A.","key":"e_1_3_2_1_1_1"},{"volume-title":"Jonathan Frankle, and John Guttag.","year":"2020","author":"Blalock Davis","key":"e_1_3_2_1_2_1"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.5555\/2969442.2969588"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00075"},{"volume-title":"2017 IEEE 12th International Conference on ASIC (ASICON). 68\u201371","author":"Fang Y.","key":"e_1_3_2_1_5_1"},{"volume-title":"2016 IEEE International Solid-State Circuits Conference (ISSCC). 82\u201383","author":"Gautschi M.","key":"e_1_3_2_1_6_1"},{"key":"e_1_3_2_1_7_1","unstructured":"Suyog Gupta Ankur Agrawal Kailash Gopalakrishnan and Pritish Narayanan. 2015. Deep Learning with Limited Numerical Precision. CoRR abs\/1502.02551(2015). arxiv:1502.02551http:\/\/arxiv.org\/abs\/1502.02551  Suyog Gupta Ankur Agrawal Kailash Gopalakrishnan and Pritish Narayanan. 2015. Deep Learning with Limited Numerical Precision. CoRR abs\/1502.02551(2015). arxiv:1502.02551http:\/\/arxiv.org\/abs\/1502.02551"},{"volume-title":"CRANIA: Unlocking Data and Value Reuse in Iterative Neural Network Architectures. In 2020 25th Asia and South Pacific Design Automation Conference (ASP-DAC). 295\u2013300","year":"2020","author":"Hemmat M.","key":"e_1_3_2_1_8_1"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2018.00034"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA.2018.00070"},{"volume-title":"PyTorch: An Imperative Style","author":"Paszke Adam","key":"e_1_3_2_1_11_1"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/2540708.2540724"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/2370816.2370870"},{"volume-title":"Accuracy and Performance Trade-Offs of Logarithmic Number Units in Multi-Core Clusters. In 2016 IEEE 23nd Symposium on Computer Arithmetic (ARITH). 95\u2013103","author":"Schaffner M.","key":"e_1_3_2_1_14_1"},{"key":"e_1_3_2_1_15_1","unstructured":"Wonyong Sung Sungho Shin and Kyuyeon Hwang. 2015. Resiliency of Deep Neural Networks under Quantization. ArXiv abs\/1511.06488(2015).  Wonyong Sung Sungho Shin and Kyuyeon Hwang. 2015. Resiliency of Deep Neural Networks under Quantization. ArXiv abs\/1511.06488(2015)."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/30.125072"},{"volume-title":"Enabling Transparent Memory-Compression for Commodity Memory Systems. In 2019 IEEE International Symposium on High Performance Computer Architecture (HPCA). 570\u2013581","year":"2019","author":"Young V.","key":"e_1_3_2_1_17_1"}],"event":{"name":"MEMSYS 2020: The International Symposium on Memory Systems","acronym":"MEMSYS 2020","location":"Washington DC USA"},"container-title":["The International Symposium on Memory Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3422575.3422805","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3422575.3422805","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T22:01:55Z","timestamp":1750197715000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3422575.3422805"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,9,28]]},"references-count":17,"alternative-id":["10.1145\/3422575.3422805","10.1145\/3422575"],"URL":"https:\/\/doi.org\/10.1145\/3422575.3422805","relation":{},"subject":[],"published":{"date-parts":[[2020,9,28]]},"assertion":[{"value":"2021-03-21","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}