{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:23:22Z","timestamp":1750220602871,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":26,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,1,18]],"date-time":"2021-01-18T00:00:00Z","timestamp":1610928000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"National Key R&D Program of China","award":["2017YFB1400303"],"award-info":[{"award-number":["2017YFB1400303"]}]},{"name":"National Natural Science Foundation of China","award":["41871245"],"award-info":[{"award-number":["41871245"]}]},{"name":"Beijing Innovation Center for Future Chips"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,1,18]]},"DOI":"10.1145\/3394885.3431512","type":"proceedings-article","created":{"date-parts":[[2021,1,29]],"date-time":"2021-01-29T11:32:48Z","timestamp":1611919968000},"page":"505-511","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Puncturing the memory wall"],"prefix":"10.1145","author":[{"given":"Qin","family":"Li","sequence":"first","affiliation":[{"name":"Dept. of Electronic Engineering and BNRist. Tsinghua University, Beijing, China"}]},{"given":"Peiyan","family":"Dong","sequence":"additional","affiliation":[{"name":"Northeastern University, Boston, MA USA"}]},{"given":"Zijie","family":"Yu","sequence":"additional","affiliation":[{"name":"Dept. of Electronic Engineering and BNRist. Tsinghua University, Beijing, China"}]},{"given":"Changlu","family":"Liu","sequence":"additional","affiliation":[{"name":"Dept. of Electronic Engineering and BNRist. Tsinghua University, Beijing, China"}]},{"given":"Fei","family":"Qiao","sequence":"additional","affiliation":[{"name":"Dept. of Electronic Engineering and BNRist. Tsinghua University, Beijing, China"}]},{"given":"Yanzhi","family":"Wang","sequence":"additional","affiliation":[{"name":"Northeastern University, Boston, MA USA"}]},{"given":"Huazhong","family":"Yang","sequence":"additional","affiliation":[{"name":"Dept. of Electronic Engineering and BNRist. Tsinghua University, Beijing, China"}]}],"member":"320","published-online":{"date-parts":[[2021,1,29]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2017.2752838"},{"volume-title":"Deep Compression: Compressing Deep Neural Networks with Pruning, Trained Quantization and Huffman Coding.\" ICLR","year":"2016","key":"e_1_3_2_1_2_1"},{"volume-title":"an algorithm-hardware co-design framework of dnns using alternating direction methods of multipliers,\" in ASPLOS","year":"2019","author":"Ren A.","key":"e_1_3_2_1_3_1"},{"volume-title":"Toward Extremely Low Bit and Lossless Accuracy in DNNs with Progressive ADMM [J]","year":"2019","author":"Lin","key":"e_1_3_2_1_4_1"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/3174243.3174253"},{"volume-title":"IEEE","year":"2017","author":"Murmann Boris","key":"e_1_3_2_1_6_1"},{"volume-title":"Great Lakes Symposium on VLSI (GLSVLSI).","year":"2019","author":"Lossy Media Data Compression Enabling Approximate","key":"e_1_3_2_1_7_1"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2017.2681738"},{"volume-title":"IEEE","year":"2018","author":"Juan Sebastian","key":"e_1_3_2_1_9_1"},{"volume-title":"Of NIPS","year":"2014","author":"Chung J.","key":"e_1_3_2_1_10_1"},{"volume-title":"International Conference on Learning Representations (ICLR)","year":"2016","author":"Han Song","key":"e_1_3_2_1_11_1"},{"volume-title":"EESEN: End to end speech recognition using deep RNN models and WFST based decoding.\" Automatic Speech Recognition and Understan ding (ASRU)","year":"2015","key":"e_1_3_2_1_12_1"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","unstructured":"Dong P. Wang S. et al. RTMobile: Beyond Real-Time Mobile Acceleration of RNNs for Speech Recognition. arXiv preprint arXiv:2002.11474. (2020)  Dong P. Wang S. et al. RTMobile: Beyond Real-Time Mobile Acceleration of RNNs for Speech Recognition. arXiv preprint arXiv:2002.11474. (2020)","DOI":"10.1109\/DAC18072.2020.9218499"},{"volume-title":"Training low bitwidth convolutional neural networks with low bitwidth gradients.\" arXiv preprint arXiv:1606.06160","year":"2016","key":"e_1_3_2_1_14_1"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00286"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00495"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2019.8851699"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00448"},{"volume-title":"Neural Information Processing Systems (NeurIPS)","year":"2019","author":"Dong Xuanyi","key":"e_1_3_2_1_19_1"},{"volume-title":"Neural Information Processing Systems (NeurIPS)","year":"2018","author":"Zhuang Zhuangwei","key":"e_1_3_2_1_20_1"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00447"},{"key":"e_1_3_2_1_22_1","first-page":"2074","volume-title":"Learning structured sparsity in deep neural networks. In neural information processing systems (NeurIPS)","author":"Wen Wei","year":"2016"},{"volume-title":"Incremental network quantization: Towards lossless cnns with low-precision weights.\" arXiv preprint arXiv:1702.03044","year":"2017","key":"e_1_3_2_1_23_1"},{"volume-title":"Speech and Signal Processing (ICASSP). IEEE","year":"2019","author":"Parcollet Titouan","key":"e_1_3_2_1_24_1"},{"key":"e_1_3_2_1_25_1","first-page":"27403","article-title":"DARPA TIMIT acoustic-phonetic continous speech corpus CD-ROM. NIST speech disc 1-1.1","volume":"93","author":"John","year":"1993","journal-title":"STIN"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3289602.3293898"}],"event":{"name":"ASPDAC '21: 26th Asia and South Pacific Design Automation Conference","sponsor":["SIGDA ACM Special Interest Group on Design Automation","IEEE CAS","IEEE CEDA"],"location":"Tokyo Japan","acronym":"ASPDAC '21"},"container-title":["Proceedings of the 26th Asia and South Pacific Design Automation Conference"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3394885.3431512","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3394885.3431512","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T21:32:02Z","timestamp":1750195922000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3394885.3431512"}},"subtitle":["Joint optimization of network compression with approximate memory for ASR application"],"short-title":[],"issued":{"date-parts":[[2021,1,18]]},"references-count":26,"alternative-id":["10.1145\/3394885.3431512","10.1145\/3394885"],"URL":"https:\/\/doi.org\/10.1145\/3394885.3431512","relation":{},"subject":[],"published":{"date-parts":[[2021,1,18]]},"assertion":[{"value":"2021-01-29","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}