{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,3]],"date-time":"2025-07-03T04:14:35Z","timestamp":1751516075091,"version":"3.41.0"},"reference-count":22,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,4,14]],"date-time":"2024-04-14T00:00:00Z","timestamp":1713052800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,4,14]],"date-time":"2024-04-14T00:00:00Z","timestamp":1713052800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,4,14]]},"DOI":"10.1109\/icassp48485.2024.10446809","type":"proceedings-article","created":{"date-parts":[[2024,3,18]],"date-time":"2024-03-18T18:56:31Z","timestamp":1710788191000},"page":"2905-2909","source":"Crossref","is-referenced-by-count":0,"title":["Bandwidth-Efficient Inference for Nerual Image Compression"],"prefix":"10.1109","author":[{"given":"Shanzhi","family":"Yin","sequence":"first","affiliation":[{"name":"Institute for AI Industry Research (AIR), Tsinghua University"}]},{"given":"Tongda","family":"Xu","sequence":"additional","affiliation":[{"name":"Institute for AI Industry Research (AIR), Tsinghua University"}]},{"given":"Yongsheng","family":"Liang","sequence":"additional","affiliation":[{"name":"Harbin Institute of Technology (Shenzhen)"}]},{"given":"Yuanyuan","family":"Wang","sequence":"additional","affiliation":[{"name":"SenseTime Research"}]},{"given":"Yanghao","family":"Li","sequence":"additional","affiliation":[{"name":"Institute for AI Industry Research (AIR), Tsinghua University"}]},{"given":"Yan","family":"Wang","sequence":"additional","affiliation":[{"name":"Institute for AI Industry Research (AIR), Tsinghua University"}]},{"given":"Jingjing","family":"Liu","sequence":"additional","affiliation":[{"name":"Institute for AI Industry Research (AIR), Tsinghua University"}]}],"member":"263","reference":[{"key":"ref1","first-page":"0","article-title":"Deep residual learning for image compression","volume-title":"CVPR Workshops","author":"Cheng"},{"article-title":"Scale-sim: Systolic cnn accelerator simulator","year":"2018","author":"Samajdar","key":"ref2"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2018.00017"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/DCC50243.2021.00033"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC.2014.6757323"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00881"},{"article-title":"Lilnetx: Lightweight networks with extreme model compression and structured sparsification","year":"2022","author":"Girish","key":"ref7"},{"article-title":"Scalable model compression by entropy penalized reparameterization","year":"2019","author":"Oktay","key":"ref8"},{"article-title":"Variational image compression with a scale hyperprior","year":"2018","author":"Ball\u00e9","key":"ref9"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00725"},{"article-title":"Deep compression: Compressing deep neural networks with pruning, trained quantization and huffman coding","year":"2015","author":"Han","key":"ref11"},{"key":"ref12","first-page":"2","article-title":"Efficient inference with tensorrt","volume-title":"GPU Technology Conference","volume":"1","author":"Vanholder"},{"article-title":"Learning n: m fine-grained structured sparse neural networks from scratch","year":"2021","author":"Zhou","key":"ref13"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3084839"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/0020-0190(78)90024-8"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/DCC.1998.672209"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICANMEET.2013.6609386"},{"article-title":"End-to-end optimized image compression","year":"2016","author":"Ball\u00e9","key":"ref18"},{"article-title":"Estimating or propagating gradients through stochastic neurons for conditional computation","year":"2013","author":"Bengio","key":"ref19"},{"article-title":"Compressai: a pytorch library and evaluation platform for end-to-end compression research","year":"2020","author":"B\u00e9gaint","key":"ref20"},{"article-title":"Simple rans encoder\/decoder","year":"2014","author":"Giesen","key":"ref21"},{"key":"ref22","article-title":"Calculation of average psnr differences between rd-curves","author":"Bjontegaard","year":"2001","journal-title":"VCEG-M33"}],"event":{"name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2024,4,14]]},"location":"Seoul, Korea, Republic of","end":{"date-parts":[[2024,4,19]]}},"container-title":["ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10445798\/10445803\/10446809.pdf?arnumber=10446809","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,2]],"date-time":"2025-07-02T17:39:37Z","timestamp":1751477977000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10446809\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,14]]},"references-count":22,"URL":"https:\/\/doi.org\/10.1109\/icassp48485.2024.10446809","relation":{},"subject":[],"published":{"date-parts":[[2024,4,14]]}}}