{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T15:25:02Z","timestamp":1759332302077,"version":"build-2065373602"},"reference-count":32,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"10","license":[{"start":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T00:00:00Z","timestamp":1759276800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T00:00:00Z","timestamp":1759276800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T00:00:00Z","timestamp":1759276800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62172178","62302182","62302179"],"award-info":[{"award-number":["62172178","62302182","62302179"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Comput.-Aided Des. Integr. Circuits Syst."],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1109\/tcad.2025.3552674","type":"journal-article","created":{"date-parts":[[2025,3,18]],"date-time":"2025-03-18T13:37:17Z","timestamp":1742305037000},"page":"3752-3763","source":"Crossref","is-referenced-by-count":0,"title":["CMD: A Cache-Assisted GPU Memory Deduplication Architecture"],"prefix":"10.1109","volume":"44","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2765-498X","authenticated-orcid":false,"given":"Wei","family":"Zhao","sequence":"first","affiliation":[{"name":"Wuhan National Laboratory for Optoelectronics, Key Laboratory of Information Storage System, Engineering Research Center of Data Storage Systems and Technology, Ministry of Education of China (School of Computer Science and Technology), Huazhong University of Science and Technology, Wuhan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4674-6006","authenticated-orcid":false,"given":"Dan","family":"Feng","sequence":"additional","affiliation":[{"name":"Wuhan National Laboratory for Optoelectronics, Key Laboratory of Information Storage System, Engineering Research Center of Data Storage Systems and Technology, Ministry of Education of China (School of Computer Science and Technology), Huazhong University of Science and Technology, Wuhan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8834-4953","authenticated-orcid":false,"given":"Wei","family":"Tong","sequence":"additional","affiliation":[{"name":"Wuhan National Laboratory for Optoelectronics, Key Laboratory of Information Storage System, Engineering Research Center of Data Storage Systems and Technology, Ministry of Education of China (School of Computer Science and Technology), Huazhong University of Science and Technology, Wuhan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3571-1702","authenticated-orcid":false,"given":"Xueliang","family":"Wei","sequence":"additional","affiliation":[{"name":"Wuhan National Laboratory for Optoelectronics, Key Laboratory of Information Storage System, Engineering Research Center of Data Storage Systems and Technology, Ministry of Education of China (School of Computer Science and Technology), Huazhong University of Science and Technology, Wuhan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5828-8399","authenticated-orcid":false,"given":"Bing","family":"Wu","sequence":"additional","affiliation":[{"name":"Wuhan National Laboratory for Optoelectronics, Key Laboratory of Information Storage System, Engineering Research Center of Data Storage Systems and Technology, Ministry of Education of China (School of Computer Science and Technology), Huazhong University of Science and Technology, Wuhan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2023.3256796"},{"volume-title":"NVIDIA H100 Tensor Core GPU Architecture","year":"2022","key":"ref2"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2022.3169458"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2021.3127148"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3007787.3001163"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2019.00055"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO56248.2022.00029"},{"key":"ref8","first-page":"325","article-title":"Lossless and lossy memory I\/O link compression for improving performance of GPGPU workloads","volume-title":"Proc. 21st Int. Conf. Parallel Archit. Compil. Tech.","author":"Sathish"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA.2016.37"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2018.00017"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00080"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2018.00043"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3445814.3446722"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS.2009.4919648"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00047"},{"volume-title":"Kernel Profiling Guide","year":"2022","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2016.2571298"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/MASS.2003.1194858"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/2398776.2398827"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.17487\/rfc1321"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/LANMAN.2015.7114717"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10071011"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TCSII.2020.3008932"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2012.2185930"},{"volume-title":"Darknet: Open source neural networks in C","year":"2013","author":"Redmon","key":"ref25"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2013.6704684"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2009.5306797"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/2508148.2485964"},{"volume-title":"Compute express link","year":"2019","author":"Sharma","key":"ref29"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3589013.3596678"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3655038.3665953"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA57654.2024.00027"}],"container-title":["IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/43\/11155107\/10930882.pdf?arnumber=10930882","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,30]],"date-time":"2025-09-30T14:26:09Z","timestamp":1759242369000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10930882\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10]]},"references-count":32,"journal-issue":{"issue":"10"},"URL":"https:\/\/doi.org\/10.1109\/tcad.2025.3552674","relation":{},"ISSN":["0278-0070","1937-4151"],"issn-type":[{"type":"print","value":"0278-0070"},{"type":"electronic","value":"1937-4151"}],"subject":[],"published":{"date-parts":[[2025,10]]}}}