{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T05:50:27Z","timestamp":1763704227611,"version":"3.45.0"},"reference-count":46,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T00:00:00Z","timestamp":1761436800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T00:00:00Z","timestamp":1761436800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,26]]},"DOI":"10.1109\/iccad66269.2025.11240626","type":"proceedings-article","created":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T18:39:34Z","timestamp":1763663974000},"page":"1-9","source":"Crossref","is-referenced-by-count":0,"title":["RTPU: Unifying Non-Private and Private Inference with Reconfigurable Architecture"],"prefix":"10.1109","author":[{"given":"Fuping","family":"Li","sequence":"first","affiliation":[{"name":"Institute of Computing Technology, CAS,SKLP"}]},{"given":"Ying","family":"Wang","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, CAS,CICS"}]},{"given":"Yinghao","family":"Yang","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, CAS,SKLP"}]},{"given":"Jingxuan","family":"Li","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, CAS,CICS"}]},{"given":"Yibo","family":"Du","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, CAS,CICS"}]},{"given":"Huawei","family":"Li","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, CAS,SKLP"}]},{"given":"Yinhe","family":"Han","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, CAS,CICS"}]},{"given":"Hang","family":"Lu","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, CAS,SKLP"}]},{"given":"Xiaowei","family":"Li","sequence":"additional","affiliation":[{"name":"Institute of Computing Technology, CAS,SKLP"}]}],"member":"263","reference":[{"key":"ref1","first-page":"945","article-title":"{MLaaS} in the wild: Workload analysis and scheduling in {Large-Scale} heterogeneous {GPU} clusters","volume-title":"19th USENIX Symposium on Networked Systems Design and Implementation (NSDI 22)","author":"Weng"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/3587135.3592169"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3561800"},{"article-title":"Enable fully homomorphic encryption with amazon sagemaker endpoints for secure, real-time inferencing","year":"2023","author":"d\u2019Aliberti","key":"ref4"},{"article-title":"The ultimate tool for data privacy: Fully homomorphic encryption","year":"2022","author":"Soceanu","key":"ref5"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA52012.2021.00010"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589053"},{"article-title":"As chip design costs skyrocket, 3nm process node is in jeopardy","year":"2018","author":"Hruska","key":"ref8"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10071017"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10070984"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO56248.2022.00086"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA47549.2020.00027"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO50266.2020.00062"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.3390\/electronics13152988"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA51647.2021.00013"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3386977"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3649329.3657331"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/seed61283.2024.00022"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/3649329.3657321"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICPP.2016.15"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/HCS49909.2020.9220735"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-70694-8_15"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527415"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2022.3205552"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3466752.3480070"},{"key":"ref26","first-page":"559","article-title":"Alpa: Automating inter-and {Intra-Operator} parallelism for distributed deep learning","volume-title":"16th USENIX Symposium on Operating Systems Design and Implementation","author":"Zheng"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ASP-DAC52403.2022.9712485"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.46586\/tches.v2020.i2.49-72"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2024.3398500"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2017.2677426"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-47721-7_24"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/s10766-015-0366-5"},{"key":"ref33","first-page":"685","article-title":"Mad: Memory-aware design techniques for accelerating fully homomorphic encryption","volume-title":"Proceedings of the 56th Annual IEEE\/ACM International Symposium on Microarchitecture","author":"Agrawal"},{"volume-title":"Principles and practices of interconnection networks","year":"2004","author":"Dally","key":"ref34"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/DATE.2004.1269002"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2020.3012215"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3520142"},{"article-title":"High Bandwidth Memory DRAM","volume-title":"Technical Report JESD235D","year":"2021","key":"ref38"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICCAD.2017.8203889"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/NOCS.2012.31"},{"key":"ref41","first-page":"6993","article-title":"{DaCapo}: Automatic bootstrapping management for efficient fully homomorphic encryption","volume-title":"33rd USENIX Security Symposium (USENIX Security 24)","author":"Cheon"},{"key":"ref42","article-title":"Pytorch: An imperative style, high-performance deep learning library","volume-title":"Advances in neural information processing systems","volume":"32","author":"Paszke"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00045"},{"article-title":"Measuring gpu utilization one level deeper","year":"2025","author":"Elvinger","key":"ref44"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1145\/3613424.3614279"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/DATE.2009.5090727"}],"event":{"name":"2025 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)","start":{"date-parts":[[2025,10,26]]},"location":"Munich, Germany","end":{"date-parts":[[2025,10,30]]}},"container-title":["2025 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11240608\/11240621\/11240626.pdf?arnumber=11240626","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T05:42:05Z","timestamp":1763703725000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11240626\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,26]]},"references-count":46,"URL":"https:\/\/doi.org\/10.1109\/iccad66269.2025.11240626","relation":{},"subject":[],"published":{"date-parts":[[2025,10,26]]}}}