{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T23:20:55Z","timestamp":1780356055064,"version":"3.54.1"},"publisher-location":"New York, NY, USA","reference-count":49,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,6,21]]},"DOI":"10.1145\/3695053.3731408","type":"proceedings-article","created":{"date-parts":[[2025,6,20]],"date-time":"2025-06-20T16:43:11Z","timestamp":1750437791000},"page":"107-121","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":8,"title":["Neo: Towards Efficient Fully Homomorphic Encryption Acceleration using Tensor Core"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-2555-0773","authenticated-orcid":false,"given":"Dian","family":"Jiao","sequence":"first","affiliation":[{"name":"State Key Laboratory of Cyberspace Security Defense, Institute of Information Engineering, CAS, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-2058-5109","authenticated-orcid":false,"given":"Xianglong","family":"Deng","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Cyberspace Security Defense, Institute of Information Engineering, CAS, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8150-1792","authenticated-orcid":false,"given":"Zhiwei","family":"Wang","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Cyberspace Security Defense, Institute of Information Engineering, CAS, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-9160-8540","authenticated-orcid":false,"given":"Shengyu","family":"Fan","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Cyberspace Security Defense, Institute of Information Engineering, CAS, Beijing, China and School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-0108-3708","authenticated-orcid":false,"given":"Yi","family":"Chen","sequence":"additional","affiliation":[{"name":"Huazhong University of Science and Technology, Wuhan, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-9868-5353","authenticated-orcid":false,"given":"Dan","family":"Meng","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Cyberspace Security Defense, Institute of Information Engineering, CAS, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9215-7632","authenticated-orcid":false,"given":"Rui","family":"Hou","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Cyberspace Security Defense, Institute of Information Engineering, CAS, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6440-7550","authenticated-orcid":false,"given":"Mingzhe","family":"Zhang","sequence":"additional","affiliation":[{"name":"Computing System Lab, Ant Group, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2025,6,20]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10070953"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"crossref","unstructured":"Ahmad Al\u00a0Badawi Yuriy Polyakov Khin Mi\u00a0Mi Aung Bharadwaj Veeravalli and Kurt Rohloff. 2019. Implementation and performance evaluation of RNS variants of the BFV homomorphic encryption scheme. IEEE Transactions on Emerging Topics in Computing 9 2 (2019) 941\u2013956.","DOI":"10.1109\/TETC.2019.2902799"},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"crossref","unstructured":"Ahmad Al\u00a0Badawi Bharadwaj Veeravalli Chan\u00a0Fook Mun and Khin Mi\u00a0Mi Aung. 2018. High-performance FV somewhat homomorphic encryption on GPUs: An implementation using CUDA. IACR Transactions on Cryptographic Hardware and Embedded Systems (2018) 70\u201395.","DOI":"10.46586\/tches.v2018.i2.70-95"},{"key":"e_1_3_3_1_5_2","first-page":"423","volume-title":"International Conference on Selected Areas in Cryptography","author":"Bajard Jean-Claude","year":"2016","unstructured":"Jean-Claude Bajard, Julien Eynard, M\u00a0Anwar Hasan, and Vincent Zucca. 2016. A full RNS variant of FV like somewhat homomorphic encryption schemes. In International Conference on Selected Areas in Cryptography. Springer, 423\u2013442."},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"publisher","DOI":"10.1109\/EDTM.2018.8421507"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-32009-5_50"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-10970-7_16"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-70694-8_15"},{"key":"e_1_3_3_1_10_2","unstructured":"Jiyang Dong. 2016. Accelerating BGV scheme of fully homomorphic encryption using GPUs. Ph. D. dissertation (2016)."},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"crossref","unstructured":"Phap\u00a0Ngoc Duong and Hanho Lee. 2023. Pipelined key switching accelerator architecture for CKKS-based fully homomorphic encryption. Sensors 23 10 (2023) 4594.","DOI":"10.3390\/s23104594"},{"key":"e_1_3_3_1_12_2","unstructured":"Shengyu Fan Xianglong Deng Zhuoyu Tian Zhicheng Hu Liang Chang Rui Hou Dan Meng and Mingzhe Zhang. 2024. Taiyi: A high-performance CKKS accelerator for Practical Fully Homomorphic Encryption. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.10188 (2024)."},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10071017"},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/1536414.1536440"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-20465-4_9"},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"crossref","unstructured":"Jia-Zheng Goey Wai-Kong Lee Bok-Min Goi and Wun-She Yap. 2021. Accelerating number theoretic transform in GPU platform for fully homomorphic encryption. The Journal of Supercomputing 77 (2021) 1455\u20131474.","DOI":"10.1007\/s11227-020-03156-7"},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-12612-4_5"},{"key":"e_1_3_3_1_18_2","unstructured":"Kyoohyung Han Seungwan Hong Jung\u00a0Hee Cheon and Daejun Park. 2018. Efficient logistic regression on large encrypted data. Cryptology ePrint Archive (2018)."},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33019466"},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-40186-3_16"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"publisher","DOI":"10.23919\/DATE54114.2022.9774559"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"crossref","unstructured":"Junaid Hassan Danish Shehzad Usman Habib Muhammad\u00a0Umar Aftab Muhammad Ahmad Ramil Kuleev and Manuel Mazzara. 2022. [Retracted] The Rise of Cloud Computing: Data Protection Privacy and Open Research Challenges\u2014A Systematic Literature Review (SLR). Computational intelligence and neuroscience 2022 1 (2022) 8303504.","DOI":"10.1155\/2022\/8303504"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"crossref","unstructured":"Wonkyung Jung Sangpyo Kim Jung\u00a0Ho Ahn Jung\u00a0Hee Cheon and Younho Lee. 2021. Over 100x faster bootstrapping in fully homomorphic encryption through memory-centric optimization with GPUs. IACR Transactions on Cryptographic Hardware and Embedded Systems (2021) 114\u2013148.","DOI":"10.46586\/tches.v2021.i4.114-148"},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"crossref","unstructured":"Wonkyung Jung Eojin Lee Sangpyo Kim Jongmin Kim Namhoon Kim Keewoo Lee Chohong Min Jung\u00a0Hee Cheon and Jung\u00a0Ho Ahn. 2021. Accelerating fully homomorphic encryption through architecture-centric analysis and optimization. IEEE Access 9 (2021) 98772\u201398789.","DOI":"10.1109\/ACCESS.2021.3096189"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-95312-6_6"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589053"},{"key":"e_1_3_3_1_27_2","unstructured":"Jongmin Kim Gwangho Lee Sangpyo Kim Gina Sohn John Kim Minsoo Rhu and Jung\u00a0Ho Ahn. 2022. ARK: Fully Homomorphic Encryption Accelerator with Runtime Data Generation and Inter-Operation Key Reuse. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2205.00922 (2022)."},{"key":"e_1_3_3_1_28_2","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO56248.2022.00086"},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-38551-3_3"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC50251.2020.00033"},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527415"},{"key":"e_1_3_3_1_32_2","first-page":"12403","volume-title":"International Conference on Machine Learning","author":"Lee Eunsang","year":"2022","unstructured":"Eunsang Lee, Joon-Woo Lee, Junghyun Lee, Young-Sik Kim, Yongjune Kim, Jong-Seon No, and Woosuk Choi. 2022. Low-complexity deep convolutional neural networks on fully homomorphic encryption using multiplexed parallel convolutions. In International Conference on Machine Learning. PMLR, 12403\u201312422."},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"crossref","unstructured":"Joon-Woo Lee HyungChul Kang Yongwoo Lee Woosuk Choi Jieun Eom Maxim Deryabin Eunsang Lee Junghyun Lee Donghoon Yoo Young-Sik Kim et\u00a0al. 2022. Privacy-preserving machine learning with fully homomorphic encryption for deep neural network. iEEE Access 10 (2022) 30039\u201330054.","DOI":"10.1109\/ACCESS.2022.3159694"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"crossref","unstructured":"Xinxin Mei and Xiaowen Chu. 2016. Dissecting GPU memory hierarchy through microbenchmarking. IEEE Transactions on Parallel and Distributed Systems 28 1 (2016) 72\u201386.","DOI":"10.1109\/TPDS.2016.2549523"},{"key":"e_1_3_3_1_35_2","first-page":"64","volume-title":"Proceedings of the 8th Workshop on Encrypted Computing and Applied Homomorphic Cryptography","author":"Mouchet Christian\u00a0Vincent","year":"2020","unstructured":"Christian\u00a0Vincent Mouchet, Jean-Philippe Bossuat, Juan\u00a0Ram\u00f3n Troncoso-Pastoriza, and Jean-Pierre Hubaux. 2020. Lattigo: A multiparty homomorphic encryption library in go. In Proceedings of the 8th Workshop on Encrypted Computing and Applied Homomorphic Cryptography. 64\u201370."},{"key":"e_1_3_3_1_36_2","volume-title":"NVIDIA A100 Tensor Core GPU Architecture","author":"Corporation NVIDIA","year":"2020","unstructured":"NVIDIA Corporation. 2020. NVIDIA A100 Tensor Core GPU Architecture. Technical Report. NVIDIA. https:\/\/images.nvidia.cn\/aem-dam\/en-zz\/Solutions\/data-center\/nvidia-ampere-architecture-whitepaper.pdf"},{"key":"e_1_3_3_1_37_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-78086-9_4"},{"key":"e_1_3_3_1_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/3373376.3378523"},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"crossref","unstructured":"Sujoy\u00a0Sinha Roy Kimmo J\u00e4rvinen Jo Vliegen Frederik Vercauteren and Ingrid Verbauwhede. 2018. HEPCloud: An FPGA-based multicore processor for FV somewhat homomorphic function evaluation. IEEE Trans. Comput. 67 11 (2018) 1637\u20131650.","DOI":"10.1109\/TC.2018.2816640"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"crossref","first-page":"387","DOI":"10.1109\/HPCA.2019.00052","volume-title":"2019 IEEE International symposium on high performance computer architecture (HPCA)","author":"Roy Sujoy\u00a0Sinha","year":"2019","unstructured":"Sujoy\u00a0Sinha Roy, Furkan Turan, Kimmo Jarvinen, Frederik Vercauteren, and Ingrid Verbauwhede. 2019. FPGA-based high-performance parallel architecture for homomorphic computing on encrypted data. In 2019 IEEE International symposium on high performance computer architecture (HPCA). IEEE, 387\u2013398."},{"key":"e_1_3_3_1_41_2","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527393"},{"key":"e_1_3_3_1_42_2","doi-asserted-by":"crossref","unstructured":"Amanpreet\u00a0Kaur Sandhu. 2021. Big data with cloud computing: Discussions and challenges. Big Data Mining and Analytics 5 1 (2021) 32\u201340.","DOI":"10.26599\/BDMA.2021.9020016"},{"key":"e_1_3_3_1_43_2","doi-asserted-by":"crossref","unstructured":"Chao Su and Qingkai Zeng. 2021. Survey of CPU Cache-Based Side-Channel Attacks: Systematic Analysis Security Models and Countermeasures. Security and Communication Networks 2021 1 (2021) 5559552.","DOI":"10.1155\/2021\/5559552"},{"key":"e_1_3_3_1_44_2","doi-asserted-by":"crossref","unstructured":"Yunxuan Su Xu\u00a0An Wang Weidong Du Yu Ge Kaiyang Zhao and Ming Lv. 2023. A secure data fitting scheme based on CKKS homomorphic encryption for medical IoT. Journal of High Speed Networks 29 1 (2023) 41\u201356.","DOI":"10.3233\/JHS-222016"},{"key":"e_1_3_3_1_45_2","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC.2012.6408660"},{"key":"e_1_3_3_1_46_2","doi-asserted-by":"crossref","unstructured":"Zhiwei Wang Peinan Li Rui Hou Zhihao Li Jiangfeng Cao XiaoFeng Wang and Dan Meng. 2023. HE-Booster: an efficient polynomial arithmetic acceleration on GPUs for fully homomorphic encryption. IEEE Transactions on Parallel and Distributed Systems 34 4 (2023) 1067\u20131081.","DOI":"10.1109\/TPDS.2022.3228628"},{"key":"e_1_3_3_1_47_2","doi-asserted-by":"crossref","unstructured":"Chaowei Yang Qunying Huang Zhenlong Li Kai Liu and Fei Hu. 2017. Big Data and cloud computing: innovation opportunities and challenges. International Journal of Digital Earth 10 1 (2017) 13\u201353.","DOI":"10.1080\/17538947.2016.1239771"},{"key":"e_1_3_3_1_48_2","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10070984"},{"key":"e_1_3_3_1_49_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS53621.2022.00074"},{"key":"e_1_3_3_1_50_2","unstructured":"Ali \u015eah \u00d6zcan and Erkay Sava\u015f. 2024. HEonGPU: a GPU-based Fully Homomorphic Encryption Library 1.0. Cryptology ePrint Archive Paper 2024\/1543. https:\/\/eprint.iacr.org\/2024\/1543"}],"event":{"name":"ISCA '25: Proceedings of the 52nd Annual International Symposium on Computer Architecture","location":"Tokyo Japan","acronym":"SIGARCH '25","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture"]},"container-title":["Proceedings of the 52nd Annual International Symposium on Computer Architecture"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3695053.3731408","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,21]],"date-time":"2025-06-21T11:07:00Z","timestamp":1750504020000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3695053.3731408"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,20]]},"references-count":49,"alternative-id":["10.1145\/3695053.3731408","10.1145\/3695053"],"URL":"https:\/\/doi.org\/10.1145\/3695053.3731408","relation":{},"subject":[],"published":{"date-parts":[[2025,6,20]]},"assertion":[{"value":"2025-06-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}