{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,12]],"date-time":"2026-03-12T01:10:19Z","timestamp":1773277819638,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":64,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,3,30]],"date-time":"2025-03-30T00:00:00Z","timestamp":1743292800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,3,30]]},"DOI":"10.1145\/3676641.3716246","type":"proceedings-article","created":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T16:47:32Z","timestamp":1743094052000},"page":"16-31","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["Affinity-based Optimizations for TFHE on Processing-in-DRAM"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4621-2434","authenticated-orcid":false,"given":"Kevin","family":"Nam","sequence":"first","affiliation":[{"name":"Dept. of ECE &amp; ISRC, Seoul National University, Seoul, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-0612-9085","authenticated-orcid":false,"given":"Heonhui","family":"Jung","sequence":"additional","affiliation":[{"name":"Dept. of ECE &amp; ISRC, Seoul National University, Seoul, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5123-4921","authenticated-orcid":false,"given":"Hyunyoung","family":"Oh","sequence":"additional","affiliation":[{"name":"Department of AI\u2022Software, Gachon University, Seongnam, Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6412-2926","authenticated-orcid":false,"given":"Yunheung","family":"Paek","sequence":"additional","affiliation":[{"name":"Dept. of ECE &amp; ISRC, Seoul National University, Seoul, Republic of Korea"}]}],"member":"320","published-online":{"date-parts":[[2025,3,30]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO50266.2020.00040"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA52012.2021.00013"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC42613.2021.9365862"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2022.3164651"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/HOTCHIPS.2019.8875680"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/1536414.1536440"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/3123939.3123977"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/2508834.2513149"},{"key":"e_1_3_2_1_9_1","volume-title":"Tfhe: Fast fully homomorphic encryption over the torus","author":"Chillotti Ilaria","year":"2018","unstructured":"Ilaria Chillotti, Nicolas Gama, Mariya Georigieva, and Malika Izabachene. Tfhe: Fast fully homomorphic encryption over the torus. 2018. https:\/\/ia.cr\/2018\/421."},{"key":"e_1_3_2_1_10_1","unstructured":"XILINX Inc. Alveo u280 data center accelerator card. https:\/\/www.xilinx.com\/products\/boards-and-kits\/alveo\/u280.html."},{"key":"e_1_3_2_1_11_1","volume-title":"Annual Conference on Neural Information Processing Systems","author":"Lou Qian","year":"2019","unstructured":"Qian Lou and Lei Jiang. She: A fast and accurate deep neural network for encrypted data. In Annual Conference on Neural Information Processing Systems, 2019."},{"key":"e_1_3_2_1_12_1","first-page":"4490","volume-title":"International conference on machine learning","author":"Sanyal Amartya","year":"2018","unstructured":"Amartya Sanyal, Matt J. Kusner, Adria Gascon, and Varun Kanade. Tapas: Tricks to accelerate (encrypted) prediction as a service. In International conference on machine learning, pages 4490--4499. PMLR, 2018."},{"key":"e_1_3_2_1_13_1","volume-title":"USA","author":"Bourse Florian","year":"2018","unstructured":"Florian Bourse, Michele Minelli, Matthias Minihold, and Pascal Paillier. Fast homomorphic evaluation of deep discretized neural networks. In Advances in Cryptology-CRYPTO 2018: 38th Annual International Cryptology Conference, Santa Barbara, CA, USA, August 19-23, 2018, Proceedings, Part III 38, pages 483--512. Springer, 2018."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-021-05970-3"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/MCI.2022.3180883"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-78086-9_1"},{"key":"e_1_3_2_1_17_1","volume-title":"Yurii Sushko, and Bryant Gipson. A general purpose transpiler for fully homomorphic encryption. Cryptology ePrint Archive, Paper 2021\/811","author":"Gorantala Shruthi","year":"2021","unstructured":"Shruthi Gorantala, Rob Springer, Sean Purser-Haskell, William Lam, Royce Wilson, Asra Ali, Eric P. Astor, Itai Zukerman, Sam Ruth, Christoph Dibak, Phillipp Schoppmann, Sasha Kulankhina, Alain Forget, David Marn, Cameron Tew, Rafael Misoczki, Bernat Guillen, Xinyu Ye, Dennis Kraft, Damien Desfontaines, Aishe Krishnamurthy, Miguel Guevara, Irippuge Milinda Perera, Yurii Sushko, and Bryant Gipson. A general purpose transpiler for fully homomorphic encryption. Cryptology ePrint Archive, Paper 2021\/811, 2021. https: \/\/eprint.iacr.org\/2021\/811."},{"key":"e_1_3_2_1_18_1","volume-title":"TFHE-rs: A Pure Rust Implementation of the TFHE Scheme for Boolean and Integer Arithmetics Over Encrypted Data","year":"2022","unstructured":"Zama. TFHE-rs: A Pure Rust Implementation of the TFHE Scheme for Boolean and Integer Arithmetics Over Encrypted Data, 2022. https: \/\/github.com\/zama-ai\/tfhe-rs."},{"key":"e_1_3_2_1_19_1","volume-title":"August","author":"Chillotti Ilaria","year":"2016","unstructured":"Ilaria Chillotti, Nicolas Gama, Mariya Georgieva, and Malika Izabach. TFHE: Fast fully homomorphic encryption library, August 2016. https:\/\/tfhe.github.io\/tfhe."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2004.840301"},{"key":"e_1_3_2_1_21_1","unstructured":"A gpu implementation of fully homomorphic encryption on torus. https:\/\/github.com\/nucypher\/nufhe."},{"key":"e_1_3_2_1_22_1","volume-title":"CUDA-accelerated fully homomorphic encryption library. https:\/\/github.com\/vernamlab\/cuFHE","author":"Dai W.","year":"2018","unstructured":"W. Dai. CUDA-accelerated fully homomorphic encryption library. https:\/\/github.com\/vernamlab\/cuFHE, 2018."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3508352.3549413"},{"key":"e_1_3_2_1_24_1","unstructured":"Jung Hee Cheon Andrey Kim Miran Kim and Yongsoo Song. Homomorphic encryption for arithmetic of approximate numbers. Cryptology ePrint Archive Report 2016\/421 2016. https:\/\/ia.cr\/2016\/421."},{"key":"e_1_3_2_1_25_1","unstructured":"J. Fan and F. Vercauteren. Somewhat practical fully homomorphic encryption. Cryptology ePrint Archive Report 2012\/144 2012. https: \/\/ia.cr\/2012\/144."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3569955"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-77287-1_2"},{"key":"e_1_3_2_1_28_1","volume-title":"Paper 2015\/046","author":"Albrecht Martin R.","year":"2015","unstructured":"Martin R. Albrecht, Rachel Player, and Sam Scott. On the concrete hardness of learning with errors. Cryptology ePrint Archive, Paper 2015\/046, 2015. https:\/\/eprint.iacr.org\/2015\/046."},{"key":"e_1_3_2_1_29_1","volume-title":"Matcha: A fast and energye cient accelerator for fully homomorphic encryption over the torus. arXiv preprint arXiv:2202.08814","author":"Jiang Lei","year":"2022","unstructured":"Lei Jiang, Qian Lou, and Nrushad Joshi. Matcha: A fast and energye cient accelerator for fully homomorphic encryption over the torus. arXiv preprint arXiv:2202.08814, 2022."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/3576915.3623159"},{"key":"e_1_3_2_1_31_1","unstructured":"High bandwidth memory (hbm) dram 2021."},{"key":"e_1_3_2_1_32_1","unstructured":"XILINX Inc. Axi high bandwidth memory controller logicore ip product guide. https:\/\/docs.amd.com\/r\/en-US\/pg276-axi-hbm\/Introduction."},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2867655"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-07689-3_1"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2867655"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVLSI.2024.3353374"},{"key":"e_1_3_2_1_37_1","unstructured":"Jason Lowe-Power Abdul Mutaal Ahmad Ayaz Akram Mohammad Alian Rico Amslinger Matteo Andreozzi Adri\u00e0 Armejach Nils Asmussen Brad Beckmann Srikant Bharadwaj Gabe Black Gedare Bloom Bobby R. Bruce Daniel Rodrigues Carvalho Jeronimo Castrillon Lizhong Chen Nicolas Derumigny Stephan Diestelhorst Wendy Elsasser Carlos Escuin Marjan Fariborz Amin Farmahini-Farahani Pouya Fotouhi Ryan Gambord Jayneel Gandhi Dibakar Gope Thomas Grass Anthony Gutierrez Bagus Hanindhito Andreas Hansson Swapnil Haria Austin Harris Timothy Hayes Adrian Herrera Matthew Horsnell Syed Ali Raza Jafri Radhika Jagtap Hanhwi Jang Reiley Jeyapaul Timothy M. Jones Matthias Jung Subash Kannoth Hamidreza Khaleghzadeh Yuetsu Kodama Tushar Krishna Tommaso Marinelli Christian Menard Andrea Mondelli Miquel Moreto Tiago M\u00fcck Omar Naji Krishnendra Nathella Hoa Nguyen Nikos Nikoleris Lena E. Olson Marc Orr Binh Pham Pablo Prieto Trivikram Reddy Alec Roelke Mahyar Samani Andreas Sandberg Javier Setoain Boris Shingarov Matthew D. Sinclair Tuan Ta Rahul Thakur Giacomo Travaglini Michael Upton Nilay Vaish Ilias Vougioukas William Wang Zhengrong Wang Norbert Wehn Christian Weis David A. Wood Hongil Yoon and \u00c9der F. Zulian. The gem5 simulator: Version 20.0. arXiv preprint arXiv:2007.03152 2020."},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC55821.2022.9926381"},{"key":"e_1_3_2_1_39_1","volume-title":"Proceedings of the 2022 ACM\/SIGDA International Symposium on Field-Programmable Gate Arrays.","author":"Kang Shinhaeng","unstructured":"Shinhaeng Kang, Sukhan Lee, Byeongho Kim, Hweesoo Kim, Kyomin Sohn, Nam Sung Kim, and Eojin Lee. An fpga-based rnn-t inference accelerator with pim-hbm. In Proceedings of the 2022 ACM\/SIGDA International Symposium on Field-Programmable Gate Arrays."},{"key":"e_1_3_2_1_40_1","unstructured":"SYNOPSYS Inc. Synopsys design cimpiler. https:\/\/www.synopsys.com\/implementation-and-signoff\/rtl-synthesis-test\/dc-ultra.html."},{"key":"e_1_3_2_1_41_1","first-page":"30","article-title":"Vivado design suite","volume":"5","author":"Feist T.","year":"2012","unstructured":"T. Feist. Vivado design suite. White Paper, 5:30, 2012.","journal-title":"White Paper"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/LCA.2020.2973991"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/DAC56929.2023.10247747"},{"key":"e_1_3_2_1_44_1","volume-title":"Dramaton: A near-dram accelerator for large number theoretic transforms","author":"Park Yongmo","year":"2024","unstructured":"Yongmo Park, Subhankar Pal, Aporva Amarnath, Karthik Swaminathan, Wei D Lu, Alper Buyuktosunoglu, and Pradip Bose. Dramaton: A near-dram accelerator for large number theoretic transforms. IEEE Computer Architecture Letters, 2024."},{"key":"e_1_3_2_1_45_1","unstructured":"Austin Hartshorn Humberto Leon Noel Qiao and Scott Weber. Number theoretic transform (ntt) fpga accelerator. Worcester Polytech. Inst. Worcester MA USA Tech. Rep. E-project-051420--162339 pages 1--37 2020."},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2018.00062"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA47549.2020.00033"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.3390\/jlpea10040030"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-9260(99)00006-1"},{"key":"e_1_3_2_1_50_1","volume-title":"Intel Vtune Profiler","author":"Intel Inc.","year":"2023","unstructured":"Intel Inc. Intel Vtune Profiler, 2023. https:\/\/www.intel.com\/content\/www\/us\/en\/develop\/documentation\/vtune-help\/top.html\/."},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1109\/PACT58117.2023.00018"},{"key":"e_1_3_2_1_52_1","volume-title":"Algebra","author":"Herstein IN","year":"1964","unstructured":"IN Herstein. Topics. Algebra. Waltham: Blaisdell Publishing Company, 1964."},{"key":"e_1_3_2_1_53_1","first-page":"1","volume-title":"Nektarios Georgios Tsoutsos. REDsec: Running Encrypted Discretized Neural Networks in Seconds. In Network and Distributed System Security Symposium (NDSS)","author":"Folkerts Lars","year":"2023","unstructured":"Lars Folkerts, Charles Gouert, and Nektarios Georgios Tsoutsos. REDsec: Running Encrypted Discretized Neural Networks in Seconds. In Network and Distributed System Security Symposium (NDSS), pages 1--17, 2023."},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-52426-4_10"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1145\/3605759.3625260"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1145\/3296957.3173171"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1109\/DAC18072.2020.9218730"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVLSI.2022.3151321"},{"key":"e_1_3_2_1_59_1","volume-title":"Strix: An end-to-end streaming architecture with two-level ciphertext batching for fully homomorphic encryption with programmable bootstrapping. arXiv preprint arXiv:2305.11423","author":"Putra Adiwena","year":"2023","unstructured":"Adiwena Putra, Prasetiyo, Yi Chen, John Kim, and Joo-Young Kim. Strix: An end-to-end streaming architecture with two-level ciphertext batching for fully homomorphic encryption with programmable bootstrapping. arXiv preprint arXiv:2305.11423, 2023."},{"key":"e_1_3_2_1_60_1","first-page":"249","volume-title":"2024 IEEE International Symposium on High-Performance Computer Architecture (HPCA)","author":"Putra A.","year":"2024","unstructured":"Prasetiyo, A. Putra, and J. Kim. Morphling: A throughput-maximized tfhe-based accelerator using transform-domain reuse. In 2024 IEEE International Symposium on High-Performance Computer Architecture (HPCA), pages 249--262. IEEE, 2024."},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"publisher","DOI":"10.1145\/3385412.3386023"},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.1145\/3314221.3314628"},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"publisher","DOI":"10.1145\/3613424.3614279"},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1145\/3613424.3614302"}],"event":{"name":"ASPLOS '25: 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems","location":"Rotterdam Netherlands","acronym":"ASPLOS '25","sponsor":["SIGPLAN ACM Special Interest Group on Programming Languages","SIGOPS ACM Special Interest Group on Operating Systems","SIGARCH ACM Special Interest Group on Computer Architecture"]},"container-title":["Proceedings of the 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 2"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3676641.3716246","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3676641.3716246","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T11:08:26Z","timestamp":1755774506000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3676641.3716246"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,30]]},"references-count":64,"alternative-id":["10.1145\/3676641.3716246","10.1145\/3676641"],"URL":"https:\/\/doi.org\/10.1145\/3676641.3716246","relation":{},"subject":[],"published":{"date-parts":[[2025,3,30]]},"assertion":[{"value":"2025-03-30","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}