{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T08:03:02Z","timestamp":1776931382679,"version":"3.51.2"},"publisher-location":"New York, NY, USA","reference-count":38,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T00:00:00Z","timestamp":1763164800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/100006228","name":"Oak Ridge National Laboratory","doi-asserted-by":"publisher","award":["MAGNET: MAthematics, ComputinG, and NETworking for Resource-Efficient Computational Science"],"award-info":[{"award-number":["MAGNET: MAthematics, ComputinG, and NETworking for Resource-Efficient Computational Science"]}],"id":[{"id":"10.13039\/100006228","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000028","name":"Semiconductor Research Corporation","doi-asserted-by":"publisher","award":["JUMP 2.0 PRISM"],"award-info":[{"award-number":["JUMP 2.0 PRISM"]}],"id":[{"id":"10.13039\/100000028","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,11,16]]},"DOI":"10.1145\/3731599.3767530","type":"proceedings-article","created":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T16:18:44Z","timestamp":1762532324000},"page":"1684-1693","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["A RISC-V Vector Extension for Multi-word Arithmetic"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-8246-7802","authenticated-orcid":false,"given":"Yunhao","family":"Lan","sequence":"first","affiliation":[{"name":"Carnegie Mellon University, Pittsburgh, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-7749-6196","authenticated-orcid":false,"given":"Larry","family":"Tang","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, Pittsburgh, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-0190-4041","authenticated-orcid":false,"given":"Naifeng","family":"Zhang","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, Pittsburgh, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-9621-6689","authenticated-orcid":false,"given":"Youngjin","family":"Eum","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, Pittsburgh, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9302-5287","authenticated-orcid":false,"given":"James","family":"Hoe","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, Pittsburgh, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3529-8973","authenticated-orcid":false,"given":"Franz","family":"Franchetti","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University, Pittsburgh, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,11,15]]},"reference":[{"key":"e_1_3_3_1_2_2","unstructured":"2021. RISC-V \u201cV\u201d Vector Extension. GitHub https:\/\/github.com\/riscv\/riscv-v-spec\/releases\/download\/v1.0\/riscv-v-spec-1.0.pdf."},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10070953"},{"key":"e_1_3_3_1_4_2","first-page":"327","volume-title":"Proceedings of the 25th USENIX Security Symposium (USENIX Security \u201916)","author":"Alkim Erdem","year":"2016","unstructured":"Erdem Alkim, L\u00e9o Ducas, Thomas P\u00f6ppelmann, and Peter Schwabe. 2016. Post\u2011Quantum Key Exchange\u2014A New Hope. In Proceedings of the 25th USENIX Security Symposium (USENIX Security \u201916). 327\u2013343."},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/1465482.1465560"},{"key":"e_1_3_3_1_6_2","volume-title":"Introducing SVE2","author":"Limited Arm","year":"2023","unstructured":"Arm Limited. 2023. Introducing SVE2. Arm Limited. https:\/\/developer.arm.com\/documentation\/102340\/0100\/Introducing-SVE2 Arm Developer Documentation, DDMS 102340\/0100."},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","unstructured":"Zahra Azad Guowei Yang Rashmi Agrawal Daniel Petrisko Michael Taylor and Ajay Joshi. 2023. RISE: RISC\u2013V SoC for En\/Decryption Acceleration on the Edge for Homomorphic Encryption. IEEE Transactions on Very Large Scale Integration (VLSI) Systems 31 10 (Oct 2023) 1523\u20131536. 10.1109\/TVLSI.2023.3288754","DOI":"10.1109\/TVLSI.2023.3288754"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"publisher","DOI":"10.1109\/ARITH51176.2021.00028"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","DOI":"10.1145\/3649329.3657347"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"publisher","unstructured":"J.\u00a0W. Cooley and J.\u00a0W. Tukey. 1965. An Algorithm for the Machine Calculation of Complex Fourier Series. Math. Comp. 19 90 (1965) 297\u2013301. 10.2307\/2003354","DOI":"10.2307\/2003354"},{"key":"e_1_3_3_1_11_2","volume-title":"Tech. Rep., Carnegie Mellon University","author":"Eum Youngjin","year":"2023","unstructured":"Youngjin Eum, Naifeng Zhang, Larry Tang, and Franz Franchetti. 2023. Towards a RISC-V Instruction Set Extension for Multi-word Arithmetic. In Tech. Rep., Carnegie Mellon University."},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"publisher","unstructured":"F. Franchetti T.\u00a0M. Low D.\u00a0T. Popovici R.\u00a0M. Veras D.\u00a0G. Spampinato J.\u00a0R. Johnson M. P\u00fcschel J.\u00a0C. Hoe and J.\u00a0M.\u00a0F. Moura. 2018. SPIRAL: Extreme Performance Portability. Proc. IEEE 106 11 (Nov. 2018) 1935\u20131968. 10.1109\/JPROC.2018.2873289","DOI":"10.1109\/JPROC.2018.2873289"},{"key":"e_1_3_3_1_13_2","first-page":"1","volume-title":"Proc. ACM Int. Conference on Parallel Architectures and Compilation Techniques (PACT)","author":"Fu Sophia","year":"2024","unstructured":"Sophia Fu, Naifeng Zhang, and Franz Franchetti. 2024. Accelerating High-Precision Number Theoretic Transforms using Intel AVX-512. In Proc. ACM Int. Conference on Parallel Architectures and Compilation Techniques (PACT). 1\u201310."},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"publisher","DOI":"10.1109\/ARITH.2001.930115"},{"key":"e_1_3_3_1_15_2","unstructured":"Karthik Inbasekar Yuval Shekel and Michael Asa. 2024. ICICLE v2: Polynomial API for Coding ZK Provers to Run on Specialized Hardware. Cryptology ePrint Archive (2024)."},{"key":"e_1_3_3_1_16_2","volume-title":"Intel Architecture Instruction Set Extensions Programming Reference","author":"Corporation Intel","year":"2013","unstructured":"Intel Corporation. 2013. Intel Architecture Instruction Set Extensions Programming Reference. Intel Corporation. https:\/\/web.archive.org\/web\/20130929035331http:\/\/download-software.intel.com\/sites\/default\/files\/319433-015.pdf Archived at web.archive.org."},{"key":"e_1_3_3_1_17_2","volume-title":"Intel 64 and IA-32 Architectures Software Developer\u2019s Manual, Volume 2A: Instruction Set Reference, A\u2013M","author":"Corporation Intel","year":"2022","unstructured":"Intel Corporation. 2022. Intel 64 and IA-32 Architectures Software Developer\u2019s Manual, Volume 2A: Instruction Set Reference, A\u2013M. Intel Corporation, Santa Clara, CA, USA. https:\/\/www.intel.com\/content\/www\/us\/en\/developer\/articles\/technical\/intel-sdm.html Includes the full AVX-512 instruction set."},{"key":"e_1_3_3_1_18_2","unstructured":"Sangpyo Kim Wonkyung Jung Jaiyoung Park and Jung\u00a0Ho Ahn. 2020. Accelerating Number Theoretic Transformations for Bootstrappable Homomorphic Encryption on GPUs. IACR Cryptology ePrint Archive 2020 1198 (2020)."},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"publisher","DOI":"10.1109\/CISCE52179.2021.9445982"},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"publisher","DOI":"10.1145\/3489517.3530552"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"crossref","unstructured":"Chiara Marcolla Victor Sucasas Marc Manzano Riccardo Bassoli Frank H.\u00a0P. Fitzek and Najwa Aaraj. 2022. Survey on Fully Homomorphic Encryption Theory and Applications. IACR Cryptology ePrint Archive Paper 2022\/1602. https:\/\/eprint.iacr.org\/2022\/1602.pdf","DOI":"10.36227\/techrxiv.19315202.v4"},{"key":"e_1_3_3_1_22_2","unstructured":"Konstantina Miteloudi Joppe Bos Olivier Bronchain Bj\u00f6rn Fay and Joost Renes. 2023. PQ.V.ALU.E: Post-Quantum RISC-V Custom ALU Extensions on Dilithium and Kyber. Cryptology ePrint Archive Paper 2023\/1505. https:\/\/eprint.iacr.org\/2023\/1505"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISCAS46773.2023.10181714"},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"publisher","unstructured":"Rog\u00e9rio Paludo and Leonel Sousa. 2022. NTT Architecture for a Linux-Ready RISC-V Fully-Homomorphic Encryption Accelerator. IEEE Transactions on Circuits and Systems I: Regular Papers 69 7 (July 2022) 2669\u20132682. 10.1109\/TCSI.2022.3166550","DOI":"10.1109\/TCSI.2022.3166550"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"publisher","DOI":"10.1145\/3466752.3480070"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527393"},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"publisher","DOI":"10.5555\/800048.801719"},{"key":"e_1_3_3_1_28_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS57527.2023.00034"},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"publisher","unstructured":"Zhuoyu Tian Lei Chen Shengyu Fan Xianglong Deng Rui Hou Dan Meng and Mingzhe Zhang. 2025. LP\u2011HENN: Fully Homomorphic Encryption Accelerator with High Energy Efficiency. Cybersecurity 8 1 (2025) 98. 10.1186\/s42400-025-00360-x","DOI":"10.1186\/s42400-025-00360-x"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCAD57390.2023.10323744"},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC58863.2023.10363559"},{"key":"e_1_3_3_1_32_2","volume-title":"Proceedings of the IEEE\/ACM International Symposium on Code Generation and Optimization (CGO)","author":"Zhang Naifeng","year":"2023","unstructured":"Naifeng Zhang and Franz Franchetti. 2023. Generating Number Theoretic Transforms for Multi-Word Integer Data Types. In Proceedings of the IEEE\/ACM International Symposium on Code Generation and Optimization (CGO)."},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"publisher","DOI":"10.1145\/3696443.3708948"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"crossref","unstructured":"Naifeng Zhang Sophia Fu and Franz Franchetti. 2025. Towards Closing the Performance Gap for Cryptographic Kernels Between CPUs and Specialized Hardware. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2509.12494 (2025).","DOI":"10.1145\/3725843.3756120"},{"key":"e_1_3_3_1_35_2","first-page":"1","volume-title":"Proc. IEEE High Performance Extreme Computing Conference (HPEC)","author":"Zhang Naifeng","year":"2022","unstructured":"Naifeng Zhang, Homer Gamil, Patrick Brinich, Benedict Reynwar, Ahmad\u00a0Al Badawi, Negar Neda, Deepraj Soni, Kellie Canida, Yuriy Polyakov, Patrick Broderick, Michail Maniatakos, Andrew Schmidt, Mike Franusich, Jeremy Johnson, Brandon Reagen, David\u00a0Bruce Cousins, and Franz Franchetti. 2022. Towards Full-Stack Acceleration for Fully Homomorphic Encryption. In Proc. IEEE High Performance Extreme Computing Conference (HPEC). 1\u20138."},{"key":"e_1_3_3_1_36_2","unstructured":"J. Zhao D. Grubb M. Rusch T. Wei K. Anderson B. Nikoli\u0107 and K. Asanovi\u0107. 2024. Instruction Scheduling in the Saturn Vector Unit. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2412.00997 (Dec. 2024). Available: https:\/\/arxiv.org\/abs\/2412.00997."},{"key":"e_1_3_3_1_37_2","volume-title":"The Saturn Microarchitecture Manual","author":"Zhao Jerry","year":"2024","unstructured":"Jerry Zhao, Daniel Grubb, Miles Rusch, Tianrui Wei, Kevin Anderson, Borivoje Nikoli\u0107, and Krste Asanovi\u0107. 2024. The Saturn Microarchitecture Manual. Technical Report UCB\/EECS-2024-215. EECS Department, University of California, Berkeley. [Online]. Available: http:\/\/www2.eecs.berkeley.edu\/Pubs\/TechRpts\/2024\/EECS-2024-215.html."},{"key":"e_1_3_3_1_38_2","volume-title":"GPU Technology Conference","author":"Zhao Kaiyong","year":"2009","unstructured":"Kaiyong Zhao. 2009. Implementation of multiple-precision modular multiplication on GPU. In GPU Technology Conference."},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.1109\/CIT.2010.211"}],"event":{"name":"SC Workshops '25: Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis","location":"St Louis MO USA","acronym":"SC Workshops '25","sponsor":["SIGHPC ACM Special Interest Group on High Performance Computing, Special Interest Group on High Performance Computing"]},"container-title":["Proceedings of the SC '25 Workshops of the International Conference for High Performance Computing, Networking, Storage and Analysis"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/abs\/10.1145\/3731599.3767530","content-type":"text\/html","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3731599.3767530","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3731599.3767530","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,9]],"date-time":"2026-01-09T19:32:10Z","timestamp":1767987130000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3731599.3767530"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,15]]},"references-count":38,"alternative-id":["10.1145\/3731599.3767530","10.1145\/3731599"],"URL":"https:\/\/doi.org\/10.1145\/3731599.3767530","relation":{},"subject":[],"published":{"date-parts":[[2025,11,15]]},"assertion":[{"value":"2025-11-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}