{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,2]],"date-time":"2025-10-02T00:47:22Z","timestamp":1759366042129,"version":"build-2065373602"},"publisher-location":"New York, NY, USA","reference-count":126,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,10,13]]},"DOI":"10.1145\/3731569.3764800","type":"proceedings-article","created":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T12:43:24Z","timestamp":1759322604000},"page":"1062-1081","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["How to Copy Memory? Coordinated Asynchronous Copy as a First-Class OS Service"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-9024-7588","authenticated-orcid":false,"given":"Jingkai","family":"He","sequence":"first","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-5434-0435","authenticated-orcid":false,"given":"Yunpeng","family":"Dong","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7945-8430","authenticated-orcid":false,"given":"Dong","family":"Du","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-2655-2911","authenticated-orcid":false,"given":"Mo","family":"Zou","sequence":"additional","affiliation":[{"name":"Huawei Technologies, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9893-6939","authenticated-orcid":false,"given":"Zhitai","family":"Yu","sequence":"additional","affiliation":[{"name":"Huawei Technologies, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2678-9225","authenticated-orcid":false,"given":"Yuxin","family":"Ren","sequence":"additional","affiliation":[{"name":"Huawei Technologies, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-8246-4713","authenticated-orcid":false,"given":"Ning","family":"Jia","sequence":"additional","affiliation":[{"name":"Huawei Technologies, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6558-5298","authenticated-orcid":false,"given":"Yubin","family":"Xia","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9720-0361","authenticated-orcid":false,"given":"Haibo","family":"Chen","sequence":"additional","affiliation":[{"name":"Shanghai JiaoTong University, Shanghai, China"}]}],"member":"320","published-online":{"date-parts":[[2025,10,12]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.5555\/3585938.3585961"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/3694715.3695946"},{"key":"e_1_3_2_1_3_1","volume-title":"CBMM: Financial Advice for Kernel Memory Managers. In 2022 USENIX Annual Technical Conference (USENIX ATC 22)","author":"Mansi Mark","unstructured":"Mark Mansi, Bijan Tabatabai, and Michael M. Swift. 2022. CBMM: Financial Advice for Kernel Memory Managers. In 2022 USENIX Annual Technical Conference (USENIX ATC 22). USENIX Association, Carlsbad, CA, 593\u2013608. https:\/\/www.usenix.org\/conference\/atc22\/presentation\/mansi"},{"key":"e_1_3_2_1_4_1","volume-title":"Microkernel Goes General: Performance and Compatibility in the HongMeng Production Microkernel. In 18th USENIX Symposium on Operating Systems Design and Implementation (OSDI 24)","author":"Chen Haibo","year":"2024","unstructured":"Haibo Chen, Xie Miao, Ning Jia, Nan Wang, Yu Li, Nian Liu, Yutao Liu, Fei Wang, Qiang Huang, Kun Li, Hongyang Yang, Hui Wang, Jie Yin, Yu Peng, and Fengwei Xu. 2024. Microkernel Goes General: Performance and Compatibility in the HongMeng Production Microkernel. In 18th USENIX Symposium on Operating Systems Design and Implementation (OSDI 24). USENIX Association, Santa Clara, CA, 465\u2013485. https:\/\/www.usenix.org\/conference\/osdi24\/presentation\/chen-haibo"},{"key":"e_1_3_2_1_5_1","volume-title":"15th USENIX Symposium on Operating Systems Design and Implementation (OSDI 21)","author":"Bhardwaj Ankit","year":"2021","unstructured":"Ankit Bhardwaj, Chinmay Kulkarni, Reto Achermann, Irina Calciu, Sanidhya Kashyap, Ryan Stutsman, Amy Tai, and Gerd Zellweger. 2021. NrOS: Effective Replication and Sharing in an Operating System. In 15th USENIX Symposium on Operating Systems Design and Implementation (OSDI 21). USENIX Association, 295\u2013312. https:\/\/www.usenix.org\/conference\/osdi21\/presentation\/bhardwaj"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3132747.3132770"},{"key":"e_1_3_2_1_7_1","volume-title":"16th USENIX Symposium on Operating Systems Design and Implementation (OSDI 22)","author":"Stamler Timothy","year":"2022","unstructured":"Timothy Stamler, Deukyeon Hwang, Amanda Raybuck, Wei Zhang, and Simon Peter. 2022. zIO: Accelerating IO-Intensive Applications with Transparent Zero-Copy IO. In 16th USENIX Symposium on Operating Systems Design and Implementation (OSDI 22). USENIX Association, Carlsbad, CA, 431\u2013445. https:\/\/www.usenix.org\/conference\/osdi22\/presentation\/stamler"},{"key":"e_1_3_2_1_8_1","unstructured":"2025. Redis Documentation. https:\/\/redis.io\/docs\/."},{"key":"e_1_3_2_1_9_1","unstructured":"2024. Tinyproxy: lightweight http(s) proxy daemon. https:\/\/tinyproxy.github.io."},{"key":"e_1_3_2_1_10_1","unstructured":"2024. Nginx. https:\/\/nginx.org\/en\/."},{"key":"e_1_3_2_1_11_1","volume-title":"Proceedings of the 7th Symposium on Operating Systems Design and Implementation","author":"Weil Sage A.","year":"2006","unstructured":"Sage A. Weil, Scott A. Brandt, Ethan L. Miller, Darrell D. E. Long, and Carlos Maltzahn. 2006. Ceph: a scalable, high-performance distributed file system. In Proceedings of the 7th Symposium on Operating Systems Design and Implementation (Seattle, Washington) (OSDI '06). USENIX Association, USA, 307\u2013320. https:\/\/www.usenix.org\/legacy\/events\/osdi06\/tech\/full_papers\/weil\/weil_html\/"},{"key":"e_1_3_2_1_12_1","unstructured":"2024. MongoDB. https:\/\/www.mongodb.com\/."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3452296.3472888"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/3307650.3322218"},{"key":"e_1_3_2_1_15_1","unstructured":"2022. Fast memcpy A System Design. https:\/\/www.sigarch.org\/fast-memcpy-a-system-design\/."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/3037697.3037736"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/2749469.2750392"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589082"},{"key":"e_1_3_2_1_19_1","unstructured":"2018. Avoid barrier_nospec() in 64-bit copy_from_user() (Linux patch). https:\/\/git.kernel.org\/pub\/scm\/linux\/kernel\/git\/torvalds\/linux.git\/commit\/?id=0fc810ae3ae110f9e2fcccce80fc8c8d62f97907."},{"key":"e_1_3_2_1_20_1","unstructured":"2022. AArch64: Add SVE memcpy (glibc patch). https:\/\/sourceware.org\/pipermail\/glibc-cvs\/2024q2\/084846.html."},{"key":"e_1_3_2_1_21_1","unstructured":"2022. Imporve 64bit memcpy performance for Haswell CPU with AVX instruction (glibc patch). https:\/\/sourceware.org\/pipermail\/libc-alpha\/2014-June\/051959.html."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3190508.3190523"},{"key":"e_1_3_2_1_23_1","unstructured":"2025. Intel Advanced Vector Extensions 2 (Intel AVX2). https:\/\/edc.intel.com\/content\/www\/us\/en\/design\/ipla\/software-development-platforms\/client\/platforms\/alder-lake-desktop\/12th-generation-intel-core-processors-datasheet-volume-1-of-2\/002\/intel-advanced-vector-extensions-2-intel-avx2\/."},{"key":"e_1_3_2_1_24_1","unstructured":"2024. MSG_ZEROCOPY Document. https:\/\/www.kernel.org\/doc\/html\/v4.18\/networking\/msg_zerocopy.html."},{"key":"e_1_3_2_1_25_1","unstructured":"Jonathan Corbet. 2020. The rapid growth of io_uring. https:\/\/lwn.net\/Articles\/810414\/."},{"key":"e_1_3_2_1_26_1","volume-title":"Proceedings of the 9th USENIX Conference on Operating Systems Design and Implementation","author":"Soares Livio","year":"2010","unstructured":"Livio Soares and Michael Stumm. 2010. FlexSC: flexible system call scheduling with exception-less system calls. In Proceedings of the 9th USENIX Conference on Operating Systems Design and Implementation (Vancouver, BC, Canada) (OSDI'10). USENIX Association, USA, 33\u201346. https:\/\/www.usenix.org\/conference\/osdi10\/flexsc-flexible-system-call-scheduling-exception-less-system-calls"},{"key":"e_1_3_2_1_27_1","volume-title":"22nd USENIX Conference on File and Storage Technologies (FAST 24)","author":"Cho Kyu-Jin","year":"2024","unstructured":"Kyu-Jin Cho, Jaewon Choi, Hyungjoon Kwon, and Jin-Soo Kim. 2024. RFUSE: Modernizing Userspace Filesystem Framework through Scalable Kernel-Userspace Communication. In 22nd USENIX Conference on File and Storage Technologies (FAST 24). 141\u2013157."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3620665.3640401"},{"key":"e_1_3_2_1_29_1","unstructured":"2016. (GNU C library patch) Initial Enhanced REP MOVSB\/STOSB (ERMS) support. https:\/\/patchwork.ozlabs.org\/project\/glibc\/patch\/20160328204830.GA402@intel.com."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/168619.168633"},{"key":"e_1_3_2_1_31_1","unstructured":"2024. sendfile(2) \u2014 Linux manual page. https:\/\/man7.org\/linux\/man-pages\/man2\/sendfile.2.html."},{"key":"e_1_3_2_1_32_1","unstructured":"2024. vmsplice(2) \u2014 Linux manual page. https:\/\/man7.org\/linux\/man-pages\/man2\/vmsplice.2.html."},{"key":"e_1_3_2_1_33_1","volume-title":"Proceedings of the 11th USENIX Conference on Operating Systems Design and Implementation","author":"Peter Simon","year":"2014","unstructured":"Simon Peter, Jialin Li, Irene Zhang, Dan R. K. Ports, Doug Woos, Arvind Krishnamurthy, Thomas Anderson, and Timothy Roscoe. 2014. Arrakis: the operating system is the control plane. In Proceedings of the 11th USENIX Conference on Operating Systems Design and Implementation (Broomfield, CO) (OSDI'14). USENIX Association, USA, 1\u201316. https:\/\/www.usenix.org\/conference\/osdi14\/technical-sessions\/presentation\/peter"},{"key":"e_1_3_2_1_34_1","volume-title":"16th USENIX Symposium on Operating Systems Design and Implementation (OSDI 22)","author":"Zhong Yuhong","year":"2022","unstructured":"Yuhong Zhong, Haoyu Li, Yu Jian Wu, Ioannis Zarkadas, Jeffrey Tao, Evan Mesterhazy, Michael Makris, Junfeng Yang, Amy Tai, Ryan Stutsman, and Asaf Cidon. 2022. XRP: In-Kernel Storage Functions with eBPF. In 16th USENIX Symposium on Operating Systems Design and Implementation (OSDI 22). USENIX Association, Carlsbad, CA, 375\u2013393. https:\/\/www.usenix.org\/conference\/osdi22\/presentation\/zhong"},{"key":"e_1_3_2_1_35_1","unstructured":"2024. HarmonyOS 5.0.0 Release Notes. https:\/\/developer.huawei.com\/consumer\/en\/doc\/atomic-releases\/atomic-releasenotes-500."},{"key":"e_1_3_2_1_36_1","unstructured":"2024. Protocol Buffers Documentation. https:\/\/protobuf.dev."},{"key":"e_1_3_2_1_37_1","volume-title":"Deep Dive into Android IPC\/Binder Framework at Android Builders Summit","year":"2013","unstructured":"2025. Deep Dive into Android IPC\/Binder Framework at Android Builders Summit 2013. https:\/\/events.static.linuxfound.org\/images\/stories\/slides\/abs2013_gargentas.pdf."},{"key":"e_1_3_2_1_38_1","unstructured":"2024. zlib - A Massively Spiffy Yet Delicately Unobtrusive Compression Library. https:\/\/github.com\/openssl\/openssl."},{"key":"e_1_3_2_1_39_1","unstructured":"2024. OpenSSL - TLS\/SSL and crypto library. https:\/\/github.com\/openssl\/openssl."},{"key":"e_1_3_2_1_40_1","unstructured":"2025. Libpng is the official PNG reference library. http:\/\/www.libpng.org\/pub\/png\/libpng.html."},{"key":"e_1_3_2_1_41_1","unstructured":"2024. ffmpeg - A complete cross-platform solution to record convert and stream audio and video. https:\/\/ffmpeg.org."},{"key":"e_1_3_2_1_42_1","unstructured":"2010. The new linux 'perf' tools. http:\/\/oldvger.kernel.org\/~acme\/perf\/lk2010-perf-paper.pdf."},{"key":"e_1_3_2_1_43_1","unstructured":"2024. F-Stack: High Performance Network Framework Based On DPDK. http:\/\/www.f-stack.org\/."},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/3302424.3303985"},{"key":"e_1_3_2_1_45_1","unstructured":"2022. Intel Architecture Instruction Set Extensions and Future Features. https:\/\/www.intel.com\/content\/www\/us\/en\/support\/articles\/000005779\/processors.html."},{"key":"e_1_3_2_1_46_1","unstructured":"2018. Why can the kernel not use SSE\/AVX registers and instructions? https:\/\/unix.stackexchange.com\/questions\/475956."},{"key":"e_1_3_2_1_47_1","unstructured":"2006. Accelerating High-Speed Networking with Intel I\/O Acceleration Technology. https:\/\/www.intel.com\/content\/dam\/doc\/white-paper\/i-o-acceleration-technology-paper.pdf."},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.5555\/1268299.1268320"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3173162.3173175"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1145\/3458336.3465287"},{"key":"e_1_3_2_1_51_1","unstructured":"2020. Tencent Photo Cache traces - SNIA. http:\/\/iotta.snia.org\/traces\/parallel\/27476."},{"key":"e_1_3_2_1_52_1","unstructured":"2020. Twitter Memcached traces - SNIA. http:\/\/iotta.snia.org\/traces\/key-value."},{"key":"e_1_3_2_1_53_1","unstructured":"2020. Alibaba Block Traces. https:\/\/github.com\/alibaba\/block-traces."},{"key":"e_1_3_2_1_54_1","unstructured":"2024. Kernel Samepage Merging. https:\/\/www.kernel.org\/doc\/html\/latest\/admin-guide\/mm\/ksm.html."},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1145\/3477132.3483569"},{"key":"e_1_3_2_1_56_1","unstructured":"2025. Intel Data Streaming Accelerator (Intel DSA). https:\/\/www.intel.com\/content\/www\/us\/en\/products\/docs\/accelerator-engines\/data-streaming-accelerator.html."},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1145\/2540708.2540725"},{"key":"e_1_3_2_1_58_1","unstructured":"2024. NAPI Document. https:\/\/docs.kernel.org\/networking\/napi.html."},{"key":"e_1_3_2_1_59_1","unstructured":"2022. io_uring: add napi busy polling support. https:\/\/lwn.net\/Articles\/915657\/."},{"key":"e_1_3_2_1_60_1","unstructured":"2024. cgroups - Linux control groups. http:\/\/man7.org\/linux\/man-pages\/man7\/cgroups.7.html."},{"key":"e_1_3_2_1_61_1","unstructured":"2025. Kubernetes: Production-Grade Container Orchestration. https:\/\/kubernetes.io."},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.5555\/1594371.1594375"},{"key":"e_1_3_2_1_63_1","unstructured":"2025. Linux Virtual Memory Area (VMA). https:\/\/litux.nl\/mirror\/kerneldevelopment\/0672327201\/ch14lev1sec2.html."},{"key":"e_1_3_2_1_64_1","unstructured":"2019. Explicit pinning of user-space pages. https:\/\/lwn.net\/Articles\/807108\/."},{"key":"e_1_3_2_1_65_1","unstructured":"2024. DPDK. https:\/\/www.dpdk.org\/."},{"key":"e_1_3_2_1_66_1","unstructured":"2021. Storage Performance Development Kit. https:\/\/spdk.io\/."},{"key":"e_1_3_2_1_67_1","volume-title":"16th USENIX Symposium on Networked Systems Design and Implementation (NSDI 19)","author":"Kalia Anuj","year":"2019","unstructured":"Anuj Kalia, Michael Kaminsky, and David Andersen. 2019. Datacenter RPCs can be General and Fast. In 16th USENIX Symposium on Networked Systems Design and Implementation (NSDI 19). USENIX Association, Boston, MA, 1\u201316. https:\/\/www.usenix.org\/conference\/nsdi19\/presentation\/kalia"},{"key":"e_1_3_2_1_68_1","doi-asserted-by":"publisher","DOI":"10.1145\/3132747.3132772"},{"key":"e_1_3_2_1_69_1","doi-asserted-by":"publisher","DOI":"10.1145\/3542929.3563470"},{"key":"e_1_3_2_1_70_1","unstructured":"2024. memcached - a distributed memory object caching system. https:\/\/www.memcached.org."},{"key":"e_1_3_2_1_71_1","unstructured":"2024. Apache HTTP Server - the Number One HTTP Server On The Internet. https:\/\/httpd.apache.org."},{"key":"e_1_3_2_1_72_1","volume-title":"Proceedings of the 2012 USENIX Conference on Annual Technical Conference (Boston, MA) (USENIX ATC'12). USENIX Association, USA, 28","author":"Serebryany Konstantin","year":"2012","unstructured":"Konstantin Serebryany, Derek Bruening, Alexander Potapenko, and Dmitry Vyukov. 2012. AddressSanitizer: a fast address sanity checker. In Proceedings of the 2012 USENIX Conference on Annual Technical Conference (Boston, MA) (USENIX ATC'12). USENIX Association, USA, 28. https:\/\/www.usenix.org\/conference\/atc12\/technical-sessions\/presentation\/serebryany"},{"key":"e_1_3_2_1_73_1","doi-asserted-by":"publisher","DOI":"10.1145\/1791194.1791203"},{"key":"e_1_3_2_1_74_1","unstructured":"2025. Valgrind Memcheck: a memory error detector. https:\/\/valgrind.org\/docs\/manual\/mc-manual.html."},{"key":"e_1_3_2_1_75_1","unstructured":"2015. AddressSanitizer Manual of the Poisoning APIs. https:\/\/github.com\/google\/sanitizers\/wiki\/AddressSanitizerManualPoisoning."},{"key":"e_1_3_2_1_76_1","unstructured":"2024. Kernel Address Sanitizer (KASAN) \u2014 The Linux Kernel documentation. https:\/\/www.kernel.org\/doc\/html\/latest\/dev-tools\/kasan.html."},{"key":"e_1_3_2_1_77_1","doi-asserted-by":"publisher","DOI":"10.1145\/3600006.3613157"},{"key":"e_1_3_2_1_78_1","unstructured":"2024. Multi-Level Intermediate Representation Overview. https:\/\/mlir.llvm.org\/docs\/Tutorials\/DataFlowAnalysis\/."},{"key":"e_1_3_2_1_79_1","unstructured":"2024. Passes - MLIR. https:\/\/mlir.llvm.org\/docs\/Passes\/."},{"key":"e_1_3_2_1_80_1","unstructured":"2024. Checksum Offloads. https:\/\/www.kernel.org\/doc\/html\/v5.8\/networking\/checksum-offloads.html."},{"key":"e_1_3_2_1_81_1","first-page":"9","volume":"4","year":"2024","unstructured":"2024. OFED Documentation Rev 4.9-2.2.4.0 LTS - Checksum Offload. https:\/\/docs.nvidia.com\/networking\/display\/mlnxofedv492240\/checksum+offload.","journal-title":"OFED Documentation Rev"},{"key":"e_1_3_2_1_82_1","doi-asserted-by":"publisher","DOI":"10.1145\/3317550.3321435"},{"key":"e_1_3_2_1_83_1","doi-asserted-by":"publisher","DOI":"10.5555\/1855741.1855763"},{"key":"e_1_3_2_1_84_1","unstructured":"2024. Parcel. https:\/\/developer.android.com\/reference\/android\/os\/Parcel."},{"key":"e_1_3_2_1_85_1","unstructured":"2016. Intel Xeon Processor E5-2650 v4. https:\/\/www.intel.com\/content\/www\/us\/en\/products\/sku\/91767\/intel-xeon-processor-e52650-v4-30m-cache-2-20-ghz\/specifications.html."},{"key":"e_1_3_2_1_86_1","unstructured":"2023. Linus Torvalds Cleans Up The x86 Memory Copy Code For Linux 6.4. https:\/\/git.kernel.org\/pub\/scm\/linux\/kernel\/git\/torvalds\/linux.git\/commit\/?id=a5624566431de76b17862383d9ae254d9606cba9."},{"key":"e_1_3_2_1_87_1","volume-title":"Userspace Bypass: Accelerating Syscall-intensive Applications. In 17th USENIX Symposium on Operating Systems Design and Implementation (OSDI 23)","author":"Zhou Zhe","year":"2023","unstructured":"Zhe Zhou, Yanxiang Bi, Junpeng Wan, Yangfan Zhou, and Zhou Li. 2023. Userspace Bypass: Accelerating Syscall-intensive Applications. In 17th USENIX Symposium on Operating Systems Design and Implementation (OSDI 23). USENIX Association, Boston, MA, 33\u201349. https:\/\/www.usenix.org\/conference\/osdi23\/presentation\/zhou-zhe"},{"key":"e_1_3_2_1_88_1","unstructured":"2018. Zero-copy TCP receive. https:\/\/lwn.net\/Articles\/752188\/."},{"key":"e_1_3_2_1_89_1","unstructured":"2021. Header-Data Split Architecture. https:\/\/learn.microsoft.com\/en-us\/windows-hardware\/drivers\/network\/header-data-split-architecture."},{"key":"e_1_3_2_1_90_1","unstructured":"2024. Redis Benchmark Documentation. https:\/\/redis.io\/docs\/management\/optimization\/benchmarks\/."},{"key":"e_1_3_2_1_91_1","unstructured":"2020. Intel Xeon Gold 6238R Processor. https:\/\/www.intel.com\/content\/www\/us\/en\/products\/sku\/199345\/intel-xeon-gold-6238r-processor-38-5m-cache-2-20-ghz\/specifications.html."},{"key":"e_1_3_2_1_92_1","unstructured":"2024. Knative is an Open-Source Enterprise-level solution to build Serverless and Event Driven Applications. https:\/\/knative.dev\/docs\/."},{"key":"e_1_3_2_1_93_1","unstructured":"2024. gRPC Documentation. https:\/\/grpc.io\/docs\/."},{"key":"e_1_3_2_1_94_1","unstructured":"2024. zlib replacement with optimizations for \"next generation\" systems. https:\/\/github.com\/zlib-ng\/zlib-ng."},{"key":"e_1_3_2_1_95_1","unstructured":"2006. Add memcpy_uncached_read a memcpy that tries to reduce cache pressure. https:\/\/lwn.net\/Articles\/213971\/."},{"key":"e_1_3_2_1_96_1","unstructured":"2022. DPDK non-temporal memcpy. https:\/\/mails.dpdk.org\/archives\/dev\/2022-August\/247795.html."},{"key":"e_1_3_2_1_97_1","volume-title":"Automatically Reasoning About How Systems Code Uses the CPU Cache. In 18th USENIX Symposium on Operating Systems Design and Implementation (OSDI 24)","author":"Iyer Rishabh","year":"2024","unstructured":"Rishabh Iyer, Katerina Argyraki, and George Candea. 2024. Automatically Reasoning About How Systems Code Uses the CPU Cache. In 18th USENIX Symposium on Operating Systems Design and Implementation (OSDI 24). USENIX Association, Santa Clara, CA, 581\u2013598. https:\/\/www.usenix.org\/conference\/osdi24\/presentation\/iyer"},{"key":"e_1_3_2_1_98_1","doi-asserted-by":"publisher","DOI":"10.1145\/1755913.1755947"},{"key":"e_1_3_2_1_99_1","volume-title":"DMon: Efficient Detection and Correction of Data Locality Problems Using Selective Profiling. In 15th USENIX Symposium on Operating Systems Design and Implementation (OSDI 21)","author":"Khan Tanvir Ahmed","year":"2021","unstructured":"Tanvir Ahmed Khan, Ian Neal, Gilles Pokam, Barzan Mozafari, and Baris Kasikci. 2021. DMon: Efficient Detection and Correction of Data Locality Problems Using Selective Profiling. In 15th USENIX Symposium on Operating Systems Design and Implementation (OSDI 21). USENIX Association, 163\u2013181. https:\/\/www.usenix.org\/conference\/osdi21\/presentation\/khan"},{"key":"e_1_3_2_1_100_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA59077.2024.00084"},{"key":"e_1_3_2_1_101_1","doi-asserted-by":"publisher","DOI":"10.1145\/3503222.3507774"},{"key":"e_1_3_2_1_102_1","unstructured":"2022. NVIDIA H100 Tensor Core GPU Architecture. https:\/\/resources.nvidia.com\/en-us-hopper-architecture\/nvidia-h100-tensor-c."},{"key":"e_1_3_2_1_103_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA51647.2021.00071"},{"key":"e_1_3_2_1_104_1","volume-title":"Fast","author":"Heiser Gernot","unstructured":"Gernot Heiser, Ivan Velickovic, Peter Chubb, Alwin Joshy, Anuraag Ganesh, Bill Nguyen, Cheng Li, Courtney Darville, Guangtao Zhu, James Archer, Jingyao Zhou, Krishnan Winter, Lucy Parker, Szymon Duchniewicz, and Tianyi Bai. 2025. Fast, Secure, Adaptable: LionsOS Design, Implementation and Performance. arXiv:2501.06234 [cs.OS] https:\/\/arxiv.org\/abs\/2501.06234"},{"key":"e_1_3_2_1_105_1","volume-title":"Proceedings of the 2011 USENIX Conference on USENIX Annual Technical Conference (Portland, OR) (USENIX ATC'11). USENIX Association, USA, 10","author":"Soares Livio","year":"2011","unstructured":"Livio Soares and Michael Stumm. 2011. Exception-less system calls for event-driven servers. In Proceedings of the 2011 USENIX Conference on USENIX Annual Technical Conference (Portland, OR) (USENIX ATC'11). USENIX Association, USA, 10. https:\/\/www.usenix.org\/conference\/usenixatc11\/exception-less-system-calls-event-driven-servers"},{"key":"e_1_3_2_1_106_1","doi-asserted-by":"publisher","DOI":"10.1145\/2699681"},{"key":"e_1_3_2_1_107_1","doi-asserted-by":"publisher","DOI":"10.1145\/2048066.2048134"},{"key":"e_1_3_2_1_108_1","doi-asserted-by":"publisher","DOI":"10.1145\/1629575.1629579"},{"key":"e_1_3_2_1_109_1","doi-asserted-by":"publisher","DOI":"10.1145\/3477132.3483543"},{"key":"e_1_3_2_1_110_1","doi-asserted-by":"publisher","DOI":"10.1145\/3694715.3695983"},{"key":"e_1_3_2_1_111_1","volume-title":"Proceedings of the 11th USENIX Conference on Operating Systems Design and Implementation","author":"Belay Adam","year":"2014","unstructured":"Adam Belay, George Prekas, Ana Klimovic, Samuel Grossman, Christos Kozyrakis, and Edouard Bugnion. 2014. IX: a protected dataplane operating system for high throughput and low latency. In Proceedings of the 11th USENIX Conference on Operating Systems Design and Implementation (Broomfield, CO) (OSDI'14). USENIX Association, USA, 49\u201365. https:\/\/www.usenix.org\/conference\/osdi14\/technical-sessions\/presentation\/belay"},{"key":"e_1_3_2_1_112_1","volume-title":"StackMap: Low-Latency Networking with the OS Stack and Dedicated NICs. In 2016 USENIX Annual Technical Conference (USENIX ATC 16)","author":"Yasukata Kenichi","year":"2016","unstructured":"Kenichi Yasukata, Michio Honda, Douglas Santry, and Lars Eggert. 2016. StackMap: Low-Latency Networking with the OS Stack and Dedicated NICs. In 2016 USENIX Annual Technical Conference (USENIX ATC 16). USENIX Association, Denver, CO, 43\u201356. https:\/\/www.usenix.org\/conference\/atc16\/technical-sessions\/presentation\/yasukata"},{"key":"e_1_3_2_1_113_1","volume-title":"Proceedings of the 10th USENIX Conference on Operating Systems Design and Implementation","author":"Han Sangjin","year":"2012","unstructured":"Sangjin Han, Scott Marshall, Byung-Gon Chun, and Sylvia Ratnasamy. 2012. MegaPipe: a new programming interface for scalable network I\/O. In Proceedings of the 10th USENIX Conference on Operating Systems Design and Implementation (Hollywood, CA, USA) (OSDI'12). USENIX Association, USA, 135\u2013148. https:\/\/www.usenix.org\/conference\/osdi12\/technical-sessions\/presentation\/han."},{"key":"e_1_3_2_1_114_1","doi-asserted-by":"publisher","DOI":"10.5555\/3386691.3386699"},{"key":"e_1_3_2_1_115_1","volume-title":"11th USENIX Symposium on Networked Systems Design and Implementation (NSDI 14)","author":"Jeong EunYoung","year":"2014","unstructured":"EunYoung Jeong, Shinae Wood, Muhammad Jamshed, Haewon Jeong, Sunghwan Ihm, Dongsu Han, and KyoungSoo Park. 2014. mTCP: a Highly Scalable User-level TCP Stack for Multicore Systems. In 11th USENIX Symposium on Networked Systems Design and Implementation (NSDI 14). 489\u2013502."},{"key":"e_1_3_2_1_116_1","doi-asserted-by":"publisher","DOI":"10.1145\/3600006.3613137"},{"key":"e_1_3_2_1_117_1","volume-title":"2023 IEEE Symposium on Security and Privacy (SP). IEEE, 2956\u20132973","author":"Peng Dinglan","year":"2023","unstructured":"Dinglan Peng, Congyu Liu, Tapti Palit, Pedro Fonseca, Anjo Vahldiek-Oberwagner, and Mona Vij. 2023. \u03bcSwitch: Fast Kernel Context Isolation with Implicit Context Switches. In 2023 IEEE Symposium on Security and Privacy (SP). IEEE, 2956\u20132973."},{"key":"e_1_3_2_1_118_1","volume-title":"20th USENIX Symposium on Networked Systems Design and Implementation (NSDI 23)","author":"Chen Jingrong","year":"2023","unstructured":"Jingrong Chen, Yongji Wu, Shihan Lin, Yechen Xu, Xinhao Kong, Thomas Anderson, Matthew Lentz, Xiaowei Yang, and Danyang Zhuo. 2023. Remote Procedure Call as a Managed System Service. In 20th USENIX Symposium on Networked Systems Design and Implementation (NSDI 23). USENIX Association, Boston, MA, 141\u2013159. https:\/\/www.usenix.org\/conference\/nsdi23\/presentation\/chen-jingrong"},{"key":"e_1_3_2_1_119_1","volume-title":"Shenango: Achieving High CPU Efficiency for Latency-sensitive Datacenter Workloads. In 16th USENIX Symposium on Networked Systems Design and Implementation (NSDI 19)","author":"Ousterhout Amy","year":"2019","unstructured":"Amy Ousterhout, Joshua Fried, Jonathan Behrens, Adam Belay, and Hari Balakrishnan. 2019. Shenango: Achieving High CPU Efficiency for Latency-sensitive Datacenter Workloads. In 16th USENIX Symposium on Networked Systems Design and Implementation (NSDI 19). USENIX Association, Boston, MA, 361\u2013378. https:\/\/www.usenix.org\/conference\/nsdi19\/presentation\/ousterhout"},{"key":"e_1_3_2_1_120_1","volume-title":"14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20)","author":"Fried Joshua","year":"2020","unstructured":"Joshua Fried, Zhenyuan Ruan, Amy Ousterhout, and Adam Belay. 2020. Caladan: Mitigating Interference at Microsecond Timescales. In 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20). USENIX Association, 281\u2013297. https:\/\/www.usenix.org\/conference\/osdi20\/presentation\/fried"},{"key":"e_1_3_2_1_121_1","doi-asserted-by":"publisher","DOI":"10.5555\/3357062.3357081"},{"key":"e_1_3_2_1_122_1","doi-asserted-by":"publisher","DOI":"10.1145\/605397.605429"},{"key":"e_1_3_2_1_123_1","doi-asserted-by":"publisher","DOI":"10.1145\/1095810.1095814"},{"key":"e_1_3_2_1_124_1","doi-asserted-by":"publisher","DOI":"10.1109\/SP.2015.9"},{"key":"e_1_3_2_1_125_1","doi-asserted-by":"publisher","DOI":"10.1145\/2872362.2872371"},{"key":"e_1_3_2_1_126_1","doi-asserted-by":"publisher","DOI":"10.1145\/2103656.2103711"}],"event":{"name":"SOSP '25: ACM SIGOPS 31st Symposium on Operating Systems Principles","location":"Lotte Hotel World Seoul Republic of Korea","acronym":"SOSP '25","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems","USENIX"]},"container-title":["Proceedings of the ACM SIGOPS 31st Symposium on Operating Systems Principles"],"original-title":[],"deposited":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T12:45:35Z","timestamp":1759322735000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3731569.3764800"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,12]]},"references-count":126,"alternative-id":["10.1145\/3731569.3764800","10.1145\/3731569"],"URL":"https:\/\/doi.org\/10.1145\/3731569.3764800","relation":{},"subject":[],"published":{"date-parts":[[2025,10,12]]},"assertion":[{"value":"2025-10-12","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}