{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,10]],"date-time":"2025-12-10T09:04:30Z","timestamp":1765357470704,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":44,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,30]],"date-time":"2023-10-30T00:00:00Z","timestamp":1698624000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,30]]},"DOI":"10.1145\/3620678.3624794","type":"proceedings-article","created":{"date-parts":[[2023,10,31]],"date-time":"2023-10-31T13:58:07Z","timestamp":1698760687000},"page":"597-610","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":6,"title":["Chitu"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-2170-6560","authenticated-orcid":false,"given":"Zhengyu","family":"Lei","sequence":"first","affiliation":[{"name":"ICT, CAS, UCAS, Zhongguancun Lab"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7105-8355","authenticated-orcid":false,"given":"Xiao","family":"Shi","sequence":"additional","affiliation":[{"name":"ICT, CAS, Nanjing Institute of InforSuperBahn"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-7089-0315","authenticated-orcid":false,"given":"Cunchi","family":"Lv","sequence":"additional","affiliation":[{"name":"ICT, CAS, UCAS Zhongguancun Lab"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-2017-5871","authenticated-orcid":false,"given":"Xiaobing","family":"Yu","sequence":"additional","affiliation":[{"name":"ICT, CAS, UCAS"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1898-1359","authenticated-orcid":false,"given":"Xiaofang","family":"Zhao","sequence":"additional","affiliation":[{"name":"ICT, CAS, UCAS, IICT, Suzhou, CAS UCAS, Nanjing Zhongguancun Lab"}]}],"member":"320","published-online":{"date-parts":[[2023,10,31]]},"reference":[{"volume-title":"Anna: A kvs for any scale","unstructured":"2019. Anna: A kvs for any scale. Vol. 33. IEEE.","key":"e_1_3_2_1_1_1"},{"volume-title":"Stateful serverless computing with crucial","unstructured":"2022. Stateful serverless computing with crucial. Vol. 31. ACM New York, NY.","key":"e_1_3_2_1_2_1"},{"unstructured":"2023. AWS Lambda. https:\/\/aws.amazon.com\/cn\/lambda","key":"e_1_3_2_1_3_1"},{"unstructured":"2023. AWS Step Functions. https:\/\/aws.amazon.com\/step-functions","key":"e_1_3_2_1_4_1"},{"unstructured":"2023. Azure Functions. https:\/\/azure.microsoft.com\/en-us\/services\/functions\/","key":"e_1_3_2_1_5_1"},{"unstructured":"2023. Beam model. https:\/\/beam.apache.org\/documentation\/basics","key":"e_1_3_2_1_6_1"},{"unstructured":"2023. Big Data Benchmark. https:\/\/amplab.cs.berkeley.edu\/benchmark\/","key":"e_1_3_2_1_7_1"},{"unstructured":"2023. Google Cloud Functions. https:\/\/cloud.google.com\/functions","key":"e_1_3_2_1_8_1"},{"unstructured":"2023. Knix Microfunctions. https:\/\/github.com\/knix-microfunctions\/knix","key":"e_1_3_2_1_9_1"},{"unstructured":"2023. OpenFaaS. https:\/\/www.openfaas.com.","key":"e_1_3_2_1_10_1"},{"key":"e_1_3_2_1_11_1","volume-title":"2018 Usenix Annual Technical Conference (ATC'18)","author":"Akkus Istemi Ekin","year":"2018","unstructured":"Istemi Ekin Akkus, Ruichuan Chen, Ivica Rimac, Manuel Stein, Klaus Satzke, Andre Beck, Paarijaat Aditya, and Volker Hilt. 2018. {SAND}: Towards High-Performance serverless computing. In 2018 Usenix Annual Technical Conference (ATC'18). 923--935."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_12_1","DOI":"10.1145\/3267809.3267815"},{"key":"e_1_3_2_1_13_1","volume-title":"14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20)","author":"Bai Zhihao","year":"2020","unstructured":"Zhihao Bai, Zhen Zhang, Yibo Zhu, and Xin Jin. 2020. {PipeSwitch}: Fast pipelined context switching for deep learning applications. In 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20). 499--514."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_14_1","DOI":"10.1145\/3448016.3457560"},{"key":"e_1_3_2_1_15_1","volume-title":"Apache flink: Stream and batch processing in a single engine. The Bulletin of the Technical Committee on Data Engineering 38, 4","author":"Carbone Paris","year":"2015","unstructured":"Paris Carbone, Asterios Katsifodimos, Stephan Ewen, Volker Markl, Seif Haridi, and Kostas Tzoumas. 2015. Apache flink: Stream and batch processing in a single engine. The Bulletin of the Technical Committee on Data Engineering 38, 4 (2015)."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_16_1","DOI":"10.1145\/3357223.3362711"},{"key":"e_1_3_2_1_17_1","volume-title":"rFaaS: Enabling High Performance Serverless with RDMA and Decentralization. arXiv preprint arXiv:2106.13859","author":"Copik Marcin","year":"2021","unstructured":"Marcin Copik, Konstantin Taranov, Alexandru Calotoiu, and Torsten Hoefler. 2021. rFaaS: Enabling High Performance Serverless with RDMA and Decentralization. arXiv preprint arXiv:2106.13859 (2021)."},{"key":"e_1_3_2_1_18_1","volume-title":"14th USENIX Symposium on Networked Systems Design and Implementation (NSDI'17)","author":"Fouladi Sadjad","year":"2017","unstructured":"Sadjad Fouladi, Riad S Wahby, Brennan Shacklett, Karthikeyan Vasuki Balasubramaniam, William Zeng, Rahul Bhalerao, Anirudh Sivaraman, George Porter, and Keith Winstein. 2017. Encoding, fast and slow: {Low-Latency} video processing using thousands of tiny threads. In 14th USENIX Symposium on Networked Systems Design and Implementation (NSDI'17). 363--376."},{"key":"e_1_3_2_1_19_1","first-page":"779","article-title":"Hydrozoa: Dynamic Hybrid-Parallel DNN Training on Serverless Containers","volume":"4","author":"Guo Runsheng","year":"2022","unstructured":"Runsheng Guo, Victor Guo, Antonio Kim, Josh Hildred, and Khuzaima Daudjee. 2022. Hydrozoa: Dynamic Hybrid-Parallel DNN Training on Serverless Containers. Proceedings of Machine Learning and Systems 4, 779--794.","journal-title":"Proceedings of Machine Learning and Systems"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_20_1","DOI":"10.1145\/2594291.2594324"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_21_1","DOI":"10.1145\/3477132.3483541"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_22_1","DOI":"10.1145\/3448016.3459240"},{"unstructured":"Eric Jonas Johann Schleier-Smith Vikram Sreekanti Chia-Che Tsai Anurag Khandelwal Qifan Pu Vaishaal Shankar Joao Carreira Karl Krauth Neeraja Yadwadkar et al. 2019. Cloud programming simplified: A berkeley view on serverless computing. arXiv preprint arXiv:1902.03383 (2019).","key":"e_1_3_2_1_23_1"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_24_1","DOI":"10.1145\/301104.301116"},{"key":"e_1_3_2_1_25_1","volume-title":"13th USENIX Symposium on Operating Systems Design and Implementation (OSDI'18)","author":"Klimovic Ana","year":"2018","unstructured":"Ana Klimovic, Yawen Wang, Patrick Stuedi, Animesh Trivedi, Jonas Pfefferle, and Christos Kozyrakis. 2018. Pocket: Elastic ephemeral storage for serverless analytics. In 13th USENIX Symposium on Operating Systems Design and Implementation (OSDI'18). 427--444."},{"key":"e_1_3_2_1_26_1","volume-title":"2021 USENIX Annual Technical Conference (USENIX ATC '21)","author":"Kotni Swaroop","year":"2021","unstructured":"Swaroop Kotni, Ajay Nayak, Vinod Ganapathy, and Arkaprava Basu. 2021. Faastlane: Accelerating {Function-as-a-Service} Workflows. In 2021 USENIX Annual Technical Conference (USENIX ATC '21). 805--820."},{"volume-title":"Big learning NIPS workshop","author":"Li Mu","unstructured":"Mu Li, Li Zhou, Zichao Yang, Aaron Li, Fei Xia, David G Andersen, and Alexander Smola. 2013. Parameter server for distributed machine learning. In Big learning NIPS workshop, Vol. 6.","key":"e_1_3_2_1_27_1"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_28_1","DOI":"10.1145\/3570607"},{"key":"e_1_3_2_1_29_1","volume-title":"In Proceedings of the 6th Biennial Conference on Innovative Data Systems Research (CIDR'13)","author":"McSherry Frank","year":"2013","unstructured":"Frank McSherry, Derek Gordon Murray, Rebecca Isaacs, and Michael Isard. 2013. Differential Dataflow.. In In Proceedings of the 6th Biennial Conference on Innovative Data Systems Research (CIDR'13)."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_30_1","DOI":"10.1145\/3318464.3389758"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_31_1","DOI":"10.1145\/3341301.3359646"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_32_1","DOI":"10.1145\/3341301.3359642"},{"key":"e_1_3_2_1_33_1","volume-title":"16th USENIX symposium on networked systems design and implementation (NSDI'19)","author":"Pu Qifan","year":"2019","unstructured":"Qifan Pu, Shivaram Venkataraman, and Ion Stoica. 2019. Shuffling, fast and slow: Scalable analytics on serverless infrastructure. In 16th USENIX symposium on networked systems design and implementation (NSDI'19). 193--206."},{"key":"e_1_3_2_1_34_1","volume-title":"Numpywren: Serverless linear algebra. arXiv preprint arXiv:1810.09679","author":"Shankar Vaishaal","year":"2018","unstructured":"Vaishaal Shankar, Karl Krauth, Qifan Pu, Eric Jonas, Shivaram Venkataraman, Ion Stoica, Benjamin Recht, and Jonathan Ragan-Kelley. 2018. Numpywren: Serverless linear algebra. arXiv preprint arXiv:1810.09679 (2018)."},{"key":"e_1_3_2_1_35_1","volume-title":"2020 USENIX Annual Technical Conference (ATC'20)","author":"Shillaker Simon","year":"2020","unstructured":"Simon Shillaker and Peter Pietzuch. 2020. Faasm: Lightweight isolation for efficient stateful serverless computing. In 2020 USENIX Annual Technical Conference (ATC'20). 419--433."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_36_1","DOI":"10.14778\/3407790.3407836"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_37_1","DOI":"10.1109\/CLOUD49709.2020.00049"},{"key":"e_1_3_2_1_38_1","volume-title":"15th USENIX Symposium on Operating Systems Design and Implementation (OSDI'21)","author":"Thorpe John","year":"2021","unstructured":"John Thorpe, Yifan Qiao, Jonathan Eyolfson, Shen Teng, Guanzhou Hu, Zhihao Jia, Jinliang Wei, Keval Vora, Ravi Netravali, Miryung Kim, et al. 2021. Dorylus: Affordable, scalable, and accurate GNN training with distributed CPU servers and serverless threads. In 15th USENIX Symposium on Operating Systems Design and Implementation (OSDI'21). 495--514."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_39_1","DOI":"10.1145\/3458336.3465302"},{"key":"e_1_3_2_1_40_1","volume-title":"No Provisioned Concurrency: Fast RDMA-codesigned Remote Fork for Serverless Computing. In 17th USENIX Symposium on Operating Systems Design and Implementation (OSDI'23)","author":"Wei Xingda","year":"2023","unstructured":"Xingda Wei, Fangming Lu, Tianxia Wang, Jinyu Gu, Yuhan Yang, Rong Chen, and Haibo Chen. 2023. No Provisioned Concurrency: Fast RDMA-codesigned Remote Fork for Serverless Computing. In 17th USENIX Symposium on Operating Systems Design and Implementation (OSDI'23). 497--517."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_41_1","DOI":"10.14778\/3311880.3311881"},{"key":"e_1_3_2_1_42_1","volume-title":"20th USENIX Symposium on Networked Systems Design and Implementation (NSDI'23)","author":"Yu Minchen","year":"2023","unstructured":"Minchen Yu, Tingjia Cao, Wei Wang, and Ruichuan Chen. 2023. Following the data, not the function: Rethinking function orchestration in serverless computing. In 20th USENIX Symposium on Networked Systems Design and Implementation (NSDI'23). 1489--1504."},{"key":"e_1_3_2_1_43_1","volume-title":"14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20)","author":"Zhang Haoran","year":"2020","unstructured":"Haoran Zhang, Adney Cardoza, Peter Baile Chen, Sebastian Angel, and Vincent Liu. 2020. Fault-tolerant and transactional stateful serverless workflows. In 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI'20). 1187--1204."},{"key":"e_1_3_2_1_44_1","volume-title":"2017 USENIX Annual Technical Conference (ATC'17)","author":"Zhang Hao","year":"2017","unstructured":"Hao Zhang, Zeyu Zheng, Shizhen Xu, Wei Dai, Qirong Ho, Xiaodan Liang, Zhiting Hu, Jinliang Wei, Pengtao Xie, and Eric P Xing. 2017. Poseidon: An efficient communication architecture for distributed deep learning on {GPU} clusters. In 2017 USENIX Annual Technical Conference (ATC'17). 181--193."}],"event":{"sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGOPS ACM Special Interest Group on Operating Systems"],"acronym":"SoCC '23","name":"SoCC '23: ACM Symposium on Cloud Computing","location":"Santa Cruz CA USA"},"container-title":["Proceedings of the 2023 ACM Symposium on Cloud Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3620678.3624794","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3620678.3624794","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T15:53:45Z","timestamp":1755878025000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3620678.3624794"}},"subtitle":["Accelerating Serverless Workflows with Asynchronous State Replication Pipelines"],"short-title":[],"issued":{"date-parts":[[2023,10,30]]},"references-count":44,"alternative-id":["10.1145\/3620678.3624794","10.1145\/3620678"],"URL":"https:\/\/doi.org\/10.1145\/3620678.3624794","relation":{},"subject":[],"published":{"date-parts":[[2023,10,30]]},"assertion":[{"value":"2023-10-31","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}