{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,9]],"date-time":"2026-04-09T14:33:06Z","timestamp":1775745186872,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":48,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,30]],"date-time":"2023-10-30T00:00:00Z","timestamp":1698624000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,30]]},"DOI":"10.1145\/3620678.3624645","type":"proceedings-article","created":{"date-parts":[[2023,10,31]],"date-time":"2023-10-31T13:58:07Z","timestamp":1698760687000},"page":"32-47","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":24,"title":["Golgi"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3921-9037","authenticated-orcid":false,"given":"Suyi","family":"Li","sequence":"first","affiliation":[{"name":"HKUST"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4585-4152","authenticated-orcid":false,"given":"Wei","family":"Wang","sequence":"additional","affiliation":[{"name":"HKUST"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-8532-1262","authenticated-orcid":false,"given":"Jun","family":"Yang","sequence":"additional","affiliation":[{"name":"WeBank"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-1751-2685","authenticated-orcid":false,"given":"Guangzhen","family":"Chen","sequence":"additional","affiliation":[{"name":"WeBank"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-9916-3620","authenticated-orcid":false,"given":"Daohe","family":"Lu","sequence":"additional","affiliation":[{"name":"WeBank"}]}],"member":"320","published-online":{"date-parts":[[2023,10,31]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Proceedings of the 17th USENIX Symposium on Networked Systems Design and Implementation (NSDI 20)","author":"Agache Alexandru","year":"2020","unstructured":"Alexandru Agache, Marc Brooker, Alexandra Iordache, Anthony Liguori, Rolf Neugebauer, Phil Piwonka, and Diana-Maria Popa. 2020. Firecracker: Lightweight Virtualization for Serverless Applications. In Proceedings of the 17th USENIX Symposium on Networked Systems Design and Implementation (NSDI 20)."},{"key":"e_1_3_2_1_2_1","volume-title":"Proceedings of the 2018 USENIX Annual Technical Conference (USENIX ATC 18)","author":"Amvrosiadis George","year":"2018","unstructured":"George Amvrosiadis, Jun Woo Park, Gregory R. Ganger, Garth A. Gibson, Elisabeth Baseman, and Nathan DeBardeleben. 2018. On the diversity of cluster workloads and its impact on research results. In Proceedings of the 2018 USENIX Annual Technical Conference (USENIX ATC 18)."},{"key":"e_1_3_2_1_3_1","unstructured":"The Kubernetes Authors. 2023. Kubernetes Scheduling Framework. https:\/\/kubernetes.io\/docs\/concepts\/scheduling-eviction\/scheduling-framework\/."},{"key":"e_1_3_2_1_4_1","unstructured":"Microsoft Azure. 2022. Azure Functions Pricing. https:\/\/azure.microsoft.com\/en-us\/pricing\/details\/functions\/."},{"key":"e_1_3_2_1_5_1","unstructured":"Microsoft Azure. 2022. Concurrency in Azure Functions. https:\/\/docs.microsoft.com\/en-us\/azure\/azure-functions\/functions-concurrency."},{"key":"e_1_3_2_1_6_1","unstructured":"Microsoft Azure. 2022. What are Durable Functions? https:\/\/learn.microsoft.com\/en-us\/azure\/azure-functions\/durable\/durable-functions-overview?tabs=csharp."},{"key":"e_1_3_2_1_7_1","volume-title":"Proceedings of the MLSys 2021, NeurIPS 2020 Workshop on Machine Learning for Systems.","author":"Balaji Bharathan","year":"2020","unstructured":"Bharathan Balaji, Christopher Kakovitch, and Balakrishnan (Murali) Narayanaswamy. 2020. FirePlace: Placing FireCracker virtual machines with hindsight imitation. In Proceedings of the MLSys 2021, NeurIPS 2020 Workshop on Machine Learning for Systems."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/3447786.3456259"},{"key":"e_1_3_2_1_9_1","unstructured":"Alibaba Cloud. 2022. Aliyun Function Compute Pricing. https:\/\/www.alibabacloud.com\/help\/en\/doc-detail\/54301.html."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3132747.3132772"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"crossref","unstructured":"Alex Ellis. 2022. OpenFaaS: Server Functions Made Simple. https:\/\/www.openfaas.com\/.","DOI":"10.1002\/9781119682318.ch17"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/3190508.3190549"},{"key":"e_1_3_2_1_13_1","unstructured":"Google. 2022. Overcommitting CPUs on sole-tenant VMs. https:\/\/cloud.google.com\/compute\/docs\/nodes\/overcommitting-cpus-sole-tenant-vms."},{"key":"e_1_3_2_1_14_1","unstructured":"Google. 2022. Vertical Pod autoscaling. https:\/\/cloud.google.com\/kubernetes-engine\/docs\/concepts\/verticalpodautoscaler."},{"key":"e_1_3_2_1_15_1","volume-title":"Proceedings of the 14th USENIX Conference on Operating Systems Design and Implementation.","author":"Hao Mingzhe","unstructured":"Mingzhe Hao, Levent Toksoz, Nanqinqin Li, Edward Edberg Halim, Henry Hoffmann, and Haryadi S. Gunawi. 2020. LinnOS: Predictability on Unpredictable Flash Storage with a Light Neural Network. In Proceedings of the 14th USENIX Conference on Operating Systems Design and Implementation."},{"key":"e_1_3_2_1_16_1","unstructured":"Eric Jonas Johann Schleier-Smith Vikram Sreekanti Chia-Che Tsai Anurag Khandelwal Qifan Pu Vaishaal Shankar Joao Carreira Karl Krauth Neeraja Yadwadkar et al. 2019. Cloud programming simplified: A berkeley view on serverless computing. arXiv preprint arXiv:1902.03383 (2019)."},{"key":"e_1_3_2_1_17_1","volume-title":"Proceedings of the 13th USENIX Symposium on Operating Systems Design and Implementation (OSDI 18)","author":"Klimovic Ana","year":"2018","unstructured":"Ana Klimovic, Yawen Wang, Patrick Stuedi, Animesh Trivedi, Jonas Pfefferle, and Christos Kozyrakis. 2018. Pocket: Elastic Ephemeral Storage for Serverless Analytics. In Proceedings of the 13th USENIX Symposium on Operating Systems Design and Implementation (OSDI 18)."},{"key":"e_1_3_2_1_18_1","volume-title":"Proceedings of the Advances in Neural Information Processing Systems (NeurIPS 14)","author":"Lakshminarayanan Balaji","year":"2014","unstructured":"Balaji Lakshminarayanan, Daniel M Roy, and Yee Whye Teh. 2014. Mondrian Forests: Efficient Online Random Forests. In Proceedings of the Advances in Neural Information Processing Systems (NeurIPS 14)."},{"key":"e_1_3_2_1_19_1","unstructured":"AWS Lambda. 2022. AWS Lambda Pricing. https:\/\/aws.amazon.com\/lambda\/pricing\/."},{"key":"e_1_3_2_1_20_1","unstructured":"AWS Lambda. 2022. How do I request a concurrency limit increase for my Lambda function? https:\/\/aws.amazon.com\/premiumsupport\/knowledge-center\/lambda-concurrency-limit-increase\/."},{"key":"e_1_3_2_1_21_1","unstructured":"AWS Lambda. 2022. Lambda function scaling. https:\/\/docs.aws.amazon.com\/lambda\/latest\/dg\/invocation-scaling.html."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3472883.3486971"},{"key":"e_1_3_2_1_23_1","volume-title":"Proceedings of the 2021 USENIX Annual Technical Conference (ATC 21)","author":"Mahgoub Ashraf","year":"2021","unstructured":"Ashraf Mahgoub, Karthick Shankar, Subrata Mitra, Ana Klimovic, Somali Chaterji, and Saurabh Bagchi. 2021. SONIC: Application-aware Data Passing for Chained Serverless Applications. In Proceedings of the 2021 USENIX Annual Technical Conference (ATC 21)."},{"key":"e_1_3_2_1_24_1","volume-title":"Proceedings of the 16th USENIX Symposium on Operating Systems Design and Implementation (OSDI 22)","author":"Mahgoub Ashraf","year":"2022","unstructured":"Ashraf Mahgoub, Edgardo Barsallo Yi, Karthick Shankar, Sameh Elnikety, Somali Chaterji, and Saurabh Bagchi. 2022. ORION and the Three Rights: Sizing, Bundling, and Prewarming for Serverless DAGs. In Proceedings of the 16th USENIX Symposium on Operating Systems Design and Implementation (OSDI 22)."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/71.963420"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3447786.3456239"},{"key":"e_1_3_2_1_27_1","volume-title":"Tensorflow-serving: Flexible, high-performance ml serving. arXiv preprint arXiv:1712.06139","author":"Olston Christopher","year":"2017","unstructured":"Christopher Olston, Noah Fiedel, Kiril Gorovoy, Jeremiah Harmsen, Li Lao, Fangwei Li, Vinu Rajashekhar, Sukriti Ramesh, and Jordan Soyke. 2017. Tensorflow-serving: Flexible, high-performance ml serving. arXiv preprint arXiv:1712.06139 (2017)."},{"key":"e_1_3_2_1_28_1","volume-title":"Scikit-learn: Machine Learning in Python. Journal of Machine Learning Research","author":"Pedregosa F.","year":"2011","unstructured":"F. Pedregosa, G. Varoquaux, A. Gramfort, V. Michel, B. Thirion, O. Grisel, M. Blondel, P. Prettenhofer, R. Weiss, V. Dubourg, J. Vanderplas, A. Passos, D. Cournapeau, M. Brucher, M. Perrot, and E. Duchesnay. 2011. Scikit-learn: Machine Learning in Python. Journal of Machine Learning Research (2011)."},{"key":"e_1_3_2_1_29_1","volume-title":"Proceedings of the 16th USENIX Symposium on Networked Systems Design and Implementation (NSDI 19)","author":"Pu Qifan","year":"2019","unstructured":"Qifan Pu, Shivaram Venkataraman, and Ion Stoica. 2019. Shuffling, Fast and Slow: Scalable Analytics on Serverless Infrastructure. In Proceedings of the 16th USENIX Symposium on Networked Systems Design and Implementation (NSDI 19)."},{"key":"e_1_3_2_1_30_1","unstructured":"Ran Ribenzaft. 2019. What AWS Lambda's Performance Stats Reveal. https:\/\/epsagon.com\/observability\/what-aws-lambda-performance-stats-reveal-key-metrics\/."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3472883.3486974"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/3342195.3387524"},{"key":"e_1_3_2_1_33_1","volume-title":"Joseph E Gonzalez, Ion Stoica, and David A Patterson.","author":"Schleier-Smith Johann","year":"2021","unstructured":"Johann Schleier-Smith, Vikram Sreekanti, Anurag Khandelwal, Joao Carreira, Neeraja J Yadwadkar, Raluca Ada Popa, Joseph E Gonzalez, Ion Stoica, and David A Patterson. 2021. What serverless computing is and should become: The next phase of cloud computing. Commun. ACM (2021)."},{"key":"e_1_3_2_1_34_1","volume-title":"Proceedings of the 2020 USENIX Annual Technical Conference (ATC 20)","author":"Shahrad Mohammad","year":"2020","unstructured":"Mohammad Shahrad, Rodrigo Fonseca, Inigo Goiri, Gohar Chaudhry, Paul Batum, Jason Cooke, Eduardo Laureano, Colby Tresness, Mark Russinovich, and Ricardo Bianchini. 2020. Serverless in the Wild: Characterizing and Optimizing the Serverless Workload at a Large Cloud Provider. In Proceedings of the 2020 USENIX Annual Technical Conference (ATC 20)."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3472883.3486981"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.14778\/3407790.3407836"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/3542929.3563470"},{"key":"e_1_3_2_1_38_1","volume-title":"Owl: Performance-Aware Scheduling for Resource-Efficient Function-as-a-Service Cloud. https:\/\/www.cse.ust.hk\/~weiwa\/papers\/owl-techreport.pdf.","author":"Tian Huangshi","year":"2022","unstructured":"Huangshi Tian, Suyi Li, Ao Wang, Wei Wang, Tianlong Wu, and Haoran Yang. 2022. Owl: Performance-Aware Scheduling for Resource-Efficient Function-as-a-Service Cloud. https:\/\/www.cse.ust.hk\/~weiwa\/papers\/owl-techreport.pdf."},{"key":"e_1_3_2_1_39_1","volume-title":"Random sampling with a reservoir. ACM Transactions on Mathematical Software (TOMS)","author":"Vitter Jeffrey S","year":"1985","unstructured":"Jeffrey S Vitter. 1985. Random sampling with a reservoir. ACM Transactions on Mathematical Software (TOMS) (1985)."},{"key":"e_1_3_2_1_40_1","volume-title":"Proceedings of the 2018 USENIX Annual Technical Conference (ATC 18)","author":"Wang Liang","year":"2018","unstructured":"Liang Wang, Mengyuan Li, Yinqian Zhang, Thomas Ristenpart, and Michael Swift. 2018. Peeking Behind the Curtains of Serverless Platforms. In Proceedings of the 2018 USENIX Annual Technical Conference (ATC 18)."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/SC41405.2020.00072"},{"key":"e_1_3_2_1_42_1","volume-title":"StepConf: SLO-Aware Dynamic Resource Configuration for Serverless Function Workflows. In IEEE INFOCOM 2022-IEEE Conference on Computer Communications.","author":"Wen Zhaojie","year":"2022","unstructured":"Zhaojie Wen, Yishuo Wang, and Fangming Liu. 2022. StepConf: SLO-Aware Dynamic Resource Configuration for Serverless Function Workflows. In IEEE INFOCOM 2022-IEEE Conference on Computer Communications."},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2020.2970013"},{"key":"e_1_3_2_1_44_1","volume-title":"Proceedings of the 20th USENIX Symposium on Networked Systems Design and Implementation (NSDI 23)","author":"Yu Minchen","year":"2023","unstructured":"Minchen Yu, Tingjia Cao, Wei Wang, and Ruichuan Chen. 2023. Following the Data, Not the Function: Rethinking Function Orchestration in Serverless Computing. In Proceedings of the 20th USENIX Symposium on Networked Systems Design and Implementation (NSDI 23)."},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/3419111.3421280"},{"key":"e_1_3_2_1_46_1","volume-title":"Proceedings of the 2019 USENIX Annual Technical Conference (ATC 19)","author":"Zhang Chengliang","year":"2019","unstructured":"Chengliang Zhang, Minchen Yu, Wei Wang, and Feng Yan. 2019. MArk: Exploiting Cloud Services for Cost-Effective, SLO-Aware Machine Learning Inference Serving. In Proceedings of the 2019 USENIX Annual Technical Conference (ATC 19)."},{"key":"e_1_3_2_1_47_1","volume-title":"Proceedings of the 18th USENIX Symposium on Networked Systems Design and Implementation (NSDI 21)","author":"Zhang Hong","year":"2021","unstructured":"Hong Zhang, Yupeng Tang, Anurag Khandelwal, Jingrong Chen, and Ion Stoica. 2021. Caerus: NIMBLE Task Scheduling for Serverless Analytics. In Proceedings of the 18th USENIX Symposium on Networked Systems Design and Implementation (NSDI 21)."},{"key":"e_1_3_2_1_48_1","volume-title":"Proceedings of the SIGOPS European Conference on Computer Systems (EuroSys 13)","author":"Zhang Xiao","year":"2013","unstructured":"Xiao Zhang, Eric Tune, Robert Hagmann, Rohit Jnagal, Vrigo Gokhale, and John Wilkes. 2013. CPI2: CPU performance isolation for shared compute clusters. In Proceedings of the SIGOPS European Conference on Computer Systems (EuroSys 13)."}],"event":{"name":"SoCC '23: ACM Symposium on Cloud Computing","location":"Santa Cruz CA USA","acronym":"SoCC '23","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGOPS ACM Special Interest Group on Operating Systems"]},"container-title":["Proceedings of the 2023 ACM Symposium on Cloud Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3620678.3624645","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3620678.3624645","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T15:55:43Z","timestamp":1755878143000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3620678.3624645"}},"subtitle":["Performance-Aware, Resource-Efficient Function Scheduling for Serverless Computing"],"short-title":[],"issued":{"date-parts":[[2023,10,30]]},"references-count":48,"alternative-id":["10.1145\/3620678.3624645","10.1145\/3620678"],"URL":"https:\/\/doi.org\/10.1145\/3620678.3624645","relation":{},"subject":[],"published":{"date-parts":[[2023,10,30]]},"assertion":[{"value":"2023-10-31","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}