{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,12]],"date-time":"2026-03-12T08:43:43Z","timestamp":1773305023737,"version":"3.50.1"},"reference-count":54,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2026,1,26]],"date-time":"2026-01-26T00:00:00Z","timestamp":1769385600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T00:00:00Z","timestamp":1773187200000},"content-version":"vor","delay-in-days":44,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"the Joint Innovation Initiative of the Yangtze River Delta Science and Technology Innovation Community","award":["YDZX20223100004022-3"],"award-info":[{"award-number":["YDZX20223100004022-3"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J. King Saud Univ. Comput. Inf. 
Sci."],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1007\/s44443-026-00473-4","type":"journal-article","created":{"date-parts":[[2026,1,26]],"date-time":"2026-01-26T12:24:49Z","timestamp":1769430289000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["LACE: Mitigating cold-starts in serverless with a multi-task mixture-of-experts caching"],"prefix":"10.1007","volume":"38","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6328-0669","authenticated-orcid":false,"given":"Chunpu","family":"Huang","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1773-6623","authenticated-orcid":false,"given":"Yukai","family":"Huang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0002-1739-8249","authenticated-orcid":false,"given":"Jingqi","family":"Feng","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0005-8526-0446","authenticated-orcid":false,"given":"Sicheng","family":"Liang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1176-0238","authenticated-orcid":false,"given":"Ming","family":"Yan","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0404-0707","authenticated-orcid":false,"given":"Jie","family":"Wu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,1,26]]},"reference":[{"key":"473_CR1","unstructured":"Agache A, Brooker M, Iordache A et\u00a0al (2020) Firecracker: lightweight virtualization for serverless applications. In: 17th USENIX symposium on networked systems design and implementation (NSDI 20), pp 419\u2013434"},{"key":"473_CR2","doi-asserted-by":"crossref","unstructured":"Akhtar Z, Li Y, Govindan R et\u00a0al (2019) Avic: a cache for adaptive bitrate video. 
In: Proceedings of the 15th International conference on emerging networking experiments and technologies, pp 305\u2013317","DOI":"10.1145\/3359989.3365423"},{"key":"473_CR3","unstructured":"Amazon Web Services (2025) AWS Lambda Limits. Available at https:\/\/docs.aws.amazon.com\/lambda\/latest\/dg\/gettingstarted-limits.html"},{"key":"473_CR4","unstructured":"Apache (2025) Openwhisk. https:\/\/github.com\/apache\/openwhisk"},{"key":"473_CR5","unstructured":"AWS (2025) Lambda. https:\/\/aws.amazon.com\/cn\/lambda\/"},{"issue":"8","key":"473_CR6","doi-asserted-by":"publisher","first-page":"2337","DOI":"10.1109\/TC.2014.2360518","volume":"64","author":"S Baek","year":"2014","unstructured":"Baek S, Lee HG, Nicopoulos C et al (2014) Size-aware cache management for compressed cache architectures. IEEE Trans Comput 64(8):2337\u20132352","journal-title":"IEEE Trans Comput"},{"key":"473_CR7","doi-asserted-by":"publisher","first-page":"99337","DOI":"10.1109\/ACCESS.2022.3206366","volume":"10","author":"A Barrak","year":"2022","unstructured":"Barrak A, Petrillo F, Jaafar F (2022) Serverless on machine learning: a systematic mapping study. IEEE Access 10:99337\u201399352","journal-title":"IEEE Access"},{"issue":"2","key":"473_CR8","doi-asserted-by":"publisher","first-page":"78","DOI":"10.1147\/sj.52.0078","volume":"5","author":"LA Belady","year":"1966","unstructured":"Belady LA (1966) A study of replacement algorithms for a virtual-storage computer. IBM Syst J 5(2):78\u2013101","journal-title":"IBM Syst J"},{"key":"473_CR9","unstructured":"Blankstein A, Sen S, Freedman MJ (2017) Hyperbolic caching: flexible caching for web applications. In: 2017 USENIX Annual Technical Conference (USENIX ATC 17), pp 499\u2013511"},{"key":"473_CR10","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C (2016) Xgboost: A scalable tree boosting system. 
In: Proceedings of the 22nd acm sigkdd international conference on knowledge discovery and data mining, pp 785\u2013794","DOI":"10.1145\/2939672.2939785"},{"key":"473_CR11","unstructured":"Cherkasova L (1998) Improving WWW proxies performance with greedy-dual-size-frequency caching policy. Hewlett-Packard Laboratories Palo Alto, CA, USA"},{"issue":"2","key":"473_CR12","doi-asserted-by":"publisher","first-page":"180","DOI":"10.1007\/PL00009255","volume":"23","author":"M Chrobak","year":"1999","unstructured":"Chrobak M, Noga J (1999) Lru is better than fifo. Algorithmica 23(2):180\u2013185","journal-title":"Algorithmica"},{"key":"473_CR13","doi-asserted-by":"crossref","unstructured":"Dhakal A, Raith P, Ward L et\u00a0al (2023) Fine-grained accelerator partitioning for machine learning and scientific computing in function as a service platform. In: Proceedings of the SC\u201923 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis, pp 1606\u20131613","DOI":"10.1145\/3624062.3624238"},{"key":"473_CR14","doi-asserted-by":"crossref","unstructured":"Ding J, Minhas UF, Yu J et\u00a0al (2020) Alex: an updatable adaptive learned index. In: Proceedings of the 2020 ACM SIGMOD international conference on management of data, pp 969\u2013984","DOI":"10.1145\/3318464.3389711"},{"key":"473_CR15","doi-asserted-by":"crossref","unstructured":"Du D, Yu T, Xia Y et\u00a0al (2020) Catalyzer: Sub-millisecond startup for serverless computing with initialization-less booting. In: Proceedings of the Twenty-Fifth International conference on architectural support for programming languages and operating systems, pp 467\u2013481","DOI":"10.1145\/3373376.3378512"},{"key":"473_CR16","doi-asserted-by":"crossref","unstructured":"Fuerst A, Sharma P (2021) Faascache: keeping serverless computing alive with greedy-dual caching. 
In: Proceedings of the 26th ACM international conference on architectural support for programming languages and operating systems, pp 386\u2013400","DOI":"10.1145\/3445814.3446757"},{"issue":"4","key":"473_CR17","doi-asserted-by":"publisher","first-page":"1140","DOI":"10.1108\/JEIM-09-2022-0317","volume":"37","author":"B Gammelgaard","year":"2024","unstructured":"Gammelgaard B, Nowicka K (2024) Next generation supply chain management: the impact of cloud computing. J Enterp Inf Manag 37(4):1140\u20131160","journal-title":"J Enterp Inf Manag"},{"key":"473_CR18","unstructured":"Google (2025) Cloud functions. https:\/\/cloud.google.com\/functions"},{"issue":"1","key":"473_CR19","first-page":"3323","volume":"13","author":"CH Ho","year":"2012","unstructured":"Ho CH, Lin CJ (2012) Large-scale linear support vector regression. J Mach Learn Res 13(1):3323\u20133348","journal-title":"J Mach Learn Res"},{"issue":"3","key":"473_CR20","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1007\/s44443-025-00002-9","volume":"37","author":"S Hou","year":"2025","unstructured":"Hou S, Hu Y, Tian L et al (2025) Poly-hqos: a polymorphic packet scheduler for traffic isolation in multi-tenant cloud environment. J King Saud Univ Comput Inf Sci 37(3):21","journal-title":"J King Saud Univ Comput Inf Sci"},{"key":"473_CR21","doi-asserted-by":"crossref","unstructured":"Huang Q, Birman K, Van\u00a0Renesse R et\u00a0al (2013) An analysis of facebook photo caching. In: Proceedings of the Twenty-Fourth ACM Symposium on Operating Systems Principles, pp 167\u2013181","DOI":"10.1145\/2517349.2522722"},{"key":"473_CR22","doi-asserted-by":"crossref","unstructured":"Jia Z, Witchel E (2021) Nightcore: efficient and scalable serverless computing for latency-sensitive, interactive microservices. 
In: Proceedings of the 26th ACM international conference on architectural support for programming languages and operating systems, pp 152\u2013166","DOI":"10.1145\/3445814.3446701"},{"key":"473_CR23","unstructured":"Jonas E, Schleier-Smith J, Sreekanti V et\u00a0al (2019) Cloud programming simplified: A berkeley view on serverless computing. arXiv:1902.03383"},{"issue":"5","key":"473_CR24","doi-asserted-by":"publisher","first-page":"102067","DOI":"10.1016\/j.jksuci.2024.102067","volume":"36","author":"S Karim","year":"2024","unstructured":"Karim S, Qureshi KN, Ibrahim AO et al (2024) Enhanced centroid-based energy-efficient clustering routing protocol for serverless based wireless sensor networks. J King Saud Univ Comput Inf Sci 36(5):102067","journal-title":"J King Saud Univ Comput Inf Sci"},{"key":"473_CR25","unstructured":"Ke G, Meng Q, Finley T et\u00a0al (2017) Lightgbm: A highly efficient gradient boosting decision tree. Adv Neural Inf Process Syst 30"},{"key":"473_CR26","doi-asserted-by":"crossref","unstructured":"Koschel A, Klassen S, Jdiya K et\u00a0al (2021) Cloud computing: serverless. In: 2021 12th International Conference on Information, Intelligence, Systems & Applications (IISA). IEEE, pp 1\u20137","DOI":"10.1109\/IISA52424.2021.9555534"},{"key":"473_CR27","doi-asserted-by":"crossref","unstructured":"Kraska T, Beutel A, Chi EH et\u00a0al (2018) The case for learned index structures. In: Proceedings of the 2018 international conference on management of data, pp 489\u2013504","DOI":"10.1145\/3183713.3196909"},{"key":"473_CR28","doi-asserted-by":"crossref","unstructured":"Kuenzer S, B\u0103doiu VA, Lefeuvre H et\u00a0al (2021) Unikraft: fast, specialized unikernels the easy way. 
In: Proceedings of the Sixteenth European conference on computer systems, pp 376\u2013394","DOI":"10.1145\/3447786.3456248"},{"issue":"12","key":"473_CR29","doi-asserted-by":"publisher","first-page":"1352","DOI":"10.1109\/TC.2001.970573","volume":"50","author":"D Lee","year":"2001","unstructured":"Lee D, Choi J, Kim JH et al (2001) Lrfu: A spectrum of policies that subsumes the least recently used and least frequently used policies. IEEE Trans Comput 50(12):1352\u20131361","journal-title":"IEEE Trans Comput"},{"key":"473_CR30","unstructured":"Matani D, Shah K, Mitra A (2021) An o (1) algorithm for implementing the lfu cache eviction scheme. arXiv:2110.11602"},{"key":"473_CR31","unstructured":"MS (2025) Azure functions. https:\/\/azure.microsoft.com\/en-us\/products\/functions"},{"key":"473_CR32","doi-asserted-by":"crossref","unstructured":"O\u2019neil EJ, O\u2019neil PE, Weikum G (1993) The lru-k page replacement algorithm for database disk buffering. ACM SIGMOD Rec 22(2):297\u2013306","DOI":"10.1145\/170036.170081"},{"issue":"5","key":"473_CR33","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1007\/s44443-025-00092-5","volume":"37","author":"J Pan","year":"2025","unstructured":"Pan J, Wei Y, Meng L et al (2025) A dual scheduling framework for task and resource allocation in clouds using deep reinforcement learning. J King Saud Univ Comput Inf Sci 37(5):81","journal-title":"J King Saud Univ Comput Inf Sci"},{"issue":"3","key":"473_CR34","doi-asserted-by":"publisher","first-page":"2110","DOI":"10.1109\/TNSM.2023.3239672","volume":"20","author":"E Paraskevoulakou","year":"2023","unstructured":"Paraskevoulakou E, Kyriazis D (2023) Ml-faas: Toward exploiting the serverless paradigm to facilitate machine learning functions as a service. 
IEEE Trans Netw Serv Manage 20(3):2110\u20132123","journal-title":"IEEE Trans Netw Serv Manage"},{"key":"473_CR35","doi-asserted-by":"crossref","unstructured":"Pintea SL, Lin Y (2023) A step towards understanding why classification helps regression. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 19972\u201319981","DOI":"10.1109\/ICCV51070.2023.01828"},{"issue":"1","key":"473_CR36","first-page":"2007","volume":"1","author":"G Ridgeway","year":"2007","unstructured":"Ridgeway G (2007) Generalized boosted models: a guide to the gbm package. Update 1(1):2007","journal-title":"Update"},{"key":"473_CR37","first-page":"8583","volume":"34","author":"C Riquelme","year":"2021","unstructured":"Riquelme C, Puigcerver J, Mustafa B et al (2021) Scaling vision with sparse mixture of experts. Adv Neural Inf Process Syst 34:8583\u20138595","journal-title":"Adv Neural Inf Process Syst"},{"key":"473_CR38","doi-asserted-by":"crossref","unstructured":"Ristov S, Hollaus C, Hautz M (2022) Colder than the warm start and warmer than the cold start! experience the spawn start in faas providers. In: Proceedings of the 2022 Workshop on Advanced tools, programming languages, and PLatforms for Implementing and Evaluating algorithms for Distributed systems, pp 35\u201339","DOI":"10.1145\/3524053.3542751"},{"key":"473_CR39","doi-asserted-by":"crossref","unstructured":"Romano S, ElAarag H (2008) A quantitative study of recency and frequency based web cache replacement strategies. In: Proceedings of the 11th communications and networking simulation symposium, pp 70\u201378","DOI":"10.1145\/1400713.1400725"},{"key":"473_CR40","doi-asserted-by":"crossref","unstructured":"Roy RB, Patel T, Tiwari D (2022) Icebreaker: Warming serverless functions better with heterogeneity. 
In: Proceedings of the 27th ACM International conference on architectural support for programming languages and operating systems, pp 753\u2013767","DOI":"10.1145\/3503222.3507750"},{"key":"473_CR41","doi-asserted-by":"crossref","unstructured":"Saxena D, Ji T, Singhvi A (2022) Memory deduplication for serverless computing with medes. In: Proceedings of the Seventeenth European Conference on Computer Systems, pp 714\u2013729","DOI":"10.1145\/3492321.3524272"},{"key":"473_CR42","unstructured":"Shahrad M, Fonseca R, Goiri I et\u00a0al (2020) Serverless in the wild: characterizing and optimizing the serverless workload at a large cloud provider. In: 2020 USENIX annual technical conference (USENIX ATC 20), pp 205\u2013218"},{"key":"473_CR43","doi-asserted-by":"crossref","unstructured":"Sharma P, Chaufournier L, Shenoy P et\u00a0al (2016) Containers and virtual machines at scale: a comparative study. In: Proceedings of the 17th international middleware conference, pp 1\u201313","DOI":"10.1145\/2988336.2988337"},{"key":"473_CR44","unstructured":"Song Z, Berger DS (2020) Learning relaxed belady for content distribution network caching. In: 17th USENIX Symposium on Networked Systems Design and Implementation (NSDI 20), pp 529\u2013544"},{"key":"473_CR45","unstructured":"Vietri G, Rodriguez LV, Martinez WA, et\u00a0al (2018) Driving cache replacement with ML-based LeCaR. In: 10th USENIX Workshop on Hot Topics in Storage and File Systems (HotStorage 18)"},{"key":"473_CR46","doi-asserted-by":"crossref","unstructured":"Wang Y, Zhang W, Wang L et\u00a0al (2022) Multi-source uncertainty mining for deep unsupervised saliency detection. 
In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 11727\u201311736","DOI":"10.1109\/CVPR52688.2022.01143"},{"issue":"3","key":"473_CR47","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3468520","volume":"17","author":"X Wei","year":"2021","unstructured":"Wei X, Chen R, Chen H et al (2021) Xstore: Fast rdma-based ordered key-value store using remote learned cache. ACM Transactions on Storage (TOS) 17(3):1\u201332","journal-title":"ACM Transactions on Storage (TOS)"},{"key":"473_CR48","doi-asserted-by":"crossref","unstructured":"Wilkes MV (1965) Slave memories and dynamic storage allocation. IEEE Trans Electron Comput (2):270\u2013271","DOI":"10.1109\/PGEC.1965.264263"},{"key":"473_CR49","doi-asserted-by":"crossref","unstructured":"Yang Y, Zhao L, Li Y et\u00a0al (2022) Infless: a native serverless system for low-latency, high-throughput inference. In: Proceedings of the 27th ACM International conference on architectural support for programming languages and operating systems, pp 768\u2013781","DOI":"10.1145\/3503222.3507709"},{"key":"473_CR50","doi-asserted-by":"crossref","unstructured":"Young (2002) On-line file caching. Algorithmica 33(3):371\u2013383","DOI":"10.1007\/s00453-001-0124-5"},{"key":"473_CR51","doi-asserted-by":"crossref","unstructured":"Yu H, Basu\u00a0Roy R, Fontenot C et\u00a0al (2024) Rainbowcake: Mitigating cold-starts in serverless with layer-wise container caching and sharing. In: Proceedings of the 29th ACM International conference on architectural support for programming languages and operating systems, Volume 1, pp 335\u2013350","DOI":"10.1145\/3617232.3624871"},{"key":"473_CR52","doi-asserted-by":"crossref","unstructured":"Zhang M, Wang F, Zhu Y et\u00a0al (2021) Towards cloud-edge collaborative online video analytics with fine-grained serverless pipelines. 
In: Proceedings of the 12th ACM multimedia systems conference, pp 80\u201393","DOI":"10.1145\/3458305.3463377"},{"key":"473_CR53","doi-asserted-by":"crossref","unstructured":"Zhong C, Gursoy MC (2018) A deep reinforcement learning-based framework for content caching. In: 2018 52nd Annual Conference on Information Sciences and Systems (CISS). IEEE, pp 1\u20136","DOI":"10.1109\/CISS.2018.8362276"},{"key":"473_CR54","unstructured":"Zhou Y, Philbin J, Li K (2001) The multi-queue replacement algorithm for second level buffer caches. In: USENIX Annual Technical Conference, General Track, pp 91\u2013104"}],"container-title":["Journal of King Saud University Computer and Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s44443-026-00473-4","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s44443-026-00473-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s44443-026-00473-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T14:13:02Z","timestamp":1773238382000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s44443-026-00473-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,26]]},"references-count":54,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2026,4]]}},"alternative-id":["473"],"URL":"https:\/\/doi.org\/10.1007\/s44443-026-00473-4","relation":{},"ISSN":["1319-1578","2213-1248"],"issn-type":[{"value":"1319-1578","type":"print"},{"value":"2213-1248","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,26]]},"assertion":[{"value":"12 October 
2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no relevant financial or non-financial interests to disclose.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interests"}}],"article-number":"93"}}