{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,13]],"date-time":"2026-01-13T23:06:33Z","timestamp":1768345593587,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":83,"publisher":"ACM","funder":[{"name":"IBM-Illinois Discovery Accelerator Institute IIDAI"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,11,19]]},"DOI":"10.1145\/3772052.3772219","type":"proceedings-article","created":{"date-parts":[[2026,1,13]],"date-time":"2026-01-13T16:19:00Z","timestamp":1768321140000},"page":"125-133","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["CPU-Limits kill Performance: Time to rethink Resource Control"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-1308-769X","authenticated-orcid":false,"given":"Chirag C.","family":"Shetty","sequence":"first","affiliation":[{"name":"University of Illinois Urbana-Champaign, Urbana-Champaign, Illinois, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2051-7424","authenticated-orcid":false,"given":"Sarthak","family":"Chakraborty","sequence":"additional","affiliation":[{"name":"University of Illinois Urbana-Champaign, Urbana-Champaign, Illinois, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-0150-1055","authenticated-orcid":false,"given":"Hubertus","family":"Franke","sequence":"additional","affiliation":[{"name":"IBM Research, Yorktown Heights, New York, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5878-0765","authenticated-orcid":false,"given":"Larisa","family":"Shwartz","sequence":"additional","affiliation":[{"name":"IBM Research, Yorktown Heights, New York, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4242-5352","authenticated-orcid":false,"given":"Chandra","family":"Narayanaswami","sequence":"additional","affiliation":[{"name":"IBM Research, Yorktown Heights, New York, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9372-5937","authenticated-orcid":false,"given":"Indranil","family":"Gupta","sequence":"additional","affiliation":[{"name":"University of Illinois Urbana-Champaign, Urbana-Champaign, Illinois, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0926-0776","authenticated-orcid":false,"given":"Saurabh","family":"Jha","sequence":"additional","affiliation":[{"name":"IBM Research, Yorktown Heights, New York, USA"}]}],"member":"320","published-online":{"date-parts":[[2026,1,13]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"https:\/\/kernelnewbies.org\/Linux_3.2\/","author":"Prominent","year":"2012","unstructured":"Prominent features in linux 3.2. https:\/\/kernelnewbies.org\/Linux_3.2\/, 2012."},{"key":"e_1_3_2_1_2_1","volume-title":"https:\/\/stressgrid.com\/blog\/beam_cpu_usage\/","author":"The","year":"2019","unstructured":"The curious case of beam cpu usage. https:\/\/stressgrid.com\/blog\/beam_cpu_usage\/, 2019."},{"key":"e_1_3_2_1_3_1","volume-title":"https:\/\/lwn.net\/Articles\/805317\/","author":"Fixing","year":"2019","unstructured":"Fixing sched_idle. https:\/\/lwn.net\/Articles\/805317\/, 2019."},{"key":"e_1_3_2_1_4_1","volume-title":"https:\/\/www.youtube.com\/watch?v=eBChCFD9hfs&ab_channel=HighLoadChannel","author":"Optimizing","year":"2019","unstructured":"Optimizing kubernetes resource requests\/limits for cost-efficiency and latency. https:\/\/www.youtube.com\/watch?v=eBChCFD9hfs&ab_channel=HighLoadChannel, 2019."},{"key":"e_1_3_2_1_5_1","volume-title":"top-level kubernetes maintainer, google. https:\/\/x.com\/thockin\/status\/1134193838841401345?lang=en","author":"Tim","year":"2019","unstructured":"Tim hockin, top-level kubernetes maintainer, google. https:\/\/x.com\/thockin\/status\/1134193838841401345?lang=en, 2019."},{"key":"e_1_3_2_1_6_1","unstructured":"Artifact of \u201cfirm: An intelligent fine-grained resource management framework for slo-oriented microservices\u201d. https:\/\/gitlab.engr.illinois.edu\/DEPEND\/firm\/-\/blob\/master\/actions.py?ref_type=heads 2020."},{"key":"e_1_3_2_1_7_1","volume-title":"Make your services faster by removing cpu limits, hackernews discussion. https:\/\/news.ycombinator.com\/item?id=24351566","author":"Kubernetes","year":"2020","unstructured":"Kubernetes: Make your services faster by removing cpu limits, hackernews discussion. https:\/\/news.ycombinator.com\/item?id=24351566, 2020."},{"key":"e_1_3_2_1_8_1","volume-title":"Pod quality of service classes. https:\/\/kubernetes.io\/docs\/concepts\/workloads\/pods\/pod-qos\/","author":"Kubernetes","year":"2020","unstructured":"Kubernetes: Pod quality of service classes. https:\/\/kubernetes.io\/docs\/concepts\/workloads\/pods\/pod-qos\/, 2020."},{"key":"e_1_3_2_1_9_1","volume-title":"https:\/\/www.datadoghq.com\/container-report-2021\/","year":"2021","unstructured":"10 trends in real-world container use. https:\/\/www.datadoghq.com\/container-report-2021\/, 2021."},{"key":"e_1_3_2_1_10_1","volume-title":"https:\/\/static.sched.com\/hosted_files\/kccncna2022\/d5\/misadventure_Multitenant.pdf","year":"2022","unstructured":"73,000 pods a day misadventures in multi-tenant. https:\/\/static.sched.com\/hosted_files\/kccncna2022\/d5\/misadventure_Multitenant.pdf, 2022."},{"key":"e_1_3_2_1_11_1","volume-title":"Stop Using CPU Limits on Kubernetes. https:\/\/home.robusta.dev\/blog\/stop-using-cpu-limits","author":"God For","year":"2022","unstructured":"For the Love of God, Stop Using CPU Limits on Kubernetes. https:\/\/home.robusta.dev\/blog\/stop-using-cpu-limits, 2022."},{"key":"e_1_3_2_1_12_1","volume-title":"https:\/\/dnastacio.medium.com\/why-you-should-keep-using-cpu-limits-on-kubernetes-60c4e50dfc61","author":"Should Keep Why You","year":"2022","unstructured":"Why You Should Keep Using CPU Limits on Kubernetes. https:\/\/dnastacio.medium.com\/why-you-should-keep-using-cpu-limits-on-kubernetes-60c4e50dfc61, 2022."},{"key":"e_1_3_2_1_13_1","volume-title":"https:\/\/www.datadoghq.com\/container-report\/","year":"2023","unstructured":"10 insights on real-world container use. https:\/\/www.datadoghq.com\/container-report\/, 2023."},{"key":"e_1_3_2_1_14_1","unstructured":"Artifact of \u201ccilantro: Performance-aware resource allocation for general objectives via online feedback\u201d. https:\/\/github.com\/romilbhardwaj\/cilantro\/blob\/main\/experiments\/microservices\/starters\/hotel-res\/hotel-res-core\/frontend\/frontend-deployment.yaml 2023."},{"key":"e_1_3_2_1_15_1","volume-title":"https:\/\/www.ibm.com\/docs\/en\/spectrum-symphony\/7.3.0?topic=limits-control-groups-cgroups-limiting-resource-usage-linux","author":"Control","year":"2023","unstructured":"Control groups (cgroups) for limiting resource usage on linux. https:\/\/www.ibm.com\/docs\/en\/spectrum-symphony\/7.3.0?topic=limits-control-groups-cgroups-limiting-resource-usage-linux, 2023."},{"key":"e_1_3_2_1_16_1","volume-title":"https:\/\/lwn.net\/Articles\/925371\/","author":"An","year":"2023","unstructured":"An eevdf cpu scheduler for linux. https:\/\/lwn.net\/Articles\/925371\/, 2023."},{"key":"e_1_3_2_1_17_1","volume-title":"https:\/\/www.reddit.com\/r\/googlecloud\/comments\/r2pzpz\/first_experiences_with_gke_autopilot_in\/","author":"First","year":"2023","unstructured":"First experiences with GKE autopilot in production - question about requests\/limits inefficiency. https:\/\/www.reddit.com\/r\/googlecloud\/comments\/r2pzpz\/first_experiences_with_gke_autopilot_in\/, 2023."},{"key":"e_1_3_2_1_18_1","volume-title":"https:\/\/www.ivinco.com\/blog\/how-to-optimize-kubernetes-performance-for-machine-learning-workloads?utm_source=chatgpt.com","author":"How","year":"2023","unstructured":"How to optimize kubernetes performance for machine learning workloads. https:\/\/www.ivinco.com\/blog\/how-to-optimize-kubernetes-performance-for-machine-learning-workloads?utm_source=chatgpt.com, 2023."},{"key":"e_1_3_2_1_19_1","volume-title":"https:\/\/access.redhat.com\/documentation\/en-us\/red_hat_enterprise_linux\/6\/html\/resource_management_guide\/ch01","author":"Introduction","year":"2023","unstructured":"Introduction to control groups. https:\/\/access.redhat.com\/documentation\/en-us\/red_hat_enterprise_linux\/6\/html\/resource_management_guide\/ch01, 2023."},{"key":"e_1_3_2_1_20_1","volume-title":"The silent killer of response time - and what to do about it, ibm. https:\/\/community.ibm.com\/community\/user\/aiops\/blogs\/dina-henderson\/2022\/06\/29\/kubernetes-cpu-throttling-the-silent-killer-of-res","author":"Kubernetes","year":"2023","unstructured":"Kubernetes cpu throttling: The silent killer of response time - and what to do about it, ibm. https:\/\/community.ibm.com\/community\/user\/aiops\/blogs\/dina-henderson\/2022\/06\/29\/kubernetes-cpu-throttling-the-silent-killer-of-res, 2023."},{"key":"e_1_3_2_1_21_1","volume-title":"The silent killer of response time. https:\/\/www.ibm.com\/blog\/kubernetes-cpu-throttling-the-silent-killer-of-response-time\/","author":"Kubernetes CPU","year":"2023","unstructured":"Kubernetes CPU throttling: The silent killer of response time. https:\/\/www.ibm.com\/blog\/kubernetes-cpu-throttling-the-silent-killer-of-response-time\/, 2023."},{"key":"e_1_3_2_1_22_1","volume-title":"minimizing costs: Right-sizing Kubernetes workloads. https:\/\/cloud.google.com\/blog\/products\/containers-kubernetes\/proactive-kubernetes-workload-management","author":"Maximizing","year":"2023","unstructured":"Maximizing reliability, minimizing costs: Right-sizing Kubernetes workloads. https:\/\/cloud.google.com\/blog\/products\/containers-kubernetes\/proactive-kubernetes-workload-management, 2023."},{"key":"e_1_3_2_1_23_1","volume-title":"https:\/\/www.datadoghq.com\/blog\/rightsize-kubernetes-workloads\/","author":"Practical","year":"2023","unstructured":"Practical tips for rightsizing your Kubernetes workloads. https:\/\/www.datadoghq.com\/blog\/rightsize-kubernetes-workloads\/, 2023."},{"key":"e_1_3_2_1_24_1","unstructured":"Artifact of \u201cautothrottle: A practical bi-level approach to resource management for slo-targeted microservices\u201d. https:\/\/github.com\/microsoft\/autothrottle\/blob\/main\/worker-daemon.py 2024."},{"key":"e_1_3_2_1_25_1","volume-title":"https:\/\/www.loft.sh\/blog\/best-practices-for-achieving-isolation-in-kubernetes-multi-tenant-environments","author":"Best","year":"2024","unstructured":"Best practices for achieving isolation in kubernetes multi-tenant environments. https:\/\/www.loft.sh\/blog\/best-practices-for-achieving-isolation-in-kubernetes-multi-tenant-environments, 2024."},{"key":"e_1_3_2_1_26_1","volume-title":"oracle. https:\/\/docs.oracle.com\/en-us\/iaas\/Content\/ContEng\/Tasks\/contengbestpractices_topic-Multi-Tenancy-best-practices.htm","author":"Best","year":"2024","unstructured":"Best practices for multi-tenant environments, oracle. https:\/\/docs.oracle.com\/en-us\/iaas\/Content\/ContEng\/Tasks\/contengbestpractices_topic-Multi-Tenancy-best-practices.htm, 2024."},{"key":"e_1_3_2_1_27_1","volume-title":"https:\/\/github.com\/bitnami\/charts\/blob\/main\/bitnami\/common\/templates\/_resources.tpl","author":"Bitnami","year":"2024","unstructured":"Bitnami resource templates. https:\/\/github.com\/bitnami\/charts\/blob\/main\/bitnami\/common\/templates\/_resources.tpl, 2024."},{"key":"e_1_3_2_1_28_1","unstructured":"Can cpu throttling results in oomkilled states in k8s? https:\/\/stackoverflow.com\/questions\/76153774\/can-cpu- throttling-results-in-oomkilled-states-in-k8s 2024."},{"key":"e_1_3_2_1_29_1","volume-title":"https:\/\/learn.microsoft.com\/en-us\/azure\/developer\/java\/containers\/kubernetes","author":"Containerizing","year":"2024","unstructured":"Containerizing java applications. https:\/\/learn.microsoft.com\/en-us\/azure\/developer\/java\/containers\/kubernetes, 2024."},{"key":"e_1_3_2_1_30_1","volume-title":"https:\/\/stressgrid.com\/blog\/benchmarking_go_vs_node_vs_elixir\/","author":"Elixir","year":"2024","unstructured":"Elixir vs go vs node. https:\/\/stressgrid.com\/blog\/benchmarking_go_vs_node_vs_elixir\/, 2024."},{"key":"e_1_3_2_1_31_1","volume-title":"https:\/\/www.erlang.org\/blog\/otp-23-highlights\/#take-cpu-quotas-into-account","author":"Erlang","year":"2024","unstructured":"Erlang quota awareness. https:\/\/www.erlang.org\/blog\/otp-23-highlights\/#take-cpu-quotas-into-account, 2024."},{"key":"e_1_3_2_1_32_1","volume-title":"https:\/\/platform9.com\/kb\/kubernetes\/how-to-prevent-a-run-away-pod-or-container-from-using-all-resou","author":"How","year":"2024","unstructured":"How to prevent a run away pod or container from using all resources on the node. https:\/\/platform9.com\/kb\/kubernetes\/how-to-prevent-a-run-away-pod-or-container-from-using-all-resou, 2024."},{"key":"e_1_3_2_1_33_1","volume-title":"https:\/\/heiioncall.com\/blog\/kubernetes-liveness-probes-and-cpu-limits-risks-self-reinforcing-crashloopbackoff","author":"Kubernetes","year":"2024","unstructured":"Kubernetes liveness probes and cpu limit risks self-reinforcing crashloopbackoff. https:\/\/heiioncall.com\/blog\/kubernetes-liveness-probes-and-cpu-limits-risks-self-reinforcing-crashloopbackoff, 2024."},{"key":"e_1_3_2_1_34_1","volume-title":"Production-grade container orchestration. https:\/\/kubernetes.io\/","author":"Kubernetes","year":"2024","unstructured":"Kubernetes: Production-grade container orchestration. https:\/\/kubernetes.io\/, 2024."},{"key":"e_1_3_2_1_35_1","volume-title":"https:\/\/kubernetes.io\/docs\/concepts\/scheduling-eviction\/kube-scheduler\/","author":"Kubernetes","year":"2024","unstructured":"Kubernetes scheduler. https:\/\/kubernetes.io\/docs\/concepts\/scheduling-eviction\/kube-scheduler\/, 2024."},{"key":"e_1_3_2_1_36_1","volume-title":"https:\/\/docs.redhat.com\/en\/documentation\/red_hat_enterprise_linux\/6\/html\/resource_management_guide\/sec-cpu","author":"Linux","year":"2024","unstructured":"Linux cpu management. https:\/\/docs.redhat.com\/en\/documentation\/red_hat_enterprise_linux\/6\/html\/resource_management_guide\/sec-cpu, 2024."},{"key":"e_1_3_2_1_37_1","volume-title":"redhat. https:\/\/www.redhat.com\/en\/blog\/managing-compute-resources-openshiftkubernetes","author":"Managing","year":"2024","unstructured":"Managing compute resources with openshift\/kubernetes, redhat. https:\/\/www.redhat.com\/en\/blog\/managing-compute-resources-openshiftkubernetes, 2024."},{"key":"e_1_3_2_1_38_1","volume-title":"google cloud. https:\/\/cloud.google.com\/kubernetes-engine\/docs\/best-practices\/enterprise-multitenancy","year":"2024","unstructured":"Multi-tenancy, google cloud. https:\/\/cloud.google.com\/kubernetes-engine\/docs\/best-practices\/enterprise-multitenancy, 2024."},{"key":"e_1_3_2_1_39_1","volume-title":"kubernetes. https:\/\/kubernetes.io\/docs\/concepts\/security\/multi-tenancy\/","year":"2024","unstructured":"Multi-tenancy, kubernetes. https:\/\/kubernetes.io\/docs\/concepts\/security\/multi-tenancy\/, 2024."},{"key":"e_1_3_2_1_40_1","volume-title":"https:\/\/www.rabbitmq.com\/docs\/runtime#scheduling","author":"Rabbitmq","year":"2024","unstructured":"Rabbitmq runtime schedulers. https:\/\/www.rabbitmq.com\/docs\/runtime#scheduling, 2024."},{"key":"e_1_3_2_1_41_1","volume-title":"Google sre handbook. https:\/\/sre.google\/sre-book\/service-level-objectives\/","author":"Service","year":"2024","unstructured":"Service level objectives: Google sre handbook. https:\/\/sre.google\/sre-book\/service-level-objectives\/, 2024."},{"key":"e_1_3_2_1_42_1","volume-title":"gke. https:\/\/cloud.google.com\/blog\/products\/containers-kubernetes\/tuning-the-kubernetes-hpa-in-gke","author":"The","year":"2024","unstructured":"The surprising economics of horizontal pod autoscaling tuning, gke. https:\/\/cloud.google.com\/blog\/products\/containers-kubernetes\/tuning-the-kubernetes-hpa-in-gke, 2024."},{"key":"e_1_3_2_1_43_1","volume-title":"https:\/\/cloud.google.com\/kubernetes-engine\/docs\/concepts\/cluster-autoscaler","author":"About","year":"2025","unstructured":"About cluster autoscaling. https:\/\/cloud.google.com\/kubernetes-engine\/docs\/concepts\/cluster-autoscaler, 2025."},{"key":"e_1_3_2_1_44_1","volume-title":"https:\/\/www.youtube.com\/watch?v=0W49z8hVn0k","author":"Cluster","year":"2025","unstructured":"Cluster management at google with borg. https:\/\/www.youtube.com\/watch?v=0W49z8hVn0k, 2025."},{"key":"e_1_3_2_1_45_1","volume-title":"https:\/\/kubernetes.io\/docs\/tasks\/administer-cluster\/manage-resources\/quota-memory-cpu-namespace\/","author":"Configure","year":"2025","unstructured":"Configure memory and cpu quotas for a namespace. https:\/\/kubernetes.io\/docs\/tasks\/administer-cluster\/manage-resources\/quota-memory-cpu-namespace\/, 2025."},{"key":"e_1_3_2_1_46_1","volume-title":"https:\/\/kubernetes.io\/docs\/tasks\/administer-cluster\/cpu-management-policies\/","author":"Control","year":"2025","unstructured":"Control cpu management policies on the node. https:\/\/kubernetes.io\/docs\/tasks\/administer-cluster\/cpu-management-policies\/, 2025."},{"key":"e_1_3_2_1_47_1","volume-title":"limit deep dive. https:\/\/www.datadoghq.com\/blog\/kubernetes-cpu-requests-limits\/","author":"Datadog","year":"2025","unstructured":"Datadog cpu request, limit deep dive. https:\/\/www.datadoghq.com\/blog\/kubernetes-cpu-requests-limits\/, 2025."},{"key":"e_1_3_2_1_48_1","volume-title":"https:\/\/elixirforum.com\/t\/performance-issue-when-running-in-kubernetes\/31239\/11","author":"Erlang","year":"2025","unstructured":"Erlang performance issues with limit. https:\/\/elixirforum.com\/t\/performance-issue-when-running-in-kubernetes\/31239\/11, 2025."},{"key":"e_1_3_2_1_49_1","volume-title":"https:\/\/kubernetes.io\/docs\/tasks\/run-application\/horizontal-pod-autoscale\/","author":"Horizontal","year":"2025","unstructured":"Horizontal pod autoscaling. https:\/\/kubernetes.io\/docs\/tasks\/run-application\/horizontal-pod-autoscale\/, 2025."},{"key":"e_1_3_2_1_50_1","volume-title":"https:\/\/www.intel.com\/content\/www\/us\/en\/developer\/articles\/technical\/introduction-to-cache-allocation-technology.html","author":"Introduction","year":"2025","unstructured":"Introduction to cache allocation technology. https:\/\/www.intel.com\/content\/www\/us\/en\/developer\/articles\/technical\/introduction-to-cache-allocation-technology.html, 2025."},{"key":"e_1_3_2_1_51_1","volume-title":"https:\/\/www.intel.com\/content\/www\/us\/en\/developer\/articles\/technical\/introduction-to-memory-bandwidth-allocation.html","author":"Introduction","year":"2025","unstructured":"Introduction to memory bandwidth allocation. https:\/\/www.intel.com\/content\/www\/us\/en\/developer\/articles\/technical\/introduction-to-memory-bandwidth-allocation.html, 2025."},{"key":"e_1_3_2_1_52_1","volume-title":"https:\/\/karpenter.sh\/","year":"2025","unstructured":"Karpenter.sh. https:\/\/karpenter.sh\/, 2025."},{"key":"e_1_3_2_1_53_1","volume-title":"https:\/\/kubernetes.io\/docs\/concepts\/workloads\/pods\/pod-qos\/","author":"Kubernetes","year":"2025","unstructured":"Kubernetes pod quality of service classes. https:\/\/kubernetes.io\/docs\/concepts\/workloads\/pods\/pod-qos\/, 2025."},{"key":"e_1_3_2_1_54_1","volume-title":"https:\/\/kubernetes.io\/docs\/concepts\/scheduling-eviction\/kube-scheduler\/","author":"Kubernetes","year":"2025","unstructured":"Kubernetes scheduler. https:\/\/kubernetes.io\/docs\/concepts\/scheduling-eviction\/kube-scheduler\/, 2025."},{"key":"e_1_3_2_1_55_1","volume-title":"https:\/\/www.spectrocloud.com\/blog\/managing-the-noisy-neighbor-problem-in-kubernetes-multi-tenancy?utm_source=chatgpt.com","author":"Managing","year":"2025","unstructured":"Managing the noisy neighbor problem in kubernetes. https:\/\/www.spectrocloud.com\/blog\/managing-the-noisy-neighbor-problem-in-kubernetes-multi-tenancy?utm_source=chatgpt.com, 2025."},{"key":"e_1_3_2_1_56_1","volume-title":"https:\/\/docs.oracle.com\/en-us\/iaas\/Content\/ContEng\/Tasks\/contengbestpractices_topic-Multi-Tenancy-best-practices.htm","year":"2025","unstructured":"Multi-tenancy best practices. https:\/\/docs.oracle.com\/en-us\/iaas\/Content\/ContEng\/Tasks\/contengbestpractices_topic-Multi-Tenancy-best-practices.htm, 2025."},{"key":"e_1_3_2_1_57_1","volume-title":"https:\/\/kubernetes.io\/docs\/tasks\/administer-cluster\/reserve-compute-resources\/","author":"Reserve","year":"2025","unstructured":"Reserve compute resources for system daemons. https:\/\/kubernetes.io\/docs\/tasks\/administer-cluster\/reserve-compute-resources\/, 2025."},{"key":"e_1_3_2_1_58_1","volume-title":"https:\/\/kubernetes.io\/docs\/concepts\/configuration\/manage-resources-containers\/","author":"Resource","year":"2025","unstructured":"Resource management for pods and containers. https:\/\/kubernetes.io\/docs\/concepts\/configuration\/manage-resources-containers\/, 2025."},{"key":"e_1_3_2_1_59_1","volume-title":"https:\/\/github.com\/kubernetes\/autoscaler\/tree\/master\/vertical-pod-autoscaler","author":"Vertical","year":"2025","unstructured":"Vertical pod autoscaling. https:\/\/github.com\/kubernetes\/autoscaler\/tree\/master\/vertical-pod-autoscaler, 2025."},{"key":"e_1_3_2_1_60_1","unstructured":"Why are you setting cpu limits ? https:\/\/www.reddit.com\/r\/kubernetes\/comments\/utvr4e\/why_are_you_setting_cpu_limits\/ 2025."},{"key":"e_1_3_2_1_61_1","volume-title":"Lessons learned migrating an existing product to a multi tenant cloud native environment - natalia angulo & carlos sanchez, adobe, kubecon north america","author":"Angulo Natalia","year":"2023","unstructured":"Natalia Angulo and Carlos Sanchez. Lessons learned migrating an existing product to a multi tenant cloud native environment - natalia angulo & carlos sanchez, adobe, kubecon north america 2023. https:\/\/youtu.be\/RmZh67vSjNY?si=koTvH6aWLbQszYfU&t=1361, 2023."},{"key":"e_1_3_2_1_62_1","first-page":"417","volume-title":"15th USENIX Symposium on Networked Systems Design and Implementation (NSDI 18)","author":"Ardelean Dan","year":"2018","unstructured":"Dan Ardelean, Amer Diwan, and Chandra Erdman. Performance analysis of cloud applications. In 15th USENIX Symposium on Networked Systems Design and Implementation (NSDI 18), pages 405\u2013417, Renton, WA, April 2018. USENIX Association."},{"key":"e_1_3_2_1_63_1","first-page":"441","volume-title":"Fatahi Baarzi and George Kesidis. SHOWAR: Right-Sizing And Efficient Scheduling of Microservices. In Proceedings of the ACM Symposium on Cloud Computing, SoCC '21","author":"Ataollah","year":"2021","unstructured":"Ataollah Fatahi Baarzi and George Kesidis. SHOWAR: Right-Sizing And Efficient Scheduling of Microservices. In Proceedings of the ACM Symposium on Cloud Computing, SoCC '21, page 427\u2013441, New York, NY, USA, 2021. Association for Computing Machinery."},{"key":"e_1_3_2_1_64_1","first-page":"643","volume-title":"17th USENIX Symposium on Operating Systems Design and Implementation (OSDI 23)","author":"Bhardwaj Romil","year":"2023","unstructured":"Romil Bhardwaj, Kirthevasan Kandasamy, Asim Biswal, Wenshuo Guo, Benjamin Hindman, Joseph Gonzalez, Michael Jordan, and Ion Stoica. Cilantro: Performance-Aware resource allocation for general objectives via online feedback. In 17th USENIX Symposium on Operating Systems Design and Implementation (OSDI 23), pages 623\u2013643, Boston, MA, July 2023. USENIX Association."},{"key":"e_1_3_2_1_65_1","first-page":"204","volume-title":"22nd USENIX Symposium on Networked Systems Design and Implementation (NSDI 25)","author":"Cao Tingjia","year":"2025","unstructured":"Tingjia Cao, Andrea C. Arpaci-Dusseau, Remzi H. Arpaci-Dusseau, and Tyler Caraza-Harter. Making serverless Pay-For-Use a reality with leopard. In 22nd USENIX Symposium on Networked Systems Design and Implementation (NSDI 25), pages 189\u2013204, Philadelphia, PA, April 2025. USENIX Association."},{"key":"e_1_3_2_1_66_1","first-page":"134","volume-title":"2017 IEEE International Symposium on Workload Characterization (IISWC)","author":"Chen Shuang","unstructured":"Shuang Chen, Shay GalOn, Christina Delimitrou, Srilatha Manne, and Jose F Martinez. Workload characterization of interactive cloud services on big and small server platforms. In 2017 IEEE International Symposium on Workload Characterization (IISWC), pages 125\u2013134. IEEE, 2017."},{"key":"e_1_3_2_1_67_1","first-page":"297","volume-title":"14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20)","author":"Fried Joshua","year":"2020","unstructured":"Joshua Fried, Zhenyuan Ruan, Amy Ousterhout, and Adam Belay. Caladan: Mitigating interference at microsecond timescales. In 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20), pages 281\u2013297, 2020."},{"key":"e_1_3_2_1_68_1","doi-asserted-by":"publisher","DOI":"10.1145\/3297858.3304013"},{"key":"e_1_3_2_1_69_1","first-page":"252","volume-title":"Kishwar Ahmed. Practical Efficient Microservice Autoscaling with QoS Assurance. In Proceedings of the 31st Inter-national Symposium on High-Performance Parallel and Distributed Computing, HPDC '22","author":"Hossen Md Rajib","year":"2022","unstructured":"Md Rajib Hossen, Mohammad A. Islam, and Kishwar Ahmed. Practical Efficient Microservice Autoscaling with QoS Assurance. In Proceedings of the 31st Inter-national Symposium on High-Performance Parallel and Distributed Computing, HPDC '22, page 240\u2013252, New York, NY, USA, 2022. Association for Computing Machinery."},{"key":"e_1_3_2_1_70_1","volume-title":"Proceedings of the 14th USENIX Conference on Operating Systems Design and Implementation, OSDI'20, USA","author":"Li Shaohong","year":"2020","unstructured":"Shaohong Li, Xi Wang, Xiao Zhang, Vasileios Kontorinis, Sreekumar Kodakara, David Lo, and Parthasarathy Ranganathan. Thunderbolt: throughput-optimized, quality-of-service-aware power capping at scale. In Proceedings of the 14th USENIX Conference on Operating Systems Design and Implementation, OSDI'20, USA, 2020. USENIX Association."},{"key":"e_1_3_2_1_71_1","first-page":"462","volume-title":"Proceedings of the 42nd Annual International Symposium on Computer Architecture, ISCA '15","author":"Lo David","year":"2015","unstructured":"David Lo, Liqun Cheng, Rama Govindaraju, Parthasarathy Ranganathan, and Christos Kozyrakis. Heracles: improving resource efficiency at scale. In Proceedings of the 42nd Annual International Symposium on Computer Architecture, ISCA '15, page 450\u2013462, New York, NY, USA, 2015. Association for Computing Machinery."},{"key":"e_1_3_2_1_72_1","first-page":"825","volume-title":"14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20)","author":"Qiu Haoran","unstructured":"Haoran Qiu, Subho S. Banerjee, Saurabh Jha, Zbigniew T. Kalbarczyk, and Ravishankar K. Iyer. FIRM: An intelligent fine-grained resource management framework for SLO-Oriented microservices. In 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20), pages 805\u2013825. USENIX Association, November 2020."},{"key":"e_1_3_2_1_73_1","first-page":"181","volume-title":"Proceedings of the 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems","volume":"1","author":"Reidys Benjamin","year":"2025","unstructured":"Benjamin Reidys, Pantea Zardoshti, \u00cd\u00f1igo Goiri, Celine Irvene, Daniel S. Berger, Haoran Ma, Kapil Arya, Eli Cortez, Taylor Stark, Eugene Bak, Mehmet Iyigun, Stanko Novakovic, Lisa Hsu, Karel Trueba, Abhisek Pan, Chetan Bansal, Saravan Rajmohan, Jian Huang, and Ricardo Bianchini. Coach: Exploiting temporal patterns for all-resource oversubscription in cloud platforms. In Proceedings of the 30th ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 1, ASPLOS '25, page 164\u2013181, New York, NY, USA, 2025. Association for Computing Machinery."},{"key":"e_1_3_2_1_74_1","first-page":"16","volume-title":"Proceedings of the Fifteenth European Conference on Computer Systems","author":"Rzadca Krzysztof","year":"2020","unstructured":"Krzysztof Rzadca, Pawel Findeisen, Jacek Swiderski, Przemyslaw Zych, Przemys-law Broniek, Jarek Kusmierek, Pawel Nowak, Beata Strack, Piotr Witusowski, Steven Hand, et al. Autopilot: workload autoscaling at google. In Proceedings of the Fifteenth European Conference on Computer Systems, pages 1\u201316, 2020."},{"key":"e_1_3_2_1_75_1","first-page":"923","volume-title":"Proceedings of the Nineteenth European Conference on Computer Systems, EuroSys '24","author":"Sachidananda Vighnesh","year":"2024","unstructured":"Vighnesh Sachidananda and Anirudh Sivaraman. Erlang: Application-aware autoscaling for cloud microservices. In Proceedings of the Nineteenth European Conference on Computer Systems, EuroSys '24, page 888\u2013923, New York, NY, USA, 2024. Association for Computing Machinery."},{"key":"e_1_3_2_1_76_1","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589069"},{"key":"e_1_3_2_1_77_1","first-page":"803","volume-title":"14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20)","author":"Tang Chunqiang","year":"2020","unstructured":"Chunqiang Tang, Kenny Yu, Kaushik Veeraraghavan, Jonathan Kaldor, Scott Michelson, Thawan Kooburat, Aravind Anbudurai, Matthew Clark, Kabir Gogia, Long Cheng, et al. Twine: A unified cluster management system for shared infrastructure. In 14th USENIX Symposium on Operating Systems Design and Implementation (OSDI 20), pages 787\u2013803, 2020."},{"key":"e_1_3_2_1_78_1","first-page":"254","volume-title":"Proceedings of the Linux Symposium","author":"Turner Paul","year":"2010","unstructured":"Paul Turner, Bharata B Rao, and Nikhil Rao. Cpu bandwidth control for cfs. In Proceedings of the Linux Symposium, pages 245\u2013254, 2010."},{"key":"e_1_3_2_1_79_1","first-page":"254","volume-title":"Linux Symposium","volume":"10","author":"Turner Paul","unstructured":"Paul Turner, Bharata B Rao, and Nikhil Rao. CPU bandwidth control for CFS. In Linux Symposium, volume 10, pages 245\u2013254. Citeseer, 2010."},{"key":"e_1_3_2_1_80_1","doi-asserted-by":"publisher","DOI":"10.1145\/2741948.2741964"},{"key":"e_1_3_2_1_81_1","volume-title":"NSDI (USENIX Symposium on Networked Systems Design and Implementation). USENIX","author":"Wang Zibo","year":"2024","unstructured":"Zibo Wang, Pinghe Li, Chieh-Jan Mike Liang, Feng Wu, and Francis Y. Yan. Autothrottle: A Practical Bi-Level Approach to Resource Management for SLOTargeted Microservices. In NSDI (USENIX Symposium on Networked Systems Design and Implementation). USENIX, April 2024."},{"key":"e_1_3_2_1_82_1","volume-title":"Analytically-Driven Resource Management for Cloud-Native Microservices. arXiv preprint arXiv.2401.02920","author":"Zhang Yanqi","year":"2024","unstructured":"Yanqi Zhang, Zhuangzhuang Zhou, Sameh Elnikety, and Christina Delimitrou. Analytically-Driven Resource Management for Cloud-Native Microservices. arXiv preprint arXiv.2401.02920, 2024."},{"key":"e_1_3_2_1_83_1","first-page":"64","volume-title":"Proceedings of the 2023 ACM Symposium on Cloud Computing, SoCC '23","author":"Zhang Yuqiu","year":"2023","unstructured":"Yuqiu Zhang, Tongkun Zhang, Gengrui Zhang, and Hans-Arno Jacobsen. Lifting the fog of uncertainties: Dynamic resource orchestration for the containerized cloud. In Proceedings of the 2023 ACM Symposium on Cloud Computing, SoCC '23, page 48\u201364, New York, NY, USA, 2023. Association for Computing Machinery."}],"event":{"name":"SoCC '25: ACM Symposium on Cloud Computing","location":"Online USA","acronym":"SoCC '25","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems","SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Proceedings of the 2025 ACM Symposium on Cloud Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3772052.3772219","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,13]],"date-time":"2026-01-13T16:23:04Z","timestamp":1768321384000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3772052.3772219"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,19]]},"references-count":83,"alternative-id":["10.1145\/3772052.3772219","10.1145\/3772052"],"URL":"https:\/\/doi.org\/10.1145\/3772052.3772219","relation":{},"subject":[],"published":{"date-parts":[[2025,11,19]]},"assertion":[{"value":"2026-01-13","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}