{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,5]],"date-time":"2026-03-05T15:47:27Z","timestamp":1772725647428,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":43,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,30]],"date-time":"2023-10-30T00:00:00Z","timestamp":1698624000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,30]]},"DOI":"10.1145\/3620678.3624660","type":"proceedings-article","created":{"date-parts":[[2023,10,31]],"date-time":"2023-10-31T13:58:07Z","timestamp":1698760687000},"page":"265-280","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Maximizing the Utilization of GPUs Used by Cloud Gaming through Adaptive Co-location with Combo"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2391-066X","authenticated-orcid":false,"given":"Binghao","family":"Chen","sequence":"first","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1561-5329","authenticated-orcid":false,"given":"Han","family":"Zhao","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6646-5260","authenticated-orcid":false,"given":"Weihao","family":"Cui","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-8257-1230","authenticated-orcid":false,"given":"Yifu","family":"He","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0802-7203","authenticated-orcid":false,"given":"Shulai","family":"Zhang","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5832-0347","authenticated-orcid":false,"given":"Quan","family":"Chen","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4706-8451","authenticated-orcid":false,"given":"Zijun","family":"Li","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0034-2302","authenticated-orcid":false,"given":"Minyi","family":"Guo","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]}],"member":"320","published-online":{"date-parts":[[2023,10,31]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2023. Amazon AppStream 2.0. https:\/\/aws.amazon.com\/appstream2\/. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_2_1","unstructured":"2023. The Ascent. https:\/\/curvegames.com\/our-games\/the-ascent\/. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_3_1","unstructured":"2023. Deliver Us to The Moon. https:\/\/www.deliverusthemoon.com\/. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_4_1","unstructured":"2023. DirectX. https:\/\/learn.microsoft.com\/en-us\/windows\/win32\/directx-sdk--august-2009-. Accessed: 2023-06-10."},{"key":"e_1_3_2_1_5_1","unstructured":"2023. GeForce RTX 3090 Family. https:\/\/www.nvidia.com\/en-us\/geforce\/graphics-cards\/30-series\/rtx-3090-3090ti\/. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_6_1","unstructured":"2023. Microsoft's Xbox Remote Play. https:\/\/www.xbox.com\/en-US\/consoles\/remote-play. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_7_1","unstructured":"2023. NIVIDIA Multi-Process Service. https:\/\/docs.nvidia.com\/deploy\/mps\/index.html. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_8_1","unstructured":"2023. NVIDIA CUDA Compiler Driver NVCC. https:\/\/docs.nvidia.com\/cuda\/cuda-compiler-driver-nvcc\/index.html. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_9_1","unstructured":"2023. Nvidia Geforce Now. https:\/\/www.nvidia.com\/en-us\/geforce-now\/. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_10_1","unstructured":"2023. NVIDIA OptiX Ray Tracing Engine. https:\/\/developer.nvidia.com\/rtx\/ray-tracing\/optix. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_11_1","unstructured":"2023. NVRTC. https:\/\/docs.nvidia.com\/cuda\/nvrtc\/index.html. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_12_1","unstructured":"2023. Quake 2 RTX. https:\/\/www.nvidia.com\/en-us\/geforce\/campaigns\/quake-II-rtx\/. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_13_1","unstructured":"2023. RTX Technology. https:\/\/developer.nvidia.com\/rtx\/ray-tracing. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_14_1","unstructured":"2023. Served Steel. https:\/\/digerati.games\/game\/severed-steel\/. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_15_1","unstructured":"2023. tensor core example code. https:\/\/github.com\/NVIDIA\/cuda-samples\/tree\/master\/Samples\/3_CUDA_Features\/cudaTensorCoreGemm. Accessed: 2023-06-08."},{"key":"e_1_3_2_1_16_1","unstructured":"2023. Vulkan. https:\/\/www.vulkan.org\/. Accessed: 2023-06-10."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/2954679.2872368"},{"key":"e_1_3_2_1_18_1","volume-title":"2022 USENIX Annual Technical Conference (USENIX ATC 22)","author":"Choi Seungbeom","year":"2022","unstructured":"Seungbeom Choi, Sunho Lee, Yeonjae Kim, Jongse Park, Youngjin Kwon, and Jaehyuk Huh. 2022. Serving Heterogeneous Machine Learning Models on {Multi-GPU} Servers with {Spatio-Temporal} Sharing. In 2022 USENIX Annual Technical Conference (USENIX ATC 22). 199--216."},{"key":"e_1_3_2_1_19_1","volume-title":"KRISP: Enabling Kernel-wise RIght-sizing for Spatial Partitioned GPU Inference Servers. In 2023 IEEE International Symposium on High-Performance Computer Architecture (HPCA). IEEE, 624--637","author":"Chow Marcus","year":"2023","unstructured":"Marcus Chow, Ali Jahanshahi, and Daniel Wong. 2023. KRISP: Enabling Kernel-wise RIght-sizing for Spatial Partitioned GPU Inference Servers. In 2023 IEEE International Symposium on High-Performance Computer Architecture (HPCA). IEEE, 624--637."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476143"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3419111.3421284"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3453953.3453972"},{"key":"e_1_3_2_1_23_1","volume-title":"A study of persistent threads style GPU programming for GPGPU workloads","author":"Gupta Kshitij","unstructured":"Kshitij Gupta, Jeff A Stuart, and John D Owens. 2012. A study of persistent threads style GPU programming for GPGPU workloads. IEEE."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/RTAS.2019.00011"},{"key":"e_1_3_2_1_25_1","volume-title":"Proc. USENIX ATC. 17--30","author":"Kato Shinpei","year":"2011","unstructured":"Shinpei Kato, Karthik Lakshmanan, Raj Rajkumar, Yutaka Ishikawa, et al. 2011. TimeGraph: GPU scheduling for real-time multi-tasking environments. In Proc. USENIX ATC. 17--30."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2014.6835937"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2020.3024068"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3037697.3037707"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/2632216"},{"key":"e_1_3_2_1_30_1","first-page":"27","article-title":"Parboil: A revised benchmark suite for scientific and commercial throughput computing","volume":"127","author":"Stratton John A","year":"2012","unstructured":"John A Stratton, Christopher Rodrigues, I-Jui Sung, Nady Obeid, Li-Wen Chang, Nasser Anssari, Geng Daniel Liu, and Wen-mei W Hwu. 2012. Parboil: A revised benchmark suite for scientific and commercial throughput computing. Center for Reliable and High-Performance Computing 127 (2012), 27.","journal-title":"Center for Reliable and High-Performance Computing"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3079856.3080203"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/2751205.2751213"},{"key":"e_1_3_2_1_33_1","unstructured":"Wencong Xiao Shiru Ren Yong Li Yang Zhang Pengyang Hou Zhi Li Yihui Feng Wei Lin and Yangqing Jia. 2020. AntMan: Dynamic Scaling on GPU Clusters for Deep Learning.. In OSDI. 533--548."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/3007787.3001161"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCAD51958.2021.9643501"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2013.288"},{"key":"e_1_3_2_1_37_1","volume-title":"2022 USENIX Annual Technical Conference (USENIX ATC 22)","author":"Zhang Wei","year":"2022","unstructured":"Wei Zhang, Binghao Chen, Zhenhua Han, Quan Chen, Peng Cheng, Fan Yang, Ran Shu, Yuqing Yang, and Minyi Guo. 2022. {PilotFish}: Harvesting Free Cycles of Cloud Gaming with Deep Learning Training. In 2022 USENIX Annual Technical Conference (USENIX ATC 22). 217--232."},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/3330345.3330351"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA53966.2022.00064"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCD53106.2021.00054"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2019.00074"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3373376.3378457"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3503221.3508409"}],"event":{"name":"SoCC '23: ACM Symposium on Cloud Computing","location":"Santa Cruz CA USA","acronym":"SoCC '23","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGOPS ACM Special Interest Group on Operating Systems"]},"container-title":["Proceedings of the 2023 ACM Symposium on Cloud Computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3620678.3624660","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3620678.3624660","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T15:56:20Z","timestamp":1755878180000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3620678.3624660"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,30]]},"references-count":43,"alternative-id":["10.1145\/3620678.3624660","10.1145\/3620678"],"URL":"https:\/\/doi.org\/10.1145\/3620678.3624660","relation":{},"subject":[],"published":{"date-parts":[[2023,10,30]]},"assertion":[{"value":"2023-10-31","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}