{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,14]],"date-time":"2026-04-14T00:15:59Z","timestamp":1776125759936,"version":"3.50.1"},"reference-count":32,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"3","license":[{"start":{"date-parts":[[2026,3,1]],"date-time":"2026-03-01T00:00:00Z","timestamp":1772323200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,3,1]],"date-time":"2026-03-01T00:00:00Z","timestamp":1772323200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,3,1]],"date-time":"2026-03-01T00:00:00Z","timestamp":1772323200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Shanghai Key Laboratory of Scalable Computing and Systems, the Eighth Research Institute of China Aerospace Science and Technology Group Company Ltd.","award":["USCAST2023-17"],"award-info":[{"award-number":["USCAST2023-17"]}]},{"name":"Shanghai Key Laboratory of Scalable Computing and Systems, the Eighth Research Institute of China Aerospace Science and Technology Group Company Ltd.","award":["USCAST2023-21"],"award-info":[{"award-number":["USCAST2023-21"]}]},{"name":"Shanghai Municipal Science and Technology Major Project"},{"name":"National Key Laboratory of Ship Structural Safety"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. 
Comput."],"published-print":{"date-parts":[[2026,3]]},"DOI":"10.1109\/tc.2025.3628924","type":"journal-article","created":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T18:39:02Z","timestamp":1762367942000},"page":"776-787","source":"Crossref","is-referenced-by-count":4,"title":["HeShare: Energy-Aware and Efficient Multi-Task GPU Sharing in Heterogeneous GPU-Based Computing Systems"],"prefix":"10.1109","volume":"75","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5078-9228","authenticated-orcid":false,"given":"Zhuolong","family":"Jiang","sequence":"first","affiliation":[{"name":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9373-8474","authenticated-orcid":false,"given":"Zinuo","family":"Cai","sequence":"additional","affiliation":[{"name":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"}]},{"given":"Hongyu","family":"Zhao","sequence":"additional","affiliation":[{"name":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"}]},{"given":"Baoheng","family":"Zhang","sequence":"additional","affiliation":[{"name":"Aerospace System Engineering Shanghai, Shanghai, China"}]},{"given":"Tianqi","family":"Wu","sequence":"additional","affiliation":[{"name":"China Ship Scientific Research Center, Jiangsu, China"}]},{"given":"Yiming","family":"Qiang","sequence":"additional","affiliation":[{"name":"China Ship Scientific Research Center, Jiangsu, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9592-8490","authenticated-orcid":false,"given":"Ruhui","family":"Ma","sequence":"additional","affiliation":[{"name":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, 
China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4714-7400","authenticated-orcid":false,"given":"Haibing","family":"Guan","sequence":"additional","affiliation":[{"name":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9754-6496","authenticated-orcid":false,"given":"Rajkumar","family":"Buyya","sequence":"additional","affiliation":[{"name":"Cloud Computing and Distributed Systems (CLOUDS) Laboratory, School of Computing and Information Systems, The University of Melbourne, Melbourne, VIC, Australia"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2022.3144614"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CCGRID64434.2025.00015"},{"key":"ref3","first-page":"75","article-title":"Power-aware deep learning model serving with \u03bc-Serve","volume-title":"Proc. USENIX Annu. Tech. Conf. (USENIX ATC)","author":"Qiu","year":"2024"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/MASS58611.2023.00074"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3342195.3387555"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3701997"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/tcss.2024.3423749"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.jocs.2020.101153"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2023.3303877"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2020.03.307"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/s11554-021-01181-0"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3431731"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"ref15","article-title":"Very deep convolutional networks for large-scale image 
recognition","author":"Simonyan","year":"2014"},{"key":"ref16","article-title":"MobileNets: Efficient convolutional neural networks for mobile vision applications","author":"Howard","year":"2017"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref18","first-page":"4171","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","volume-title":"Proc. Assoc. Comput. Linguistics: Human Lang. Technol.","author":"Devlin","year":"2019"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref20","article-title":"Language models are unsupervised multitask learners","author":"Radford","year":"2019"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3542929.3563510"},{"key":"ref22","first-page":"1","article-title":"Characterization and prediction of deep learning workloads in large-scale GPU datacenters","volume-title":"Proc. Int. Conf. High Perform. Comput., Netw., Storage Anal.","author":"Hu","year":"2021"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TEVC.2016.2592479"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TR.2017.2738660"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TEVC.2019.2949841"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2023.3327279"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3649329.3655956"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3669940.3707231"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2023.3345401"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/2636342"},{"key":"ref31","article-title":"Gandiva: Introspective Cluster Scheduling for Deep Learning","author":"Xiao","year":"2018"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/infocom.2019.8737460"}],"container-title":["IEEE Transactions on 
Computers"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/12\/11392777\/11230091.pdf?arnumber=11230091","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,14]],"date-time":"2026-02-14T05:43:18Z","timestamp":1771047798000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11230091\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3]]},"references-count":32,"journal-issue":{"issue":"3"},"URL":"https:\/\/doi.org\/10.1109\/tc.2025.3628924","relation":{},"ISSN":["0018-9340","1557-9956","2326-3814"],"issn-type":[{"value":"0018-9340","type":"print"},{"value":"1557-9956","type":"electronic"},{"value":"2326-3814","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,3]]}}}