{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T22:20:48Z","timestamp":1766269248254,"version":"3.40.3"},"reference-count":26,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,9,23]],"date-time":"2024-09-23T00:00:00Z","timestamp":1727049600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,9,23]],"date-time":"2024-09-23T00:00:00Z","timestamp":1727049600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,9,23]]},"DOI":"10.1109\/hpec62836.2024.10938521","type":"proceedings-article","created":{"date-parts":[[2025,4,3]],"date-time":"2025-04-03T19:07:19Z","timestamp":1743707239000},"page":"1-7","source":"Crossref","is-referenced-by-count":1,"title":["GPU Sharing with Triples Mode"],"prefix":"10.1109","author":[{"given":"Chansup","family":"Byun","sequence":"first","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Albert","family":"Reuther","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"LaToya","family":"Anderson","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"William","family":"Arcand","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Bill","family":"Bergeron","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"David","family":"Bestor","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Alexander","family":"Bonn","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Daniel","family":"Burrill","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Vijay","family":"Gadepally","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Michael","family":"Houle","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Matthew","family":"Hubbell","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Hayden","family":"Jananthan","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Michael","family":"Jones","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Piotr","family":"Luszczek","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Peter","family":"Michaleas","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Lauren","family":"Milechin","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Guillermo","family":"Morales","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Julie","family":"Mullen","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Andrew","family":"Prout","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Antonio","family":"Rosa","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Charles","family":"Yee","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Jeremy","family":"Kepner","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]}],"member":"263","reference":[{"volume-title":"OpenAI ChatGPT","key":"ref1"},{"volume-title":"Nvidia multi-process service (MPS)","key":"ref2"},{"volume-title":"Consistency and security: AMDs approach to gpu virtual-ization","author":"Knuth","key":"ref3"},{"volume-title":"Nvidia multi-instance GPU","key":"ref4"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/1996130.1996160"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ipdpsw.2016.94"},{"key":"ref7","first-page":"98","article-title":"Salus: Fine-grained GPU sharing primitives for deep learning applications","volume-title":"Proceedings of Machine Learning and Systems (MLSys 2020)","volume":"2","author":"Yu","year":"2020"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/2907294.2907298"},{"volume-title":"GPU sharing on Amazon EKS with NVIDIA time-slicing and accel-erated EC2 instances","key":"ref9"},{"volume-title":"About GPUs in Google Kubernetes Engine (GKE)","key":"ref10"},{"volume-title":"GPU sharing on your Azure Stack Edge Pro GPU device","key":"ref11"},{"volume-title":"Generic resource (GRES) scheduling","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/hpec49654.2021.9622870"},{"key":"ref14","article-title":"Optimizing diverse workloads and system resource usage with slurm","volume-title":"Slurm User Group Meeting","author":"Byun","year":"2023"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/hpec.2016.7761618"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1177\/1094342007078446"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1137\/1.9780898718126"},{"key":"ref18","article-title":"LLGrid: Enabling on-demand grid computing with gridMatlab and pMatlab","volume-title":"2004 IEEE High Performance Extreme Computing Conference (HPEC)","author":"Reuther","year":"2004"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/hpec55821.2022.9926365"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/hpec58863.2023.10363604"},{"key":"ref21","doi-asserted-by":"crossref","DOI":"10.1145\/3626203.3670565","article-title":"Llload: Simplifying real-time job monitoring for HPC users","volume-title":"Practice and Experience in Advanced Research Computing, ser. PEARC \u201924","author":"Byun","year":"2024"},{"volume-title":"The MNIST database of handwritten digits","author":"LeCun","key":"ref22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2009.5206848"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3620665.3640366"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2016.90"}],"event":{"name":"2024 IEEE High Performance Extreme Computing Conference (HPEC)","start":{"date-parts":[[2024,9,23]]},"location":"Wakefield, MA, USA","end":{"date-parts":[[2024,9,27]]}},"container-title":["2024 IEEE High Performance Extreme Computing Conference (HPEC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10938401\/10938415\/10938521.pdf?arnumber=10938521","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,4]],"date-time":"2025-04-04T11:35:19Z","timestamp":1743766519000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10938521\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9,23]]},"references-count":26,"URL":"https:\/\/doi.org\/10.1109\/hpec62836.2024.10938521","relation":{},"subject":[],"published":{"date-parts":[[2024,9,23]]}}}