{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,2]],"date-time":"2025-11-02T15:11:50Z","timestamp":1762096310042,"version":"build-2065373602"},"publisher-location":"New York, NY, USA","reference-count":9,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,11,12]],"date-time":"2023-11-12T00:00:00Z","timestamp":1699747200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,11,12]]},"DOI":"10.1145\/3624062.3624147","type":"proceedings-article","created":{"date-parts":[[2023,11,10]],"date-time":"2023-11-10T13:53:39Z","timestamp":1699624419000},"page":"704-707","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["Centralized provisioning of large language models for a research community"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6506-2243","authenticated-orcid":false,"given":"Dhruvil","family":"Shah","sequence":"first","affiliation":[{"name":"Computational Research Accelerator, Arizona State University, United States of America"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5888-5209","authenticated-orcid":false,"given":"Gil","family":"Speyer","sequence":"additional","affiliation":[{"name":"Computational Research Accelerator, Arizona State University, United States of America"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6866-9833","authenticated-orcid":false,"given":"Jason","family":"Yalim","sequence":"additional","affiliation":[{"name":"Computational Research Accelerator, Arizona State University, United States of America"}]}],"member":"320","published-online":{"date-parts":[[2023,11,12]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2023. Falcon-40B: an open large language model with state-of-the-art performance. Technical Report."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1906.02569"},{"key":"e_1_3_2_1_3_1","unstructured":"ASU. 2023. Sol. https:\/\/github.com\/jackfrost1411\/HUST23-SC23-LLMs https:\/\/github.com\/jackfrost1411\/HUST23-SC23-LLMs."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/3569951.3597573"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-021-03819-2"},{"key":"e_1_3_2_1_6_1","unstructured":"Dakota Mahan Ryan Carlow Louis Castricato Nathan Cooper and Christian Laforte. [n. d.]. Stable Beluga models. https:\/\/huggingface.co\/stabilityai\/StableBeluga2 huggingface.co\/stabilityai\/StableBeluga2."},{"key":"e_1_3_2_1_7_1","unstructured":"Mamba Org. 2023. mamba. https:\/\/github.com\/mamba-org\/mamba https:\/\/github.com\/mamba-org\/mamba."},{"key":"e_1_3_2_1_8_1","unstructured":"MosaicML\u00a0NLP Team. 2023. Introducing MPT-30B: Raising the bar for open-source foundation models. www.mosaicml.com\/blog\/mpt-30b"},{"key":"e_1_3_2_1_9_1","unstructured":"Hugo Touvron Louis Martin Kevin Stone Peter Albert Amjad Almahairi Yasmine Babaei Nikolay Bashlykov Soumya Batra Prajjwal Bhargava Shruti Bhosale Dan Bikel Lukas Blecher Cristian\u00a0Canton Ferrer Moya Chen Guillem Cucurull David Esiobu Jude Fernandes Jeremy Fu Wenyin Fu Brian Fuller Cynthia Gao Vedanuj Goswami Naman Goyal Anthony Hartshorn Saghar Hosseini Rui Hou Hakan Inan Marcin Kardas Viktor Kerkez Madian Khabsa Isabel Kloumann Artem Korenev Punit\u00a0Singh Koura Marie-Anne Lachaux Thibaut Lavril Jenya Lee Diana Liskovich Yinghai Lu Yuning Mao Xavier Martinet Todor Mihaylov Pushkar Mishra Igor Molybog Yixin Nie Andrew Poulton Jeremy Reizenstein Rashi Rungta Kalyan Saladi Alan Schelten Ruan Silva Eric\u00a0Michael Smith Ranjan Subramanian Xiaoqing\u00a0Ellen Tan Binh Tang Ross Taylor Adina Williams Jian\u00a0Xiang Kuan Puxin Xu Zheng Yan Iliyan Zarov Yuchen Zhang Angela Fan Melanie Kambadur Sharan Narang Aurelien Rodriguez Robert Stojnic Sergey Edunov and Thomas Scialom. 2023. Llama 2: Open Foundation and Fine-Tuned Chat Models. (2023). arxiv:2307.09288\u00a0[cs.CL]"}],"event":{"name":"SC-W 2023: Workshops of The International Conference on High Performance Computing, Network, Storage, and Analysis","acronym":"SC-W 2023","location":"Denver CO USA"},"container-title":["Proceedings of the SC '23 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3624062.3624147","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3624062.3624147","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T03:00:22Z","timestamp":1755745222000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3624062.3624147"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,11,12]]},"references-count":9,"alternative-id":["10.1145\/3624062.3624147","10.1145\/3624062"],"URL":"https:\/\/doi.org\/10.1145\/3624062.3624147","relation":{},"subject":[],"published":{"date-parts":[[2023,11,12]]},"assertion":[{"value":"2023-11-12","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}