{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T12:02:40Z","timestamp":1771329760556,"version":"3.50.1"},"reference-count":23,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,6,19]],"date-time":"2024-06-19T00:00:00Z","timestamp":1718755200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,6,19]],"date-time":"2024-06-19T00:00:00Z","timestamp":1718755200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,6,19]]},"DOI":"10.1109\/iwqos61813.2024.10682885","type":"proceedings-article","created":{"date-parts":[[2024,9,26]],"date-time":"2024-09-26T17:41:00Z","timestamp":1727372460000},"page":"1-6","source":"Crossref","is-referenced-by-count":4,"title":["Scheduling Generative-AI Job DAGs with Model Serving in Data Centers"],"prefix":"10.1109","author":[{"given":"Ying","family":"Zheng","sequence":"first","affiliation":[{"name":"Fudan University,China"}]},{"given":"Lei","family":"Jiao","sequence":"additional","affiliation":[{"name":"University of Oregon,USA"}]},{"given":"Yuedong","family":"Xu","sequence":"additional","affiliation":[{"name":"Fudan University,China"}]},{"given":"Bo","family":"An","sequence":"additional","affiliation":[{"name":"Nanyang Technological University,Singapore"}]},{"given":"Xin","family":"Wang","sequence":"additional","affiliation":[{"name":"Fudan University,China"}]},{"given":"Zongpeng","family":"Li","sequence":"additional","affiliation":[{"name":"Tsinghua University,China"}]}],"member":"263","reference":[{"key":"ref1","article-title":"GPT-4 Technical Report"},{"key":"ref2","article-title":"LLAMA 2: Open Foundation and Fine-Tuned Chat Models","author":"Touvron","year":"2023"},{"key":"ref3","article-title":"Discovering the Hidden Vocabulary of DALLE-2","author":"Daras","year":"2022"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00453"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2023.3288409"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10095046"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00984"},{"key":"ref9","volume-title":"NVIDIA Triton Inference Server"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM54140.2023.10436771"},{"issue":"99","key":"ref12","first-page":"1","article-title":"Exploring Collaborative Distributed Diffusion-based AI-Generated Content (AIGC) in Wireless Networks","author":"Du","year":"2023","journal-title":"IEEE Network"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/tii.2019.2959070"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/s10586-020-03151-w"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/tpds.2013.57"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.simpat.2021.102328"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2017.05.033"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2017.2735400"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611974331.ch14"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2022.3177046"},{"key":"ref21","article-title":"HuggingGPT: Solving AI Tasks with ChatGPT and its Friends in Hugging Face","author":"Shen","year":"2023"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2016.2609844"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/71.993206"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-09457-1_7"}],"event":{"name":"2024 IEEE\/ACM 32nd International Symposium on Quality of Service (IWQoS)","location":"Guangzhou, China","start":{"date-parts":[[2024,6,19]]},"end":{"date-parts":[[2024,6,21]]}},"container-title":["2024 IEEE\/ACM 32nd International Symposium on Quality of Service (IWQoS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10682818\/10682608\/10682885.pdf?arnumber=10682885","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,15]],"date-time":"2025-01-15T19:23:33Z","timestamp":1736969013000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10682885\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,19]]},"references-count":23,"URL":"https:\/\/doi.org\/10.1109\/iwqos61813.2024.10682885","relation":{},"subject":[],"published":{"date-parts":[[2024,6,19]]}}}