{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,11]],"date-time":"2026-04-11T13:09:19Z","timestamp":1775912959496,"version":"3.50.1"},"reference-count":58,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"3","license":[{"start":{"date-parts":[[2025,5,1]],"date-time":"2025-05-01T00:00:00Z","timestamp":1746057600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,5,1]],"date-time":"2025-05-01T00:00:00Z","timestamp":1746057600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,5,1]],"date-time":"2025-05-01T00:00:00Z","timestamp":1746057600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62272050"],"award-info":[{"award-number":["62272050"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62302048"],"award-info":[{"award-number":["62302048"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Guangdong Key Lab of AI and Multi-modal Data Processing"},{"name":"Beijing Normal-Hong Kong Baptist University, Zhuhai"},{"DOI":"10.13039\/501100010226","name":"Department of Education of Guangdong Province","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100010226","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Institute of Artificial Intelligence and Future Networks and Engineering Center of AI and Future Education"},{"name":"Guangdong Provincial Department of Science and Technology, 
China"},{"name":"Zhuhai Science-Tech Innovation Bureau","award":["2320004002772"],"award-info":[{"award-number":["2320004002772"]}]},{"name":"Interdisciplinary Intelligence Super Computer Center of Beijing Normal University at Zhuhai"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Serv. Comput."],"published-print":{"date-parts":[[2025,5]]},"DOI":"10.1109\/tsc.2025.3562362","type":"journal-article","created":{"date-parts":[[2025,4,18]],"date-time":"2025-04-18T17:37:59Z","timestamp":1744997879000},"page":"1412-1427","source":"Crossref","is-referenced-by-count":12,"title":["Enhancing LLM QoS Through Cloud-Edge Collaboration: A Diffusion-Based Multi-Agent Reinforcement Learning Approach"],"prefix":"10.1109","volume":"18","author":[{"given":"Zhi","family":"Yao","sequence":"first","affiliation":[{"name":"School of Artificial Intelligence, Beijing Normal University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9375-4818","authenticated-orcid":false,"given":"Zhiqing","family":"Tang","sequence":"additional","affiliation":[{"name":"Institute of Artificial Intelligence and Future Networks, Beijing Normal University, Zhuhai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8493-4449","authenticated-orcid":false,"given":"Wenmian","family":"Yang","sequence":"additional","affiliation":[{"name":"Institute of Artificial Intelligence and Future Networks, Beijing Normal University, Zhuhai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1000-3937","authenticated-orcid":false,"given":"Weijia","family":"Jia","sequence":"additional","affiliation":[{"name":"Institute of Artificial Intelligence and Future Networks, Beijing Normal University, Zhuhai, 
China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.2300550"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2024.3353265"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2022.3186496"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/OJCOMS.2023.3320646"},{"key":"ref5","first-page":"36 187","article-title":"Memory-efficient fine-tuning of compressed large language models via sub-4-bit integer quantization","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Kim"},{"key":"ref6","first-page":"38 087","article-title":"SmoothQuant: Accurate and efficient post-training quantization for large language models","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Xiao"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-acl.507"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2022.3156047"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/mnet.2024.3376419"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.2024.3353377"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICWS60048.2023.00012"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3534619"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/LCA.2023.3296251"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/tsc.2024.3418328"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3448016.3457550"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.825"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-024-00864-x"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.59287\/icaens.1127"},{"key":"ref19","first-page":"8469","article-title":"PaLM-E: An embodied multimodal language model","volume-title":"Proc. 40th Int. Conf. Mach. 
Learn.","author":"Driess"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ASE56229.2023.00065"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TBDATA.2020.2990558"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-71682-4_5"},{"key":"ref23","first-page":"6840","article-title":"Denoising diffusion probabilistic models","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Ho"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICWS60048.2023.00088"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2024.3356178"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2022.3222765"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.14778\/3554821.3554843"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/j.dcan.2018.10.003"},{"key":"ref30","first-page":"1","article-title":"Making efficient use of demonstrations to solve hard exploration problems","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Gulcehre"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICWS62655.2024.00105"},{"key":"ref32","article-title":"Qwen technical report","author":"Bai","year":"2023"},{"key":"ref33","first-page":"47 669","article-title":"Openassistant conversations-democratizing large language model alignment","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"K\u00f6pf"},{"key":"ref35","first-page":"87","article-title":"AWQ: Activation-aware weight quantization for on-device LLM compression and acceleration","volume-title":"Proc. Mach. Learn. 
Syst.","author":"Lin"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM54140.2023.10437617"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA59077.2024.00019"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1145\/3660605.3660941"},{"key":"ref39","first-page":"20 132","article-title":"A minimalist approach to offline reinforcement learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Fujimoto"},{"key":"ref40","article-title":"CleanDiffuser: An easy-to-use modularized library for diffusion models in decision making","author":"Dong","year":"2024"},{"key":"ref41","first-page":"1","article-title":"Diffusion policies as an expressive policy class for offline reinforcement learning","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Wang"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TSC.2024.3399654"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-96-0805-8_16"},{"key":"ref44","article-title":"Efficient LLM scheduling by learning to rank","author":"Fu","year":"2024"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.14778\/3685800.3685905"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/OJVT.2024.3447449"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1145\/3638757"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/LCOMM.2019.2931688"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM.2016.7524384"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2023.3330255"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.bigscience-1.9"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/tsc.2024.3451185"},{"key":"ref53","first-page":"1057","article-title":"Policy gradient methods for reinforcement learning with function approximation","volume-title":"Proc. Adv. Neural Inf. Process. 
Syst.","author":"Sutton"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.12794\/metadc1505267"},{"key":"ref55","first-page":"15 908","article-title":"Transformer in transformer","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Han"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2022.3142079"},{"key":"ref57","article-title":"The pile: An 800GB dataset of diverse text for language modeling","author":"Gao","year":"2020"},{"key":"ref59","first-page":"24 611","article-title":"The surprising effectiveness of PPO in cooperative multi-agent games","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Yu"},{"key":"ref60","article-title":"Understanding diffusion models: A unified perspective","author":"Luo","year":"2022"}],"container-title":["IEEE Transactions on Services Computing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/4629386\/11031152\/10970093.pdf?arnumber=10970093","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,12]],"date-time":"2025-06-12T17:43:22Z","timestamp":1749750202000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10970093\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5]]},"references-count":58,"journal-issue":{"issue":"3"},"URL":"https:\/\/doi.org\/10.1109\/tsc.2025.3562362","relation":{},"ISSN":["1939-1374","2372-0204"],"issn-type":[{"value":"1939-1374","type":"electronic"},{"value":"2372-0204","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,5]]}}}