{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T22:04:27Z","timestamp":1772057067085,"version":"3.50.1"},"reference-count":237,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"PERFORM Research Chair Program funded by Fondation J.-Louis L\u00e9vesque and Seatrium New Energy Laboratory, Singapore Ministry of Education (MOE) Tier 1","award":["RT5\/23"],"award-info":[{"award-number":["RT5\/23"]}]},{"name":"PERFORM Research Chair Program funded by Fondation J.-Louis L\u00e9vesque and Seatrium New Energy Laboratory, Singapore Ministry of Education (MOE) Tier 1","award":["RG24\/24"],"award-info":[{"award-number":["RG24\/24"]}]},{"name":"Nanyang Technological University (NTU) Centre for Computational Technologies in Finance"},{"name":"Research Innovation and Enterprise (RIE) 2025 Industry Alignment Fund\u2014Industry Collaboration Projects (IAF-ICP), administered by Agency for Science, Technology and Research","award":["I2301E0026"],"award-info":[{"award-number":["I2301E0026"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Commun. Surv. Tutorials"],"published-print":{"date-parts":[[2026]]},"DOI":"10.1109\/comst.2026.3665395","type":"journal-article","created":{"date-parts":[[2026,2,16]],"date-time":"2026-02-16T21:10:37Z","timestamp":1771276237000},"page":"4915-4947","source":"Crossref","is-referenced-by-count":0,"title":["From Data Mirror to Smart Copilot: A Survey on NextG Semantic Communication for Propelling Digital Twin World Into Cognitive Stage"],"prefix":"10.1109","volume":"28","author":[{"given":"Fang","family":"Zhu","sequence":"first","affiliation":[{"name":"ZTE Microelectronics R&#x0026;D Institute, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2581-951X","authenticated-orcid":false,"given":"Jiayuan","family":"Chen","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"}]},{"given":"Junjie","family":"Wen","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-0397-2162","authenticated-orcid":false,"given":"Yuye","family":"Yang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3467-0710","authenticated-orcid":false,"given":"Changyan","family":"Yi","sequence":"additional","affiliation":[{"name":"College of Computer Science and Technology, Nanjing University of Aeronautics and Astronautics, Nanjing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8258-6206","authenticated-orcid":false,"given":"Yun","family":"Tie","sequence":"additional","affiliation":[{"name":"Zhengzhou University, Zhengzhou, China"}]},{"given":"Peng","family":"Zhang","sequence":"additional","affiliation":[{"name":"Advanced Institute of Information Technology, Peking University, Hangzhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9254-0404","authenticated-orcid":false,"given":"Jun","family":"Cai","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Concordia University, Montreal, QC, Canada"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7442-7416","authenticated-orcid":false,"given":"Dusit","family":"Niyato","sequence":"additional","affiliation":[{"name":"College of Computing and Data Science, Nanyang Technological University, Jurong West, Singapore"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8972-8094","authenticated-orcid":false,"given":"Mohsen","family":"Guizani","sequence":"additional","affiliation":[{"name":"Machine Learning Department, Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI), Abu Dhabi, United Arab Emirates"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2021.3079510"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2023.3297395"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2024.110418"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2024.109587"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2023.3308717"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.3389\/fbioe.2021.793782"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2017.2743240"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3402386"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/SOSE62659.2024.10620933"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3232063"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.apradiso.2022.110579"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3421918"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.118.2200071"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3674838"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.jii.2025.100943"},{"key":"ref16","article-title":"World models for cognitive agents: Transforming edge intelligence in future networks","author":"Zhao","year":"2025","journal-title":"arXiv:2506.00417"},{"key":"ref17","article-title":"Edge general intelligence through world models and agentic AI: Fundamentals, solutions, and challenges","author":"Zhao","year":"2025","journal-title":"arXiv:2508.09561"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.02575"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/j.aei.2024.102570"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2025.3568637"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/MIOT.2025.3615709"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1016\/j.jii.2025.100799"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.2024.3411008"},{"key":"ref24","article-title":"Digital twin generation from visual data: A survey","author":"Melnik","year":"2025","journal-title":"arXiv:2504.13159"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01560"},{"key":"ref26","first-page":"2165","article-title":"RT-2: Vision-language-action models transfer web knowledge to robotic control","volume-title":"Proc. CoRL","author":"Brohan"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.2024.3507157"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2023.109764"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/j.rcim.2024.102769"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.3390\/machines9090193"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1080\/00207543.2024.2435583"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.101.2100269"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2022.3223224"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/LWC.2025.3557843"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2022.3223408"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.2300575"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3639563"},{"key":"ref38","article-title":"SWI: Speaking with intent in large language models","author":"Yin","year":"2025","journal-title":"arXiv:2503.21544"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2024.3351601"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i17.29811"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72970-6_8"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2025.3554028"},{"key":"ref43","article-title":"From understanding to utilization: A survey on explainability for large language models","author":"Luo","year":"2024","journal-title":"arXiv:2401.12874"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.52202\/079017-0607"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-acl.416"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1145\/3716846"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.005.2400366"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.003.2200616"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2023.3317629"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3401229"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2025.3574592"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2025.3581152"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2023.3333342"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2024.3520707"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2024.3443193"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2024.3435524"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-38756-7_4"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1155\/2011\/154798"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1155\/2014\/439278"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.2514\/6.2012-1818"},{"issue":"2014","key":"ref61","first-page":"1","article-title":"Digital twin: Manufacturing excellence through virtual factory replication","volume":"1","author":"Grieves","year":"2014","journal-title":"White paper"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2018.08.474"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1016\/j.dajour.2022.100039"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-32156-1_5"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.2514\/1.J055201"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.2025.3574228"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2024.110308"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1016\/j.cie.2024.110491"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1080\/09544828.2024.2326111"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2023.3310106"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2025.3527719"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/TNSM.2025.3558358"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3340132"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2024.3519331"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.2025.3526556"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/tmc.2025.3645306"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.001.2300346"},{"key":"ref78","article-title":"Image generation with supervised selection based on multimodal features for semantic communications","author":"Liang","year":"2024","journal-title":"arXiv:2411.17428"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.3390\/s21134276"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2025.3531413"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49660.2025.10889160"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1145\/3641289"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2025.3567613"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3651029"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3415470"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2024.3412852"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1145\/3600100.3623719"},{"key":"ref88","first-page":"2616","article-title":"MIDLM: Multi-intent detection with bidirectional large language models","volume-title":"Proc. COLING","author":"Yin"},{"key":"ref89","article-title":"SAM 2: Segment anything in images and videos","author":"Ravi","year":"2024","journal-title":"arXiv:2408.00714"},{"key":"ref90","article-title":"LRM: Large reconstruction model for single image to 3D","author":"Hong","year":"2023","journal-title":"arXiv:2311.04400"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1038\/s42256-025-01033-7"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2025.3531546"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2024.3422496"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1016\/j.rcim.2025.103068"},{"key":"ref95","first-page":"1316","article-title":"MobileLLM: Optimizing sub-billion parameter language models for on-device use cases","volume-title":"Proc. ICML","author":"Liu"},{"key":"ref96","article-title":"Faster segment anything: Towards lightweight SAM for mobile applications","author":"Zhang","year":"2023","journal-title":"arXiv:2306.14289"},{"key":"ref97","article-title":"VisualBERT: A simple and performant baseline for vision and language","author":"Harold Li","year":"2019","journal-title":"arXiv:1908.03557"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/WACV57701.2024.00427"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2024.3406607"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2025.3582755"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2023.3324704"},{"key":"ref102","article-title":"TIGER: Time-frequency interleaved gain extraction and reconstruction for efficient speech separation","author":"Xu","year":"2024","journal-title":"arXiv:2410.01469"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1109\/icassp49660.2025.10889530"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.2024.3366560"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2024.3516819"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.807"},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.1093\/nsr\/nwae403"},{"key":"ref108","article-title":"Cross-modal consistency in multimodal large language models","author":"Zhang","year":"2024","journal-title":"arXiv:2411.09273"},{"key":"ref109","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096509"},{"key":"ref110","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.358"},{"key":"ref111","article-title":"REGEN: Learning compact video embedding with (re-)generative decoder","author":"Zhang","year":"2025","journal-title":"arXiv:2503.08665"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.1109\/ICNP59255.2023.10355575"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.013.2100642"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1145\/3626772.3661381"},{"key":"ref115","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2005.844108"},{"key":"ref116","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2023.3257770"},{"key":"ref117","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2025.3561786"},{"key":"ref118","doi-asserted-by":"publisher","DOI":"10.1109\/TDSC.2008.11"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3385816"},{"key":"ref120","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2020.3016962"},{"key":"ref121","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2023.3339706"},{"key":"ref122","doi-asserted-by":"publisher","DOI":"10.1007\/s11432-024-4556-9"},{"key":"ref123","doi-asserted-by":"publisher","DOI":"10.1109\/MCOMSTD.2025.3585026"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2024.3418612"},{"key":"ref125","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2021.3112570"},{"key":"ref126","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2811387"},{"key":"ref127","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2018.09.014"},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2015.2417155"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3406591"},{"key":"ref130","doi-asserted-by":"publisher","DOI":"10.32604\/cmc.2025.066975"},{"key":"ref131","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2023.3290005"},{"key":"ref132","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2025.3572680"},{"key":"ref133","first-page":"1","article-title":"DTAS: Adaptive model splitting for dynamic digital twin update with edge-cloud collaboration","volume-title":"Proc. IEEE INFOCOM","author":"Chen"},{"key":"ref134","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2020.2970110"},{"key":"ref135","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2865661"},{"key":"ref136","doi-asserted-by":"publisher","DOI":"10.1109\/TNSE.2023.3342183"},{"key":"ref137","doi-asserted-by":"publisher","DOI":"10.5772\/intechopen.110475"},{"key":"ref138","article-title":"Intent3D: 3D object detection in RGB-D scans based on human intention","author":"Kang","year":"2024","journal-title":"arXiv:2405.18295"},{"key":"ref139","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02546"},{"key":"ref140","first-page":"39","article-title":"UniDoc: Unified pretraining framework for document understanding","volume-title":"Proc. NeurIPS","volume":"34","author":"Gu"},{"key":"ref141","doi-asserted-by":"publisher","DOI":"10.1109\/WACV57701.2024.00689"},{"key":"ref142","doi-asserted-by":"publisher","DOI":"10.1145\/3503250"},{"key":"ref143","doi-asserted-by":"publisher","DOI":"10.1109\/WACV57701.2024.00342"},{"key":"ref144","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10445897"},{"key":"ref145","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.02049"},{"key":"ref146","article-title":"V2V-LLM: Vehicle-to-vehicle cooperative autonomous driving with multi-modal large language models","author":"Chiu","year":"2025","journal-title":"arXiv:2502.09980"},{"key":"ref147","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3611964"},{"key":"ref148","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.290"},{"key":"ref149","doi-asserted-by":"publisher","DOI":"10.52202\/079017-0036"},{"key":"ref150","article-title":"V2X-LLM: Enhancing V2X integration and understanding in connected vehicle corridors","author":"Wu","year":"2025","journal-title":"arXiv:2503.02239"},{"key":"ref151","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i16.29710"},{"key":"ref152","doi-asserted-by":"publisher","DOI":"10.52202\/079017-4020"},{"key":"ref153","first-page":"34892","article-title":"Visual instruction tuning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"36","author":"Liu"},{"key":"ref154","first-page":"2187","article-title":"Next-GPT: Any-to-any multimodal LLM","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Wu"},{"key":"ref155","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2024.3361502"},{"key":"ref156","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00665"},{"key":"ref157","doi-asserted-by":"publisher","DOI":"10.1109\/ICCWorkshops57953.2023.10283705"},{"key":"ref158","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2024.3506286"},{"key":"ref159","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00563"},{"key":"ref160","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02010"},{"key":"ref161","first-page":"13485","article-title":"Streaming radiance fields for 3D video synthesis","volume-title":"Proc. NeurIPS","author":"Li"},{"key":"ref162","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00052"},{"key":"ref163","doi-asserted-by":"publisher","DOI":"10.1145\/3487045"},{"key":"ref164","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i1.19884"},{"key":"ref165","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.emnlp-main.319"},{"key":"ref166","article-title":"Harder tasks need more experts: Dynamic routing in MoE models","author":"Huang","year":"2024","journal-title":"arXiv:2403.07652"},{"key":"ref167","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2019.2919300"},{"key":"ref168","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2025.3556909"},{"key":"ref169","doi-asserted-by":"publisher","DOI":"10.1109\/MCOMSTD.2025.3605634"},{"key":"ref170","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2025.3539526"},{"key":"ref171","doi-asserted-by":"publisher","DOI":"10.1109\/TNSE.2018.2848960"},{"key":"ref172","doi-asserted-by":"publisher","DOI":"10.1109\/NOMS59830.2024.10575676"},{"key":"ref173","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2020.2970707"},{"key":"ref174","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2024.3397862"},{"key":"ref175","article-title":"Pilot-guided multimodal semantic communication for audio-visual event localization","author":"Yu","year":"2024","journal-title":"arXiv:2412.06208"},{"key":"ref176","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2025.3573407"},{"key":"ref177","article-title":"Conditional generative adversarial nets","author":"Mirza","year":"2014","journal-title":"arXiv:1411.1784"},{"key":"ref178","doi-asserted-by":"publisher","DOI":"10.1145\/3626235"},{"key":"ref179","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2025.3549592"},{"key":"ref180","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2024.3409428"},{"key":"ref181","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2007.897979"},{"key":"ref182","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2022.3191937"},{"key":"ref183","doi-asserted-by":"publisher","DOI":"10.21236\/AD0707853"},{"key":"ref184","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2025.3531012"},{"key":"ref185","doi-asserted-by":"publisher","DOI":"10.1109\/blackseacom.2019.8812774"},{"key":"ref186","doi-asserted-by":"publisher","DOI":"10.3390\/e25030413"},{"key":"ref187","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2011.091411.110249"},{"key":"ref188","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2023.3242718"},{"key":"ref189","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2025.3528938"},{"key":"ref190","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2020.3037374"},{"key":"ref191","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2022.3173463"},{"key":"ref192","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2022.3191085"},{"key":"ref193","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2024.3475884"},{"key":"ref194","doi-asserted-by":"publisher","DOI":"10.1109\/OJCOMS.2023.3305583"},{"key":"ref195","doi-asserted-by":"publisher","DOI":"10.1109\/LCOMM.2022.3172437"},{"key":"ref196","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.3037317"},{"key":"ref197","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2023.3266298"},{"key":"ref198","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3402556"},{"key":"ref199","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2021.3111838"},{"key":"ref200","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2025.3581600"},{"key":"ref201","article-title":"How hungry is AI? Benchmarking energy, water, and carbon footprint of LLM inference","author":"Jegham","year":"2025","journal-title":"arXiv:2505.09598"},{"key":"ref202","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-71467-2_40"},{"key":"ref203","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2025.3556091"},{"key":"ref204","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2025.3565469"},{"key":"ref205","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2024.3430486"},{"key":"ref206","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2019.2891736"},{"key":"ref207","doi-asserted-by":"publisher","DOI":"10.1109\/ICCC62479.2024.10681718"},{"key":"ref208","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2025.3577233"},{"key":"ref209","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19815-1_26"},{"key":"ref210","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3378003"},{"key":"ref211","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i15.29656"},{"key":"ref212","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10094680"},{"key":"ref213","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2021.3082521"},{"key":"ref214","first-page":"20482","article-title":"3D-LLM: Injecting the 3D world into large language models","volume-title":"Proc. NeurIPS","author":"Hong"},{"key":"ref215","article-title":"3D-VLA: A 3D vision-language-action generative world model","author":"Zhen","year":"2024","journal-title":"arXiv:2403.09631"},{"key":"ref216","article-title":"Multi-modal fusion-based multi-task semantic communication system","author":"Zhu","year":"2024","journal-title":"arXiv:2407.00964"},{"key":"ref217","doi-asserted-by":"publisher","DOI":"10.1007\/s00371-023-02853-7"},{"key":"ref218","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2025.103789"},{"key":"ref219","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.2300807"},{"key":"ref220","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2024.107538"},{"key":"ref221","article-title":"HELIOS: Adaptive model and early-exit selection for efficient LLM inference serving","author":"Kumar","year":"2025","journal-title":"arXiv:2504.10724"},{"key":"ref222","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2025.3572437"},{"key":"ref223","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2024.3395709"},{"key":"ref224","doi-asserted-by":"publisher","DOI":"10.1145\/3735633"},{"key":"ref225","article-title":"Federated continual learning for edge-AI: A comprehensive survey","author":"Wang","year":"2024","journal-title":"arXiv:2411.13740"},{"key":"ref226","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2017.2740724"},{"key":"ref227","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3352749"},{"key":"ref228","doi-asserted-by":"publisher","DOI":"10.3233\/FAIA250949"},{"key":"ref229","doi-asserted-by":"publisher","DOI":"10.1007\/s43684-023-00060-8"},{"key":"ref230","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOMWKSHPS65812.2025.11152999"},{"key":"ref231","doi-asserted-by":"publisher","DOI":"10.1109\/jsac.2026.3660010"},{"key":"ref232","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2023.3322776"},{"key":"ref233","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3382829"},{"key":"ref234","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2024.3457777"},{"key":"ref235","doi-asserted-by":"publisher","DOI":"10.1016\/j.adhoc.2024.103484"},{"key":"ref236","doi-asserted-by":"publisher","DOI":"10.1109\/SEAMS51251.2021.00015"},{"key":"ref237","doi-asserted-by":"publisher","DOI":"10.1016\/j.cma.2011.03.016"}],"container-title":["IEEE Communications Surveys &amp; Tutorials"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/9739\/11321210\/11397356.pdf?arnumber=11397356","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T21:00:21Z","timestamp":1772053221000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11397356\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"references-count":237,"URL":"https:\/\/doi.org\/10.1109\/comst.2026.3665395","relation":{},"ISSN":["1553-877X","2373-745X"],"issn-type":[{"value":"1553-877X","type":"electronic"},{"value":"2373-745X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]}}}