{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,11]],"date-time":"2025-12-11T19:06:29Z","timestamp":1765479989858,"version":"3.48.0"},"reference-count":64,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"24","license":[{"start":{"date-parts":[[2025,12,15]],"date-time":"2025-12-15T00:00:00Z","timestamp":1765756800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,12,15]],"date-time":"2025-12-15T00:00:00Z","timestamp":1765756800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,12,15]],"date-time":"2025-12-15T00:00:00Z","timestamp":1765756800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Intelligent Computing and Security(ICNS) Lab"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Internet Things J."],"published-print":{"date-parts":[[2025,12,15]]},"DOI":"10.1109\/jiot.2025.3625275","type":"journal-article","created":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T18:05:59Z","timestamp":1761588359000},"page":"55725-55741","source":"Crossref","is-referenced-by-count":0,"title":["CacheMoE: Task-Aware Expert Model Caching for Multitask Inference in Distributed Edge IoT Networks"],"prefix":"10.1109","volume":"12","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-6066-6865","authenticated-orcid":false,"given":"Afsana Kabir","family":"Sinthia","sequence":"first","affiliation":[{"name":"Department of Artificial Intelligence, School of Computing, Kyung Hee University, Yongin, Republic of Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0858-5563","authenticated-orcid":false,"given":"Nosin Ibna","family":"Mahbub","sequence":"additional","affiliation":[{"name":"Department of Artificial Intelligence, School of Computing, Kyung Hee University, Yongin, Republic of Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2953-7314","authenticated-orcid":false,"given":"Md Nahid","family":"Sultan","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Engineering, School of Computing, Kyung Hee University, Yongin, Republic of Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0184-6975","authenticated-orcid":false,"given":"Eui-Nam","family":"Huh","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Engineering, School of Computing, Kyung Hee University, Yongin, Republic of Korea"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/mwc.005.2400019"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/comst.2025.3568637"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref4","article-title":"An image is worth 16\u00d716 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2020","journal-title":"arXiv:2010.11929"},{"key":"ref5","first-page":"1877","article-title":"Language models are few-shot learners","volume-title":"Proc. NIPS","author":"Brown"},{"key":"ref6","article-title":"Blockchain large language models","author":"Gai","year":"2023","journal-title":"arXiv:2304.12749"},{"issue":"240","key":"ref7","first-page":"1","article-title":"PaLM: Scaling language modeling with pathways","volume":"24","author":"Chowdhery","year":"2023","journal-title":"J. Mach. Learn. Res."},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2024.3359040"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/GCWkshps58843.2023.10465123"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3054719"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3220007"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00332"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.433"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2025.3597815"},{"key":"ref16","first-page":"5547","article-title":"GLaM: Efficient scaling of language models with mixture-of-experts","volume-title":"Proc. Int. Conf. Mach. Learn.","volume":"162","author":"Du"},{"key":"ref17","first-page":"973","article-title":"GEMEL: Model merging for memory-efficient, real-time video analytics at the edge","volume-title":"Proc. 20th USENIX Symp. Networked Syst. Design Implement. (NSDI 23)","author":"Padmanabhan"},{"volume-title":"Technical Specification Group Services and System Aspects; General Packet Radio Service (GPRS) Enhancements for Evolved Universal Terrestrial Radio Access Network (E-UTRAN) Access","year":"2011","key":"ref18"},{"key":"ref19","article-title":"Wireless large AI model: Shaping the AI-native future of 6G and beyond","author":"Zhu","year":"2025","journal-title":"arXiv:2504.14653"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2016.2636843"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS60910.2024.00013"},{"key":"ref22","article-title":"CacheNet: A model caching framework for deep learning inference on the edge","author":"Fang","year":"2020","journal-title":"arXiv:2007.01793"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/BigData50022.2020.9378161"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TNSM.2022.3172370"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2021.3053055"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TNSM.2024.3403842"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM42002.2020.9322208"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/MDM.2019.00115"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM46510.2021.9685947"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/GLOBECOM42002.2020.9322101"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/VTCFall.2019.8891441"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2020.2988386"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2022.3142809"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2020.2991408"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.2993359"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2901525"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CSCWD57460.2023.10152582"},{"key":"ref38","article-title":"Edge intelligence: Architectures, challenges, and applications","author":"Xu","year":"2020","journal-title":"arXiv:2003.12172"},{"key":"ref39","article-title":"Pushing large language models to the 6G edge: Vision, challenges, and opportunities","author":"Lin","year":"2023","journal-title":"arXiv:2309.16739"},{"key":"ref40","article-title":"Cached model-as-a-resource: Provisioning large language model agents for edge intelligence in space-air-ground integrated networks","author":"Xu","year":"2024","journal-title":"arXiv:2403.05826"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1016\/j.dcan.2023.02.003"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2024.3373015"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM41043.2020.9155455"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/WCSP55476.2022.10039249"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2022.03.025"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2021.3133291"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2020.2968326"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/TETC.2025.3598369"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2025.3571023"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/MASS50613.2020.00062"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2017.2713384"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.23919\/JCC.2023.03.004"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2023.3235443"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICCAD57390.2023.10323651"},{"key":"ref55","first-page":"28441","article-title":"M3vit: Mixture-of-experts vision transformer for efficient multi-task learning with model-accelerator co-design","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"35","author":"Fan"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2022.3221271"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2023.3259688"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02638"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2022.3201983"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3384313"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2019.2953189"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3392329"},{"key":"ref63","first-page":"531","article-title":"Mutual information neural estimation","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Belghazi"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49660.2025.10890805"}],"container-title":["IEEE Internet of Things Journal"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6488907\/11293846\/11216406.pdf?arnumber=11216406","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,11]],"date-time":"2025-12-11T18:47:42Z","timestamp":1765478862000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11216406\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,15]]},"references-count":64,"journal-issue":{"issue":"24"},"URL":"https:\/\/doi.org\/10.1109\/jiot.2025.3625275","relation":{},"ISSN":["2327-4662","2372-2541"],"issn-type":[{"type":"electronic","value":"2327-4662"},{"type":"electronic","value":"2372-2541"}],"subject":[],"published":{"date-parts":[[2025,12,15]]}}}