{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,9]],"date-time":"2026-04-09T14:46:31Z","timestamp":1775745991856,"version":"3.50.1"},"reference-count":40,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"10","license":[{"start":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T00:00:00Z","timestamp":1759276800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T00:00:00Z","timestamp":1759276800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T00:00:00Z","timestamp":1759276800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62394322"],"award-info":[{"award-number":["62394322"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U22B2031"],"award-info":[{"award-number":["U22B2031"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62471066"],"award-info":[{"award-number":["62471066"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62394323"],"award-info":[{"award-number":["62394323"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62472240"],"award-info":[{"award-number":["62472240"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62132009"],"award-info":[{"award-number":["62132009"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61932016"],"award-info":[{"award-number":["61932016"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62132011"],"award-info":[{"award-number":["62132011"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["92167204"],"award-info":[{"award-number":["92167204"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Science Fund for Creative Research Groups of the National Natural Science Foundation of China","award":["62221003"],"award-info":[{"award-number":["62221003"]}]},{"DOI":"10.13039\/100018735","name":"Ant Group","doi-asserted-by":"publisher","award":["CCF-AFSGRF20210023"],"award-info":[{"award-number":["CCF-AFSGRF20210023"]}],"id":[{"id":"10.13039\/100018735","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100017582","name":"Beijing National Research Center for Information Science and Technology","doi-asserted-by":"publisher","award":["BNR2025RC01010"],"award-info":[{"award-number":["BNR2025RC01010"]}],"id":[{"id":"10.13039\/501100017582","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100017582","name":"Beijing National Research Center for Information Science and Technology","doi-asserted-by":"publisher","award":["BNR2023TD03006"],"award-info":[{"award-number":["BNR2023TD03006"]}],"id":[{"id":"10.13039\/501100017582","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100011532","name":"State Key Laboratory of Networking and Switching Technology","doi-asserted-by":"publisher","award":["NST20250203"],"award-info":[{"award-number":["NST20250203"]}],"id":[{"id":"10.13039\/501100011532","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Mobile Comput."],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1109\/tmc.2025.3531793","type":"journal-article","created":{"date-parts":[[2025,1,21]],"date-time":"2025-01-21T13:29:59Z","timestamp":1737466199000},"page":"9289-9302","source":"Crossref","is-referenced-by-count":19,"title":["Multi-Agent Reinforcement Learning for Task Offloading in Crowd-Edge Computing"],"prefix":"10.1109","volume":"24","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5165-2787","authenticated-orcid":false,"given":"Su","family":"Yao","sequence":"first","affiliation":[{"name":"Beijing National Research Center for Information Science and Technology (BNRist), Tsinghua University, Beijing, China"}]},{"given":"Mu","family":"Wang","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Networking and Switching Technology, Beijing University of Posts and Telecommunications, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2782-183X","authenticated-orcid":false,"given":"Ju","family":"Ren","sequence":"additional","affiliation":[{"name":"Beijing National Research Center for Information Science and Technology (BNRist), Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5879-7644","authenticated-orcid":false,"given":"Tianyu","family":"Xia","sequence":"additional","affiliation":[{"name":"Ant Group, Hangzhou, China"}]},{"given":"Weiqiang","family":"Wang","sequence":"additional","affiliation":[{"name":"Ant Group, Hangzhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2587-8517","authenticated-orcid":false,"given":"Ke","family":"Xu","sequence":"additional","affiliation":[{"name":"Beijing National Research Center for Information Science and Technology (BNRist), Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4847-4585","authenticated-orcid":false,"given":"Mingwei","family":"Xu","sequence":"additional","affiliation":[{"name":"Beijing National Research Center for Information Science and Technology (BNRist), Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8906-813X","authenticated-orcid":false,"given":"Hongke","family":"Zhang","sequence":"additional","affiliation":[{"name":"School of Electronic and Information Engineering, Beijing Jiaotong University, Beijing, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2018.2864559"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2018.2829513"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2021.3068748"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2019.2894306"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2020.3003307"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2018.2880407"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TIFS.2019.2939713"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.1900130"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM.2017.8057198"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.003.2300475"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2020.2983209"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2019.2961237"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2020.3036871"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2021.3066619"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/COMST.2020.2986024"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TIFS.2016.2607691"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS.2019.00212"},{"key":"ref18","first-page":"1057","article-title":"Policy gradient method for reinforcement learning with function approximation","volume-title":"Proc. 1998 IEEE Int. Conf. Robot. Automat.","author":"Sutton"},{"issue":"518","key":"ref19","first-page":"529","article-title":"Human-level control through deep reinforcement learning","volume":"7540","author":"Volodymyr","year":"2019","journal-title":"Nature"},{"key":"ref20","first-page":"1338","article-title":"Asynchronous methods for model-based reinforcement learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Zhang"},{"key":"ref21","first-page":"2961","article-title":"Actor-attention-critic for multi-agent reinforcement learning","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Iqbal"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11794"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2019.2926979"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2896999"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2018.1701054"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2019.2903088"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2020.2968427"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2018.2890685"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2018.2876279"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2020.3043038"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2020.3046737"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2021.3120050"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TCCN.2020.3027695"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2019.2929263"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2022.3213358"},{"key":"ref36","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-79995-2"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2020.3047859"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2021.3114193"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2021.3115262"}],"container-title":["IEEE Transactions on Mobile Computing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/7755\/11154819\/10848135.pdf?arnumber=10848135","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,12]],"date-time":"2025-09-12T17:32:27Z","timestamp":1757698347000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10848135\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10]]},"references-count":40,"journal-issue":{"issue":"10"},"URL":"https:\/\/doi.org\/10.1109\/tmc.2025.3531793","relation":{},"ISSN":["1536-1233","1558-0660","2161-9875"],"issn-type":[{"value":"1536-1233","type":"print"},{"value":"1558-0660","type":"electronic"},{"value":"2161-9875","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,10]]}}}