{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,21]],"date-time":"2026-03-21T06:29:03Z","timestamp":1774074543491,"version":"3.50.1"},"reference-count":31,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,7,1]],"date-time":"2020-07-01T00:00:00Z","timestamp":1593561600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61672131"],"award-info":[{"award-number":["61672131"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61773284"],"award-info":[{"award-number":["61773284"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61773087"],"award-info":[{"award-number":["61773087"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61972448"],"award-info":[{"award-number":["61972448"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004517","name":"Innovation Foundation of Tianjin University and Tianjin Key Laboratory of Advanced Networking","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004517","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Internet Things J."],"published-print":{"date-parts":[[2020,7]]},"DOI":"10.1109\/jiot.2019.2963499","type":"journal-article","created":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T21:14:21Z","timestamp":1577913261000},"page":"6191-6200","source":"Crossref","is-referenced-by-count":36,"title":["Deep Actor\u2013Critic Learning-Based Robustness Enhancement of Internet of Things"],"prefix":"10.1109","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6806-4287","authenticated-orcid":false,"given":"Ning","family":"Chen","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2324-2523","authenticated-orcid":false,"given":"Tie","family":"Qiu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1055-9513","authenticated-orcid":false,"given":"Chaoxu","family":"Mu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2964-4884","authenticated-orcid":false,"given":"Min","family":"Han","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8629-4622","authenticated-orcid":false,"given":"Pan","family":"Zhou","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref31","article-title":"Continuous control with deep reinforcement learning","author":"lillicrap","year":"2016","journal-title":"Proc Int Conf Learn Represent (ICLR)"},{"key":"ref30","article-title":"Deep reinforcement learning in large discrete action spaces","author":"dulac-arnold","year":"2015","journal-title":"Comput Sci"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.001.1900094"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1126\/science.286.5439.509"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TPDS.2019.2953745"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2011.248"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.2017.1600275"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.65.056109"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1009440108"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2018.2872013"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/MCOM.2017.1700246"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2017.2773600"},{"key":"ref28","first-page":"1352","article-title":"Reinforcement learning with deep energy-based policies","volume":"70","author":"haarnoja","year":"2017","journal-title":"Proc 34th Int Conf Mach Learn"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM.2018.8486269"},{"key":"ref27","article-title":"Deep deterministic policy gradient for urban traffic light control","author":"casas","year":"2017","journal-title":"Comput Sci"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2019.2956615"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2016.2520477"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRev.36.823"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2017.2689019"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-20267-4_18"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1088\/1742-5468\/2011\/01\/P01027"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2018.2872579"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TNET.2019.2907243"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2016.2612041"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.jnca.2011.08.007"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2017.2712560"},{"key":"ref21","author":"sutton","year":"2018","journal-title":"Reinforcement Learning An Introduction"},{"key":"ref24","first-page":"2829","article-title":"Continuous deep Q-learning with model-based acceleration","author":"gu","year":"2016","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref23","first-page":"2094","article-title":"Deep reinforcement learning with double Q-learning","author":"van hasselt","year":"2016","journal-title":"Proc 13th AAAI Conf Artif Intell"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989385"},{"key":"ref25","first-page":"387","article-title":"Deterministic policy gradient algorithms","author":"silver","year":"2014","journal-title":"Proc 31st Int Conf Int Conf Mach Learn"}],"container-title":["IEEE Internet of Things Journal"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6488907\/9138535\/08948047.pdf?arnumber=8948047","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,27]],"date-time":"2022-04-27T17:26:40Z","timestamp":1651080400000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8948047\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7]]},"references-count":31,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/jiot.2019.2963499","relation":{},"ISSN":["2327-4662","2372-2541"],"issn-type":[{"value":"2327-4662","type":"electronic"},{"value":"2372-2541","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,7]]}}}