{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,6]],"date-time":"2026-06-06T15:48:53Z","timestamp":1780760933492,"version":"3.54.1"},"reference-count":45,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2022,11,1]],"date-time":"2022-11-01T00:00:00Z","timestamp":1667260800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2022,11,1]],"date-time":"2022-11-01T00:00:00Z","timestamp":1667260800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,11,1]],"date-time":"2022-11-01T00:00:00Z","timestamp":1667260800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["2020YFB0906000"],"award-info":[{"award-number":["2020YFB0906000"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["2020YFB0906002"],"award-info":[{"award-number":["2020YFB0906002"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100005595","name":"University of California","doi-asserted-by":"publisher","award":["L22CR4556"],"award-info":[{"award-number":["L22CR4556"]}],"id":[{"id":"10.13039\/100005595","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Smart Grid"],"published-print":{"date-parts":[[2022,11]]},"DOI":"10.1109\/tsg.2022.3185975","type":"journal-article","created":{"date-parts":[[2022,6,24]],"date-time":"2022-06-24T19:36:15Z","timestamp":1656099375000},"page":"4873-4886","source":"Crossref","is-referenced-by-count":173,"title":["Multi-Agent Deep Reinforcement Learning for Voltage Control With Coordinated Active and Reactive Power Optimization"],"prefix":"10.1109","volume":"13","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9400-2490","authenticated-orcid":false,"given":"Daner","family":"Hu","sequence":"first","affiliation":[{"name":"Department of Electrical Engineering, Zhejiang University, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7105-014X","authenticated-orcid":false,"given":"Zhenhui","family":"Ye","sequence":"additional","affiliation":[{"name":"Department of Electrical Engineering, Zhejiang University, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4078-6143","authenticated-orcid":false,"given":"Yuanqi","family":"Gao","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, University of California at Riverside, Riverside, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0428-662X","authenticated-orcid":false,"given":"Zuzhao","family":"Ye","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, University of California at Riverside, Riverside, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0960-3807","authenticated-orcid":false,"given":"Yonggang","family":"Peng","sequence":"additional","affiliation":[{"name":"Department of Electrical Engineering, Zhejiang University, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5086-5465","authenticated-orcid":false,"given":"Nanpeng","family":"Yu","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, University of California at Riverside, Riverside, CA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2013.2256375"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/tia.2017.2740850"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2014.2374613"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2017.2648509"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CCTA48906.2021.9659162"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TSTE.2010.2098483"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2016.2585202"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2016.2558585"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/tsg.2018.2879572"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2014.2329842"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2017.2752234"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2018.2813400"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2015.2419134"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ISGT49243.2021.9372283"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2020.3010130"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/SmartGridComm.2019.8909741"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2019.2962625"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2020.2990179"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/tsg.2021.3060027"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2021.3058996"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"ref22","article-title":"Reinforcement learning with augmented data","author":"Laskin","year":"2020","journal-title":"arXiv:2004.14990"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/SmartGridComm.2019.8909777"},{"key":"ref24","article-title":"Model-free voltage regulation of unbalanced distribution network based on surrogate model and deep reinforcement learning","author":"Cao","year":"2020","journal-title":"arXiv:2006.13992"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/tpwrs.2019.2948132"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.apenergy.2022.118762"},{"key":"ref27","article-title":"Multi-agent actor-critic for mixed cooperative-competitive environments","author":"Lowe","year":"2017","journal-title":"arXiv:1706.02275"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2021.3050039"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/61.19266"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2014.2332712"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2006.879234"},{"key":"ref32","first-page":"2961","article-title":"Actor-attention-critic for multi-agent reinforcement learning","volume-title":"Proc. 36th Int. Conf. Mach. Learn.","volume":"97","author":"Iqbal"},{"key":"ref33","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","volume-title":"Proc. ICML","volume":"80","author":"Haarnoja"},{"key":"ref34","article-title":"Continuous control with deep reinforcement learning","author":"Lillicrap","year":"2015","journal-title":"arXiv:1509.02971"},{"key":"ref35","first-page":"1587","article-title":"Addressing function approximation error in actor-critic methods","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Fujimoto"},{"key":"ref36","article-title":"Meta-SAC: Auto-tune the entropy temperature of soft actor-critic via metagradient","author":"Wang","year":"2020","journal-title":"arXiv:2007.01932"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11492"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/TRA.2002.804040"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-71682-4_5"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/MPER.1989.4310642"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/59.119237"},{"key":"ref42","volume-title":"Web Application-Renewable Ninja","year":"2019"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1016\/j.apenergy.2018.07.065"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CACSD.2004.1393890"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.1998.712192"}],"container-title":["IEEE Transactions on Smart Grid"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/5165411\/9927219\/09805763.pdf?arnumber=9805763","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,1]],"date-time":"2024-02-01T04:32:00Z","timestamp":1706761920000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9805763\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,11]]},"references-count":45,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tsg.2022.3185975","relation":{},"ISSN":["1949-3053","1949-3061"],"issn-type":[{"value":"1949-3053","type":"print"},{"value":"1949-3061","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,11]]}}}