{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T18:03:28Z","timestamp":1777658608071,"version":"3.51.4"},"reference-count":122,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"4","license":[{"start":{"date-parts":[[2023,7,1]],"date-time":"2023-07-01T00:00:00Z","timestamp":1688169600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"},{"start":{"date-parts":[[2023,7,1]],"date-time":"2023-07-01T00:00:00Z","timestamp":1688169600000},"content-version":"am","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"DOI":"10.13039\/100000005","name":"U.S. Environmental Security Technology Certification Program","doi-asserted-by":"publisher","award":["EW20-EO-5331"],"award-info":[{"award-number":["EW20-EO-5331"]}],"id":[{"id":"10.13039\/100000005","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Smart Grid"],"published-print":{"date-parts":[[2023,7]]},"DOI":"10.1109\/tsg.2022.3222323","type":"journal-article","created":{"date-parts":[[2022,11,15]],"date-time":"2022-11-15T20:39:19Z","timestamp":1668544759000},"page":"3232-3245","source":"Crossref","is-referenced-by-count":69,"title":["Fusion of Microgrid Control With Model-Free Reinforcement Learning: Review and Vision"],"prefix":"10.1109","volume":"14","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2624-560X","authenticated-orcid":false,"given":"Buxin","family":"She","sequence":"first","affiliation":[{"name":"Department of Electrical Engineering and Computer Science, The University of Tennessee at Knoxville, Knoxville, TN, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1060-7618","authenticated-orcid":false,"given":"Fangxing","family":"Li","sequence":"additional","affiliation":[{"name":"Department of Electrical Engineering and Computer Science, The University of Tennessee at Knoxville, Knoxville, TN, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4259-5925","authenticated-orcid":false,"given":"Hantao","family":"Cui","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Oklahoma State University, Stillwater, OK, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7291-2533","authenticated-orcid":false,"given":"Jingqiu","family":"Zhang","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, National University of Singapore, Cluny Road, Singapore"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9108-1093","authenticated-orcid":false,"given":"Rui","family":"Bo","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Missouri University of Science and Technology, Rolla, MO, USA"}]}],"member":"263","reference":[{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2021.3052515"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.35833\/MPCE.2021.000257"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2021.3112692"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2013.2245925"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/OAJPE.2022.3148375"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/PGSRET.2018.8686010"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/TPEL.2019.2923734"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/TEC.2020.3010049"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1016\/j.rser.2021.110992"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1016\/j.aei.2019.100945"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2022.3158254"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3032378"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijepes.2021.107339"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/JESTPE.2020.2974046"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/JSYST.2020.3047673"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1088\/1757-899X\/561\/1\/012075"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1016\/j.rser.2016.03.002"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1016\/j.rser.2021.111915"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/JSYST.2021.3077213"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2017.2762349"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2017.2703126"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2015.2396992"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2021.3124465"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2016.2521405"},{"key":"ref6","article-title":"Virtual inertia scheduling for power systems with high penetration of inverter-based resources","author":"she","year":"2022","journal-title":"arXiv 2209 06677"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2012.2213276"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2021.3092220"},{"key":"ref101","doi-asserted-by":"crossref","DOI":"10.1016\/j.epsr.2021.107266","article-title":"Analysis of gray box modelling of transformers","volume":"197","author":"h\u00f8idalen","year":"2021","journal-title":"Electr Power Syst Res"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TPEL.2019.2951694"},{"key":"ref35","article-title":"Decentralized and coordinated Vf control for islanded microgrids considering DER inadequacy and demand control","author":"she","year":"2022","journal-title":"arXiv 2206 11407"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/IEEESTD.2018.8340204"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2010.2041015"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/JESTPE.2019.2942491"},{"key":"ref31","first-page":"329","article-title":"Review of energy management and planning of islanded microgrids","volume":"6","author":"anderson","year":"2019","journal-title":"CSEE J Power Energy Syst"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-021-04301-9"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TPEC48276.2020.9042549"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/OAJPE.2022.3175129"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1016\/j.rser.2017.10.022"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/TPEL.2012.2199334"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1016\/j.apenergy.2020.116117"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2021.3071357"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1080\/00207721.2020.1803436"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/MPE.2022.3150825"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2015.2500269"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1016\/j.renene.2019.07.067"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2020.06.061"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1146\/annurev-control-042920-020211"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2021.3054625"},{"key":"ref29","first-page":"213","article-title":"Deep reinforcement learning for power system applications: An overview","volume":"6","author":"zhang","year":"2019","journal-title":"CSEE J Power Energy Syst"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JESTPE.2020.3001971"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2014.2377018"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.rser.2017.05.267"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TIE.2012.2194969"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/JSYST.2021.3074296"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2019.2931753"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2012.2197425"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2022.3141229"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.3389\/fenrg.2022.895163"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2021.3099133"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TPEL.2017.2761438"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3014977"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/JESTPE.2018.2796029"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TIA.2020.3012415"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2019.2930299"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1109\/TETCI.2020.2964886"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2019.2896618"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/ICPES47639.2019.9105413"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1109\/PESGM46819.2021.9637836"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2022.3162550"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1109\/CCWC51732.2021.9376126"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1109\/TPEL.2021.3132028"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2020.3030164"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1109\/TPEL.2020.2977765"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3038735"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/TIE.2020.3005071"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2021.3100898"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2020.3035127"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1016\/j.apenergy.2022.119123"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2022.3154718"},{"key":"ref79","article-title":"Continuous control with deep reinforcement learning","author":"lillicrap","year":"2015","journal-title":"arXiv 1509 02971"},{"key":"ref108","first-page":"1","article-title":"Attention is all you need","volume":"30","author":"vaswani","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref78","first-page":"387","article-title":"Deterministic policy gradient algorithms","author":"silver","year":"2014","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref109","article-title":"A survey on federated learning systems: Vision, hype and reality for data privacy and protection","author":"li","year":"2021","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejor.2019.06.025"},{"key":"ref107","article-title":"Evolutionary reinforcement learning","author":"khadka","year":"2018","journal-title":"arXiv 1805 07917"},{"key":"ref75","first-page":"2020","article-title":"Phasic policy gradient","author":"cobbe","year":"2021","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00304"},{"key":"ref74","article-title":"Proximal policy optimization algorithms","author":"schulman","year":"2017","journal-title":"arXiv 1707 06347"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.35833\/MPCE.2021.000424"},{"key":"ref77","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","author":"haarnoja","year":"2018","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2018.2824823"},{"key":"ref76","first-page":"1928","article-title":"Asynchronous methods for deep reinforcement learning","author":"mnih","year":"2016","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2020.3017019"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2019.2925703"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2013.2295514"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11796"},{"key":"ref111","article-title":"Contrastive behavioral similarity embeddings for generalization in reinforcement learning","author":"agarwal","year":"2021","journal-title":"arXiv 2101 05265"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11791"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2020.3041620"},{"key":"ref73","first-page":"1889","article-title":"Trust region policy optimization","author":"schulman","year":"2015","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref72","first-page":"1","article-title":"Policy gradient methods for reinforcement learning with function approximation","volume":"12","author":"sutton","year":"1999","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref110","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2991734"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10295"},{"key":"ref119","article-title":"Ensuring transient stability with guaranteed region of attraction in DC microgrids","author":"liu","year":"2022","journal-title":"IEEE Trans Power Syst"},{"key":"ref67","first-page":"351","article-title":"Playing Atari with deep reinforcement learning","volume":"21","author":"chung","year":"2013","journal-title":"Proc NIPS"},{"key":"ref117","article-title":"Applications of physics-informed neural networks in power systems&#x2014;A review","author":"huang","year":"2022","journal-title":"IEEE Trans Power Syst"},{"key":"ref69","first-page":"449","article-title":"A distributional perspective on reinforcement learning","author":"bellemare","year":"2017","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref118","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2020.3041774"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/TSG.2021.3103405"},{"key":"ref115","first-page":"1093","article-title":"Safe reinforcement learning using robust action governor","author":"li","year":"2021","journal-title":"Proc Learn Dyn Control"},{"key":"ref63","article-title":"Reinforcement learning for decision-making and control in power systems: Tutorial, review, and vision","author":"chen","year":"2021","journal-title":"arXiv 2102 01168"},{"key":"ref116","first-page":"1","article-title":"Safe model-based reinforcement learning with stability guarantees","volume":"30","author":"berkenkamp","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1007\/BF00993306"},{"key":"ref113","first-page":"2817","article-title":"Robust adversarial reinforcement learning","author":"pinto","year":"2017","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref65","article-title":"An analysis of temporal-difference learning with function approximation","author":"tsitsiklis","year":"1996"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-662-49674-9_8"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1016\/j.seta.2022.102066"},{"key":"ref122","doi-asserted-by":"publisher","DOI":"10.1109\/LCSYS.2021.3088068"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/ISGT49243.2021.9372283"},{"key":"ref120","doi-asserted-by":"publisher","DOI":"10.1109\/TPWRS.2021.3098960"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3090266"},{"key":"ref121","first-page":"8103","article-title":"A Lyapunov-based approach to safe reinforcement learning","volume":"31","author":"chow","year":"2018","journal-title":"Proc Adv Neural Inf Process Syst"}],"container-title":["IEEE Transactions on Smart Grid"],"original-title":[],"link":[{"URL":"https:\/\/ieeexplore.ieee.org\/ielam\/5165411\/10158941\/9951405-aam.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/5165411\/10158941\/09951405.pdf?arnumber=9951405","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,10]],"date-time":"2023-07-10T19:22:55Z","timestamp":1689016975000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9951405\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,7]]},"references-count":122,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1109\/tsg.2022.3222323","relation":{},"ISSN":["1949-3053","1949-3061"],"issn-type":[{"value":"1949-3053","type":"print"},{"value":"1949-3061","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,7]]}}}