{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T13:31:01Z","timestamp":1762522261582,"version":"3.28.0"},"reference-count":28,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,8]]},"DOI":"10.1109\/rcar.2018.8621852","type":"proceedings-article","created":{"date-parts":[[2019,1,25]],"date-time":"2019-01-25T02:29:36Z","timestamp":1548383376000},"page":"348-353","source":"Crossref","is-referenced-by-count":2,"title":["Cooperative and Adaptive Optimal Output Regulation of Discrete-Time Multi-Agent Systems Using Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Weinan","family":"Gao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yiyang","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Adedapo","family":"Odekunle","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhong-Ping","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yunjun","family":"Yu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pingli","family":"Lu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MCAS.2009.933854"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TSMC.2015.2466191"},{"key":"ref12","article-title":"Discrete-time stable generalized self-learning optimal control with approximation errors","author":"wei","year":"2017","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCB.2010.2043839"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2016.05.008"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1049\/iet-cta.2015.0977"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2014.02.015"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2016.2548941"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2016.2548662"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1007\/s10846-016-0395-3"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"76","DOI":"10.1109\/MCS.2012.2214134","article-title":"Reinforcement learning and feedback control: Using natural decision methods to design optimal adaptive controllers","volume":"32","author":"lewis","year":"2012","journal-title":"IEEE Control Systems Magazine"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2010.2076250"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2012.06.096"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"1062","DOI":"10.1109\/TAC.2011.2169618","article-title":"Cooperative output regulation of linear multiagent systems","volume":"57","author":"su","year":"2012","journal-title":"IEEE Transactions on Automatic Control"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2016.2636930"},{"key":"ref5","first-page":"267","volume":"59","author":"huang","year":"2014","journal-title":"Cooperative output regulation of heterogeneous multi-agent systems An $H$? criterion"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2014.2360023"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2016.2594151"},{"key":"ref2","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4471-0011-9","author":"isidori","year":"2003","journal-title":"Robust Autonomous Guidance An Internal Model Approach"},{"journal-title":"Beyond Regression New Tools for Prediction and Analysis in the Behavioral Sciences","year":"1974","author":"werbos","key":"ref9"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9780898718683"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2017.2761718"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1002\/9781119132677"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2014.10.047"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2003.820143"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1137\/0315033"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.1977.1101556"},{"key":"ref25","doi-asserted-by":"crossref","DOI":"10.1093\/oso\/9780198537953.001.0001","author":"lancaster","year":"1995","journal-title":"Algebraic Riccati Equations"}],"event":{"name":"2018 IEEE International Conference on Real-time Computing and Robotics (RCAR)","start":{"date-parts":[[2018,8,1]]},"location":"Kandima, Maldives","end":{"date-parts":[[2018,8,5]]}},"container-title":["2018 IEEE International Conference on Real-time Computing and Robotics (RCAR)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8605389\/8621626\/08621852.pdf?arnumber=8621852","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,7,14]],"date-time":"2024-07-14T09:42:25Z","timestamp":1720950145000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8621852\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,8]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/rcar.2018.8621852","relation":{},"subject":[],"published":{"date-parts":[[2018,8]]}}}