{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,16]],"date-time":"2026-01-16T04:16:46Z","timestamp":1768537006052,"version":"3.49.0"},"reference-count":47,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2022,9,1]],"date-time":"2022-09-01T00:00:00Z","timestamp":1661990400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2022,9,1]],"date-time":"2022-09-01T00:00:00Z","timestamp":1661990400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2022,9,1]],"date-time":"2022-09-01T00:00:00Z","timestamp":1661990400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2022,9,1]],"date-time":"2022-09-01T00:00:00Z","timestamp":1661990400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2022,9,1]],"date-time":"2022-09-01T00:00:00Z","timestamp":1661990400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2022,9,1]],"date-time":"2022-09-01T00:00:00Z","timestamp":1661990400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,9,1]],"date-time":"2022-09-01T00:00:00Z","timestamp":1661990400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Information Sciences"],"published-print":{"date-parts":[[2022,9]]},"DOI":"10.1016\/j.ins.2022.07.181","type":"journal-article","created":{"date-parts":[[2022,8,4]],"date-time":"2022-08-04T22:32:21Z","timestamp":1659652341000},"page":"401-424","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":15,"special_numbering":"C","title":["Optimal couple-group tracking control for the heterogeneous multi-agent systems with cooperative-competitive interactions via reinforcement learning method"],"prefix":"10.1016","volume":"610","author":[{"given":"Jun","family":"Li","sequence":"first","affiliation":[]},{"given":"Lianghao","family":"Ji","sequence":"additional","affiliation":[]},{"given":"Cuijuan","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Huaqing","family":"Li","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"issue":"2","key":"10.1016\/j.ins.2022.07.181_b0005","doi-asserted-by":"crossref","first-page":"560","DOI":"10.1109\/TITS.2017.2750073","article-title":"A probabilistic framework for tracking the formation and evolution of multi-vehicle groups in public traffic in the presence of observation uncertainties","volume":"19","author":"Wang","year":"2018","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"issue":"4","key":"10.1016\/j.ins.2022.07.181_b0010","doi-asserted-by":"crossref","first-page":"494","DOI":"10.1109\/TSMC.2013.2259155","article-title":"A new consensus model for group decision making problems with nonhomogeneous experts","volume":"44","author":"Pirez","year":"2014","journal-title":"IEEE Trans. Syst., Man, Cybern. Syst."},{"issue":"6","key":"10.1016\/j.ins.2022.07.181_b0015","doi-asserted-by":"crossref","first-page":"340","DOI":"10.1016\/j.sysconle.2010.03.009","article-title":"Group consensus in multi-agent systems with switching topologies and communication delays","volume":"59","author":"Yu","year":"2010","journal-title":"Syst. Control Lett."},{"issue":"3","key":"10.1016\/j.ins.2022.07.181_b0020","doi-asserted-by":"crossref","first-page":"532","DOI":"10.1002\/rnc.2904","article-title":"Group consensus control for double-integrator dynamic multiagent systems with fixed communication topology","volume":"24","author":"Feng","year":"2014","journal-title":"Int. J. Robust Nonlinear Control"},{"issue":"6","key":"10.1016\/j.ins.2022.07.181_b0025","doi-asserted-by":"crossref","first-page":"1888","DOI":"10.1109\/TCYB.2017.2716970","article-title":"Event-triggered communication for leader-following consensus of second-order multiagent systems","volume":"48","author":"Zhao","year":"2018","journal-title":"IEEE Trans. Cybern."},{"issue":"12","key":"10.1016\/j.ins.2022.07.181_b0030","doi-asserted-by":"crossref","first-page":"4122","DOI":"10.1109\/TCYB.2016.2600753","article-title":"On group synchronization for interacting clusters of heterogeneous systems","volume":"47","author":"Qin","year":"2017","journal-title":"IEEE Trans. Cybern."},{"key":"10.1016\/j.ins.2022.07.181_b0035","doi-asserted-by":"crossref","first-page":"262","DOI":"10.1016\/j.neucom.2013.12.024","article-title":"On pinning group consensus for dynamical multiagent networks with general connected topology","volume":"135","author":"Liao","year":"2014","journal-title":"Neurocomputing"},{"issue":"11","key":"10.1016\/j.ins.2022.07.181_b0040","doi-asserted-by":"crossref","first-page":"7133","DOI":"10.1109\/TIE.2016.2584009","article-title":"Clustered event-triggered consensus analysis: an impulsive framework","volume":"63","author":"Xu","year":"2016","journal-title":"IEEE Trans. Ind. Electron."},{"issue":"2","key":"10.1016\/j.ins.2022.07.181_b0045","doi-asserted-by":"crossref","first-page":"259","DOI":"10.1080\/00207179.2015.1072876","article-title":"Group consensus control for heterogeneous multi-agent systems with fixed and switching topologies","volume":"89","author":"Wen","year":"2016","journal-title":"Int. J. Control"},{"issue":"4","key":"10.1016\/j.ins.2022.07.181_b0050","doi-asserted-by":"crossref","first-page":"566","DOI":"10.1109\/TNNLS.2013.2237786","article-title":"Cluster consensus in discrete-time networks of multiagents with inter-cluster nonidentical inputs","volume":"24","author":"Han","year":"2013","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"issue":"3","key":"10.1016\/j.ins.2022.07.181_b0055","doi-asserted-by":"crossref","first-page":"793","DOI":"10.1109\/TAC.2014.2330428","article-title":"Achieving cluster consensus in continuous time networks of multi-agents with inter-cluster non-identical inputs","volume":"60","author":"Han","year":"2015","journal-title":"IEEE Trans. Autom. Control"},{"key":"10.1016\/j.ins.2022.07.181_b0060","doi-asserted-by":"crossref","first-page":"247","DOI":"10.1016\/j.ins.2020.05.085","article-title":"Group consensus via pinning control for a class of heterogeneous multi-agent systems with input constraints","volume":"542","author":"Li","year":"2021","journal-title":"Inf. Sci."},{"key":"10.1016\/j.ins.2022.07.181_b0065","first-page":"1","article-title":"Distributed model reference adaptive optimization of disturbed multiagent systems with intermittent communications","volume":"99","author":"Guo","year":"2020","journal-title":"IEEE Trans. Cybern."},{"key":"10.1016\/j.ins.2022.07.181_b0070","first-page":"1","article-title":"Distributed optimization of multi-agent systems against unmatched disturbances: A hierarchical integral control framework","volume":"99","author":"Guo","year":"2021","journal-title":"IEEE Trans. Syst. Man Cybern.: Syst."},{"issue":"6","key":"10.1016\/j.ins.2022.07.181_b0075","first-page":"2902","article-title":"Lyapunov Redesign-based optimal consensus control for multi-agent Systems with uncertain dynamics","volume":"69","author":"Guo","year":"2022","journal-title":"IEEE Trans. Circuits Syst. II Express Briefs"},{"key":"10.1016\/j.ins.2022.07.181_b0080","doi-asserted-by":"crossref","unstructured":"Y. Liu, Z. Wang, Optimal output synchronization of heterogeneous multi-agent systems using measured input-output data, 582 (2022) 462\u2013479.","DOI":"10.1016\/j.ins.2021.08.044"},{"key":"10.1016\/j.ins.2022.07.181_b0085","doi-asserted-by":"crossref","unstructured":"B. Yan, P. Shi, C. Lim, Z. Shi, Optimal robust formation control for heterogeneous multi-agent systems based on reinforcement learning, 32 (5) (2022) 1049-8923.","DOI":"10.1002\/rnc.5828"},{"issue":"8","key":"10.1016\/j.ins.2022.07.181_b0090","doi-asserted-by":"crossref","first-page":"1556","DOI":"10.1016\/j.automatica.2011.03.005","article-title":"Multi-player non-zero-sum games: online adaptive learning solution of coupled Hamilton-Jacobi equations","volume":"47","author":"Vamvoudakis","year":"2011","journal-title":"Automatica"},{"key":"10.1016\/j.ins.2022.07.181_b0095","series-title":"Approximate dynamic programming for real-time control and neural modeling, Handbook of Intelligent Control","author":"Werbos","year":"1992"},{"issue":"2","key":"10.1016\/j.ins.2022.07.181_b0100","doi-asserted-by":"crossref","first-page":"39","DOI":"10.1109\/MCI.2009.932261","article-title":"Adaptive dynamic programming: An introduction","volume":"4","author":"Wang","year":"2009","journal-title":"IEEE Comput. Intell. Mag."},{"issue":"11","key":"10.1016\/j.ins.2022.07.181_b0105","doi-asserted-by":"crossref","first-page":"1544","DOI":"10.1109\/TSMC.2015.2492941","article-title":"Data-based adaptive critic designs for non-linear robust optimal control with uncertain dynamics","volume":"46","author":"Wang","year":"2016","journal-title":"IEEE Trans. Syst. Man Cyber. Syst."},{"key":"10.1016\/j.ins.2022.07.181_b0110","doi-asserted-by":"crossref","first-page":"84","DOI":"10.1016\/j.ins.2020.11.057","article-title":"Optimal tracking control based on reinforcement learning value iteration algorithm for time-delayed nonlinear systems with external disturbances and input constraints","volume":"554","author":"Mohammadi","year":"2021","journal-title":"Inf. Sci."},{"issue":"25","key":"10.1016\/j.ins.2022.07.181_b0115","doi-asserted-by":"crossref","first-page":"368","DOI":"10.1016\/j.ins.2022.05.048","article-title":"Optimized tracking control based on reinforcement learning for a class of high-order unknown nonlinear dynamic systems","volume":"606","author":"Wen","year":"2022","journal-title":"Inf. Sci."},{"issue":"2","key":"10.1016\/j.ins.2022.07.181_b0120","doi-asserted-by":"crossref","first-page":"402","DOI":"10.1109\/TCYB.2018.2856510","article-title":"Finite-horizon optimal consensus control for unknown multiagent state-delay systems","volume":"50","author":"Zhang","year":"2020","journal-title":"IEEE Trans. Cybern."},{"issue":"4","key":"10.1016\/j.ins.2022.07.181_b0125","doi-asserted-by":"crossref","first-page":"988","DOI":"10.1109\/TSMCB.2008.922019","article-title":"Adaptive critic learning techniques for engine torque and air-fuel ratio control","volume":"38","author":"Liu","year":"2008","journal-title":"IEEE Trans. Syst., Man, Cybern. B Cybern."},{"issue":"2","key":"10.1016\/j.ins.2022.07.181_b0130","doi-asserted-by":"crossref","first-page":"493","DOI":"10.1109\/TEC.2008.2001456","article-title":"Coordinated reactive power control of a large wind farm and a statcom using heuristic dynamic programming","volume":"24","author":"Qiao","year":"2009","journal-title":"IEEE Trans. Energy Convers."},{"key":"10.1016\/j.ins.2022.07.181_b0135","doi-asserted-by":"crossref","first-page":"213","DOI":"10.1016\/j.comcom.2021.07.010","article-title":"Reinforcement learning multi-agent system for faults diagnosis of mircoservices in industrial settings","volume":"177","author":"Belhadi","year":"2021","journal-title":"Comput. Commun."},{"issue":"12","key":"10.1016\/j.ins.2022.07.181_b0140","doi-asserted-by":"crossref","first-page":"3038","DOI":"10.1016\/j.automatica.2014.10.047","article-title":"Multi-agent discrete-time graphical games and reinforcement learning solutions","volume":"50","author":"Abouheaf","year":"2014","journal-title":"Automatica"},{"issue":"8","key":"10.1016\/j.ins.2022.07.181_b0145","doi-asserted-by":"crossref","first-page":"1825","DOI":"10.1016\/j.automatica.2012.05.049","article-title":"Optimal control of unknown non-affine nonlinear discrete-time systems based on adaptive dynamic programming","volume":"48","author":"Wang","year":"2012","journal-title":"Automatica"},{"issue":"3","key":"10.1016\/j.ins.2022.07.181_b0150","doi-asserted-by":"crossref","first-page":"621","DOI":"10.1109\/TNNLS.2013.2281663","article-title":"Policy iteration adaptive dynamic programming algorithm for discrete-time nonlinear system","volume":"25","author":"Liu","year":"2014","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"issue":"5","key":"10.1016\/j.ins.2022.07.181_b0155","doi-asserted-by":"crossref","first-page":"4091","DOI":"10.1109\/TIE.2016.2542134","article-title":"Data-driven optimal consensus control for discrete-time multi-agent systems with unknown dynamics using reinforcement learning method","volume":"64","author":"Zhang","year":"2017","journal-title":"IEEE Trans. Ind. Electron."},{"issue":"7","key":"10.1016\/j.ins.2022.07.181_b0160","doi-asserted-by":"crossref","first-page":"3034","DOI":"10.1109\/TNNLS.2020.3009214","article-title":"Reinforcement learning-based optimal tracking control of an unknown unmanned surface vehicle","volume":"32","author":"Wang","year":"2021","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"10.1016\/j.ins.2022.07.181_b0165","doi-asserted-by":"crossref","first-page":"9363","DOI":"10.1007\/s00521-021-05696-2","article-title":"Optimal tracking control of switched systems applied in grid-connected hybrid generation using reinforcement learning","volume":"33","author":"Sun","year":"2021","journal-title":"Neural Comput. Appl."},{"key":"10.1016\/j.ins.2022.07.181_b0170","doi-asserted-by":"crossref","unstructured":"Z. Peng, R. Luo, J. Hu, K. Shi, B.K. Ghosh, Distributed optimal tracking control of discrete-time multiagent systems via event-triggered reinforcement learning, IEEE Trans. Circuits Syst. I: Regular Papers. doi: 10.1109\/TCSI.2022.3177407.","DOI":"10.1109\/TCSI.2022.3177407"},{"key":"10.1016\/j.ins.2022.07.181_b0175","doi-asserted-by":"crossref","first-page":"84","DOI":"10.1016\/j.ins.2020.11.057","article-title":"Optimal tracking control based on reinforcement learning value iteration algorithm for time-delayed nonlinear systems with external disturbances and input constraints","volume":"554","author":"Mohammadi","year":"2021","journal-title":"Inf. Sci."},{"issue":"30","key":"10.1016\/j.ins.2022.07.181_b0180","doi-asserted-by":"crossref","first-page":"92","DOI":"10.1016\/j.neucom.2018.08.048","article-title":"Couple-group consensus for discrete-time heterogeneous multiagent systems with cooperative-competitive interactions and time delays","volume":"319","author":"Jiang","year":"2018","journal-title":"Neurocomputing"},{"issue":"7","key":"10.1016\/j.ins.2022.07.181_b0185","first-page":"1618","article-title":"Energy-efficient distributed filtering in sensor networks: a unified switched system approach","volume":"47","author":"Zhang","year":"2017","journal-title":"IEEE Trans. Cybern."},{"key":"10.1016\/j.ins.2022.07.181_b0190","doi-asserted-by":"crossref","first-page":"189","DOI":"10.1016\/j.ins.2018.12.079","article-title":"Data-driven optimal tracking control of discrete-time multi-agent systems with two-stage policy iteration algorithm","volume":"481","author":"Peng","year":"2019","journal-title":"Inf. Sci."},{"issue":"10","key":"10.1016\/j.ins.2022.07.181_b0195","first-page":"243","article-title":"Dynamical consensus seeking of heterogeneous multi-agent systems under input delays","volume":"26","author":"Liu","year":"2012","journal-title":"Int. J. Commun. Syst."},{"key":"10.1016\/j.ins.2022.07.181_b0200","doi-asserted-by":"crossref","first-page":"278","DOI":"10.1016\/j.neucom.2015.10.060","article-title":"Dynamical group consensus of heterogeneous multi-agent systems with input time delays","volume":"175","author":"Wen","year":"2016","journal-title":"Neurocomputing"},{"issue":"2","key":"10.1016\/j.ins.2022.07.181_b0205","first-page":"241","article-title":"Cluster consensus in networks of agents with weighted cooperative-competitive interactions","volume":"65","author":"Zhan","year":"2018","journal-title":"IEEE Trans. Circuits Syst. II Express Briefs"},{"issue":"1","key":"10.1016\/j.ins.2022.07.181_b0210","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s11425-013-4750-6","article-title":"Cluster synchronization of a class of multiagent systems with a bipartite graph topology","volume":"57","author":"Wang","year":"2014","journal-title":"Sci. China"},{"issue":"12","key":"10.1016\/j.ins.2022.07.181_b0215","doi-asserted-by":"crossref","first-page":"10951","DOI":"10.1109\/TIE.2019.2958277","article-title":"Optimal model-free output synchronization of heterogeneous multiagent systems under switching topologies","volume":"67","author":"Mu","year":"2020","journal-title":"IEEE Trans. Ind. Electron."},{"issue":"6","key":"10.1016\/j.ins.2022.07.181_b0220","doi-asserted-by":"crossref","first-page":"1747","DOI":"10.1109\/TCYB.2017.2714173","article-title":"Distributed optimal consensus control for multiagent systems with input delay","volume":"48","author":"Zhang","year":"2018","journal-title":"IEEE Trans. Cybern."},{"issue":"1","key":"10.1016\/j.ins.2022.07.181_b0225","doi-asserted-by":"crossref","first-page":"152","DOI":"10.1109\/TFUZZ.2014.2310238","article-title":"Leader-based optimal coordination control for the consensus problem of multiagent differential games via fuzzy adaptive dynamic programming","volume":"23","author":"Zhang","year":"2015","journal-title":"IEEE Trans. Fuzzy Syst."},{"key":"10.1016\/j.ins.2022.07.181_b0230","series-title":"Adaptive control tutorial","author":"Ioannou","year":"2006"},{"key":"10.1016\/j.ins.2022.07.181_b0235","doi-asserted-by":"crossref","unstructured":"C. Liu, F. Liu, Consensus problem of delayed linear multi-agent systems, Springer, 2017. doi: 10.1007\/978-981-10-2492-4.","DOI":"10.1007\/978-981-10-2492-4"}],"container-title":["Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0020025522008726?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0020025522008726?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T05:47:17Z","timestamp":1758088037000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0020025522008726"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,9]]},"references-count":47,"alternative-id":["S0020025522008726"],"URL":"https:\/\/doi.org\/10.1016\/j.ins.2022.07.181","relation":{},"ISSN":["0020-0255"],"issn-type":[{"value":"0020-0255","type":"print"}],"subject":[],"published":{"date-parts":[[2022,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Optimal couple-group tracking control for the heterogeneous multi-agent systems with cooperative-competitive interactions via reinforcement learning method","name":"articletitle","label":"Article Title"},{"value":"Information Sciences","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.ins.2022.07.181","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2022 Elsevier Inc. All rights reserved.","name":"copyright","label":"Copyright"}]}}