{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T07:54:49Z","timestamp":1774511689524,"version":"3.50.1"},"reference-count":31,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2025,10,30]],"date-time":"2025-10-30T00:00:00Z","timestamp":1761782400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,10,30]],"date-time":"2025-10-30T00:00:00Z","timestamp":1761782400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Sci. China Inf. Sci."],"published-print":{"date-parts":[[2025,11]]},"DOI":"10.1007\/s11432-025-4614-9","type":"journal-article","created":{"date-parts":[[2025,11,3]],"date-time":"2025-11-03T07:14:48Z","timestamp":1762154088000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Zero-sum game control of unmanned aerial vehicle confrontation via reinforcement learning"],"prefix":"10.1007","volume":"68","author":[{"given":"Zijun","family":"Li","sequence":"first","affiliation":[]},{"given":"Yongshuai","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Guoxing","family":"Wen","sequence":"additional","affiliation":[]},{"given":"Chengyi","family":"Xia","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,10,30]]},"reference":[{"key":"4614_CR1","doi-asserted-by":"publisher","first-page":"684","DOI":"10.1109\/TCE.2024.3368062","volume":"70","author":"X Li","year":"2024","unstructured":"Li X, Lu X, Chen W, et al. Research on UAVs reconnaissance task allocation method based on communication preservation. IEEE Trans Consumer Electron, 2024, 70: 684\u2013695","journal-title":"IEEE Trans Consumer Electron"},{"key":"4614_CR2","doi-asserted-by":"publisher","first-page":"109595","DOI":"10.1016\/j.engappai.2024.109595","volume":"139","author":"S Shahid","year":"2025","unstructured":"Shahid S, Zhen Z, Javaid U. Cooperative task assignment of heterogeneous unmanned aerial vehicles for simultaneous multidirectional attack on a moving target. Eng Appl Artif Intell, 2025, 139: 109595","journal-title":"Eng Appl Artif Intell"},{"key":"4614_CR3","doi-asserted-by":"publisher","first-page":"111830","DOI":"10.1016\/j.knosys.2024.111830","volume":"296","author":"J Li","year":"2024","unstructured":"Li J, Yang X, Yang Y, et al. Cooperative mapping task assignment of heterogeneous multi-UAV using an improved genetic algorithm. Knowl-Based Syst, 2024, 296: 111830","journal-title":"Knowl-Based Syst"},{"key":"4614_CR4","doi-asserted-by":"publisher","first-page":"1615","DOI":"10.1109\/TIV.2023.3307134","volume":"9","author":"S Chen","year":"2024","unstructured":"Chen S, Liu G, Zhou Z, et al. Robust multi-agent reinforcement learning method based on adversarial domain randomization for real-world dual-UAV cooperation. IEEE Trans Intell Veh, 2024, 9: 1615\u20131627","journal-title":"IEEE Trans Intell Veh"},{"key":"4614_CR5","doi-asserted-by":"publisher","first-page":"7034","DOI":"10.1109\/TVT.2023.3337154","volume":"73","author":"Y Chen","year":"2024","unstructured":"Chen Y, Liu G, Zhang Z, et al. Improving physical layer security for multi-UAV systems against hybrid wireless attacks. IEEE Trans Veh Technol, 2024, 73: 7034\u20137048","journal-title":"IEEE Trans Veh Technol"},{"key":"4614_CR6","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1016\/j.comcom.2024.04.004","volume":"221","author":"C Zhou","year":"2024","unstructured":"Zhou C, Kadhim K M R, Zheng X. Multi-UAVs path planning for data harvesting in adversarial scenarios. Comput Commun, 2024, 221: 42\u201353","journal-title":"Comput Commun"},{"key":"4614_CR7","doi-asserted-by":"publisher","first-page":"222302","DOI":"10.1007\/s11432-020-3228-8","volume":"64","author":"Q Y Gao","year":"2021","unstructured":"Gao Q Y, Wu H C, Zhang Y F, et al. Differential game-based analysis of multi-attacker multi-defender interaction. Sci China Inf Sci, 2021, 64: 222302","journal-title":"Sci China Inf Sci"},{"key":"4614_CR8","doi-asserted-by":"publisher","first-page":"1516","DOI":"10.1109\/JSYST.2016.2539364","volume":"11","author":"C Xia","year":"2016","unstructured":"Xia C, Ding S, Wang C, et al. Risk analysis and enhancement of cooperation yielded by the individual reputation in the spatial public goods game. IEEE Syst J, 2016, 11: 1516\u20131525","journal-title":"IEEE Syst J"},{"key":"4614_CR9","doi-asserted-by":"publisher","first-page":"817","DOI":"10.1109\/TNNLS.2022.3177461","volume":"35","author":"J Long","year":"2022","unstructured":"Long J, Yu D, Wen G, et al. Game-based backstepping design for strict-feedback nonlinear multi-agent systems based on reinforcement learning. IEEE Trans Neural Netw Learn Syst, 2022, 35: 817\u2013830","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"key":"4614_CR10","doi-asserted-by":"publisher","first-page":"1699","DOI":"10.1109\/JAS.2023.124149","volume":"11","author":"Z Gong","year":"2024","unstructured":"Gong Z, Yang F. Secure tracking control via fixed-time convergent reinforcement learning for a UAV CPS. IEEE CAA J Autom Sin, 2024, 11: 1699\u20131701","journal-title":"IEEE CAA J Autom Sin"},{"key":"4614_CR11","doi-asserted-by":"publisher","first-page":"1272","DOI":"10.1109\/TCYB.2022.3215716","volume":"54","author":"H Ren","year":"2022","unstructured":"Ren H, Jiang B, Ma Y. Zero-sum differential game-based fault-tolerant control for a class of affine nonlinear systems. IEEE Trans Cybern, 2022, 54: 1272\u20131282","journal-title":"IEEE Trans Cybern"},{"key":"4614_CR12","doi-asserted-by":"publisher","first-page":"212209","DOI":"10.1007\/s11432-023-4062-6","volume":"67","author":"S Y Lv","year":"2024","unstructured":"Lv S Y, Wu Z, Xiong J. A zero-sum hybrid stochastic differential game with impulse controls. Sci China Inf Sci, 2024, 67: 212209","journal-title":"Sci China Inf Sci"},{"key":"4614_CR13","doi-asserted-by":"publisher","first-page":"435","DOI":"10.1016\/j.ins.2015.09.001","volume":"328","author":"X Yang","year":"2016","unstructured":"Yang X, Liu D, Ma H, et al. Online approximate solution of HJI equation for unknown constrained-input nonlinear continuous-time systems. Inf Sci, 2016, 328: 435\u2013454","journal-title":"Inf Sci"},{"key":"4614_CR14","doi-asserted-by":"publisher","first-page":"110207","DOI":"10.1016\/j.automatica.2022.110207","volume":"140","author":"R Yan","year":"2022","unstructured":"Yan R, Duan X, Shi Z, et al. Matching-based capture strategies for 3D heterogeneous multiplayer reach-avoid differential games. Automatica, 2022, 140: 110207","journal-title":"Automatica"},{"key":"4614_CR15","doi-asserted-by":"publisher","first-page":"110811","DOI":"10.1016\/j.automatica.2022.110811","volume":"149","author":"H Fu","year":"2023","unstructured":"Fu H, Liu H H T. Justification of the geometric solution of a target defense game with faster defenders and a convex target area using the HJI equation. Automatica, 2023, 149: 110811","journal-title":"Automatica"},{"key":"4614_CR16","doi-asserted-by":"publisher","first-page":"1981","DOI":"10.1109\/TCYB.2025.3534463","volume":"55","author":"F Yang","year":"2025","unstructured":"Yang F, Gong Z, Wei Q, et al. Secure containment control for multi-UAV systems by fixed-time convergent reinforcement learning. IEEE Trans Cybern, 2025, 55: 1981\u20131994","journal-title":"IEEE Trans Cybern"},{"key":"4614_CR17","doi-asserted-by":"publisher","first-page":"2799","DOI":"10.1007\/s11071-022-07586-1","volume":"109","author":"J Cui","year":"2022","unstructured":"Cui J, Pan Y, Xue H, et al. Simplified optimized finite-time containment control for a class of multi-agent systems with actuator faults. Nonlinear Dyn, 2022, 109: 2799\u20132816","journal-title":"Nonlinear Dyn"},{"key":"4614_CR18","doi-asserted-by":"publisher","first-page":"212204","DOI":"10.1007\/s11432-023-4041-6","volume":"67","author":"Z P Zhang","year":"2024","unstructured":"Zhang Z P, Xia C Y, Qi G Y, et al. Multi-step state-based opacity for unambiguous weighted machines. Sci China Inf Sci, 2024, 67: 212204","journal-title":"Sci China Inf Sci"},{"key":"4614_CR19","doi-asserted-by":"publisher","first-page":"4969","DOI":"10.1109\/TII.2019.2894282","volume":"15","author":"G Wen","year":"2019","unstructured":"Wen G, Chen C L P, Ge S S, et al. Optimized adaptive nonlinear tracking control using actor-critic reinforcement learning strategy. IEEE Trans Ind Inf, 2019, 15: 4969\u20134977","journal-title":"IEEE Trans Ind Inf"},{"key":"4614_CR20","first-page":"6302","volume":"17","author":"Z Li","year":"2023","unstructured":"Li Z, Song Y, Wen G. Reinforcement learning based optimized sliding-mode consensus control of high-order nonlinear canonical dynamic multiagent system. IEEE Syst J, 2023, 17: 6302\u20136311","journal-title":"IEEE Syst J"},{"key":"4614_CR21","doi-asserted-by":"publisher","first-page":"5212","DOI":"10.1002\/rnc.7259","volume":"34","author":"Y Song","year":"2024","unstructured":"Song Y, Li Z, Li B, et al. Optimized leader-follower consensus control using combination of reinforcement learning and sliding mode mechanism for multiple robot manipulator system. Intl J Robust Nonlinear, 2024, 34: 5212\u20135228","journal-title":"Intl J Robust Nonlinear"},{"key":"4614_CR22","doi-asserted-by":"publisher","first-page":"6075","DOI":"10.1109\/TAES.2024.3401668","volume":"60","author":"G Wen","year":"2024","unstructured":"Wen G, Yu D, Zhao Y. Optimized fuzzy attitude control of quadrotor unmanned aerial vehicle using adaptive reinforcement learning strategy. IEEE Trans Aerosp Electron Syst, 2024, 60: 6075\u20136083","journal-title":"IEEE Trans Aerosp Electron Syst"},{"key":"4614_CR23","doi-asserted-by":"publisher","first-page":"545","DOI":"10.1002\/rnc.6460","volume":"33","author":"G Wen","year":"2023","unstructured":"Wen G, Dou H, Li B. Adaptive fuzzy leader-follower consensus control using sliding mode mechanism for a class of high-order unknown nonlinear dynamic multi-agent systems. Intl J Robust Nonlinear, 2023, 33: 545\u2013558","journal-title":"Intl J Robust Nonlinear"},{"key":"4614_CR24","doi-asserted-by":"publisher","first-page":"1872","DOI":"10.1109\/TCYB.2016.2623901","volume":"47","author":"W Yu","year":"2016","unstructured":"Yu W, Wang H, Cheng F, et al. Second-order consensus in multiagent systems via distributed sliding mode control. IEEE Trans Cybern, 2016, 47: 1872\u20131881","journal-title":"IEEE Trans Cybern"},{"key":"4614_CR25","doi-asserted-by":"publisher","first-page":"070216","DOI":"10.1007\/s11432-017-9407-6","volume":"61","author":"B R Zhao","year":"2018","unstructured":"Zhao B R, Peng Y J, Song Y N, et al. Sliding mode control for consensus tracking of second-order nonlinear multi-agent systems driven by brownian motion. Sci China Inf Sci, 2018, 61: 070216","journal-title":"Sci China Inf Sci"},{"key":"4614_CR26","doi-asserted-by":"publisher","first-page":"2009","DOI":"10.1016\/j.neucom.2017.10.041","volume":"275","author":"Q Qu","year":"2018","unstructured":"Qu Q, Zhang H, Yu R, et al. Neural network-based H\u221e sliding mode control for nonlinear systems with actuator faults and unmatched disturbances. Neurocomputing, 2018, 275: 2009\u20132018","journal-title":"Neurocomputing"},{"key":"4614_CR27","doi-asserted-by":"publisher","first-page":"4010","DOI":"10.1109\/TFUZZ.2023.3273566","volume":"31","author":"H Zhao","year":"2023","unstructured":"Zhao H, Zong G, Zhao X, et al. Hierarchical sliding-mode surface-based adaptive critic tracking control for nonlinear multiplayer zero-sum games via generalized fuzzy hyperbolic models. IEEE Trans Fuzzy Syst, 2023, 31: 4010\u20134023","journal-title":"IEEE Trans Fuzzy Syst"},{"key":"4614_CR28","first-page":"494","volume":"69","author":"G Cui","year":"2022","unstructured":"Cui G, Yang W, Yu J, et al. Fixed-time prescribed performance adaptive trajectory tracking control for a quav. IEEE Trans Circ Syst II, 2022, 69: 494\u2013498","journal-title":"IEEE Trans Circ Syst II"},{"key":"4614_CR29","doi-asserted-by":"publisher","first-page":"5546","DOI":"10.1109\/TSMC.2021.3130070","volume":"52","author":"G Wen","year":"2021","unstructured":"Wen G, Li B. Optimized leader-follower consensus control using reinforcement learning for a class of second-order nonlinear multiagent systems. IEEE Trans Syst Man Cybern Syst, 2021, 52: 5546\u20135555","journal-title":"IEEE Trans Syst Man Cybern Syst"},{"key":"4614_CR30","doi-asserted-by":"publisher","first-page":"246","DOI":"10.1162\/neco.1991.3.2.246","volume":"3","author":"J Park","year":"1991","unstructured":"Park J, Sandberg I W. Universal approximation using radial-basis-function networks. Neural Comput, 1991, 3: 246\u2013257","journal-title":"Neural Comput"},{"key":"4614_CR31","doi-asserted-by":"publisher","first-page":"674","DOI":"10.1109\/TNN.2004.826130","volume":"15","author":"S S Ge","year":"2004","unstructured":"Ge S S, Wang C. Adaptive neural control of uncertain MIMO nonlinear systems. IEEE Trans Neural Netw, 2004, 15: 674\u2013692","journal-title":"IEEE Trans Neural Netw"}],"container-title":["Science China Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-025-4614-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11432-025-4614-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-025-4614-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,3]],"date-time":"2025-11-03T07:14:49Z","timestamp":1762154089000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11432-025-4614-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,30]]},"references-count":31,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2025,11]]}},"alternative-id":["4614"],"URL":"https:\/\/doi.org\/10.1007\/s11432-025-4614-9","relation":{},"ISSN":["1674-733X","1869-1919"],"issn-type":[{"value":"1674-733X","type":"print"},{"value":"1869-1919","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,10,30]]},"assertion":[{"value":"23 June 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 August 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 September 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 October 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"210211"}}