{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T15:55:05Z","timestamp":1778255705231,"version":"3.51.4"},"reference-count":32,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2023,2,1]],"date-time":"2023-02-01T00:00:00Z","timestamp":1675209600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,2,1]],"date-time":"2023-02-01T00:00:00Z","timestamp":1675209600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,2,1]],"date-time":"2023-02-01T00:00:00Z","timestamp":1675209600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61876079"],"award-info":[{"award-number":["61876079"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Human-Mach. Syst."],"published-print":{"date-parts":[[2023,2]]},"DOI":"10.1109\/thms.2022.3225867","type":"journal-article","created":{"date-parts":[[2022,12,9]],"date-time":"2022-12-09T18:42:45Z","timestamp":1670611365000},"page":"201-214","source":"Crossref","is-referenced-by-count":24,"title":["Intelligent Decision-Making and Human Language Communication Based on Deep Reinforcement Learning in a Wargame Environment"],"prefix":"10.1109","volume":"53","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4897-2007","authenticated-orcid":false,"given":"Yuxiang","family":"Sun","sequence":"first","affiliation":[{"name":"School of Engineering Management, Nanjing University, Nanjing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bo","family":"Yuan","sequence":"additional","affiliation":[{"name":"School of Computing and Mathematical Sciences, University of Leicester, Leicester, U.K."}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qi","family":"Xiang","sequence":"additional","affiliation":[{"name":"School of Management and Engineering, Nanjing University, Nanjing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiawei","family":"Zhou","sequence":"additional","affiliation":[{"name":"School of Management and Engineering, Nanjing University, Nanjing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiahui","family":"Yu","sequence":"additional","affiliation":[{"name":"School of Management and Engineering, Nanjing University, Nanjing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Di","family":"Dai","sequence":"additional","affiliation":[{"name":"School of Artificial Intelligence, Peking University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4321-1441","authenticated-orcid":false,"given":"Xianzhong","family":"Zhou","sequence":"additional","affiliation":[{"name":"School of Management and Engineering, Nanjing University, Nanjing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/SMC.2017.8123163"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/SMC.2016.7844517"},{"key":"ref3","first-page":"2637","article-title":"Modeling CGF behavior with machine learning techniques","volume-title":"Proc. Interservice\/Industry Training, Simul., Educ. Conf.","author":"Toubman","year":"2015"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1038\/nature24270"},{"key":"ref5","first-page":"1652","article-title":"Adversarial hierarchical-task network planning for complex real-time games","volume-title":"Proc. 24th Int. Conf. Artif. Intell.","author":"Ontan","year":"2015"},{"key":"ref6","first-page":"2656","volume-title":"ELF: An Extensive, Lightweight and Flexible Research Platform for Real-Time Strategy Games","volume":"30","author":"Tian","year":"2017"},{"key":"ref7","article-title":"Dota 2 with large scale deep reinforcement learning","author":"Berner","year":"2019"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CIG.2011.6032006"},{"key":"ref9","first-page":"621","article-title":"Towards playing full MOBA games with deep reinforcement learning","volume-title":"Advances in Neural Information Processing Systems","volume":"33","author":"Ye","year":"2020"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1609\/aiide.v16i1.7449"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33011206"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-019-1724-z"},{"key":"ref13","article-title":"The starcraft multi-agent challenge","author":"Samvelyan","year":"2019"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/s00530-022-00922-w"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CIG.2012.6374183"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CIG.2018.8490409"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCC.2010.2052041"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1201\/b17742"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.3390\/s21144810"},{"key":"ref20","doi-asserted-by":"crossref","first-page":"285","DOI":"10.1016\/j.future.2020.07.048","volume":"114","author":"Yun","year":"2021","journal-title":"Future Gener. Comput. Syst."},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.1998.712192"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1016\/j.ejor.2007.11.001"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2020.106685"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i02.5533"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2020.3003163"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.3390\/electronics9101668"},{"key":"ref27","article-title":"Places205-VGGNet models for scene recognition","author":"Wang","year":"2015"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2018.8545591"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA.2017.00-47"},{"key":"ref30","article-title":"Neural machine translation by jointly learning to align and translate","author":"Bahdanau","year":"2014"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2020.106198"},{"key":"ref32","first-page":"37","article-title":"Long short-term memory","volume-title":"Supervised Sequence Labelling With Recurrent Neural Networks","author":"Hochreiter","year":"2012"}],"container-title":["IEEE Transactions on Human-Machine Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6221037\/10016745\/09979044.pdf?arnumber=9979044","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,1]],"date-time":"2024-02-01T04:31:25Z","timestamp":1706761885000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9979044\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,2]]},"references-count":32,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/thms.2022.3225867","relation":{},"ISSN":["2168-2291","2168-2305"],"issn-type":[{"value":"2168-2291","type":"print"},{"value":"2168-2305","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,2]]}}}