{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T14:33:42Z","timestamp":1730298822035,"version":"3.28.0"},"reference-count":15,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1109\/ssci44817.2019.9002811","type":"proceedings-article","created":{"date-parts":[[2020,2,21]],"date-time":"2020-02-21T07:49:24Z","timestamp":1582271364000},"page":"9-15","source":"Crossref","is-referenced-by-count":1,"title":["Deep Reinforcement Learning Based Intelligent Decision Making for Two-player Sequential Game with Uncertain Irrational Player"],"prefix":"10.1109","author":[{"given":"Zejian","family":"Zhou","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hao","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","first-page":"322","article-title":"Friend-or-foe q-learning in general-sum games","volume":"1","author":"littman","year":"2001","journal-title":"International Conference on Machine Learning"},{"article-title":"Deep reinforcement learning from self-play in imperfect-information games","year":"2016","author":"heinrich","key":"ref11"},{"key":"ref12","first-page":"805","article-title":"Fictitious self-play in extensive-form games","author":"heinrich","year":"2015","journal-title":"International Conference on Machine Learning"},{"key":"ref13","first-page":"6379","article-title":"Multi-agent actor-critic for mixed cooperative-competitive environments","author":"lowe","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref14","first-page":"242","article-title":"Multiagent reinforcement learning: theoretical framework and an algorithm","volume":"98","author":"hu","year":"1998","journal-title":"International Conference on Machine Learning"},{"year":"0","key":"ref15","article-title":"Defense advanced research projects agency"},{"key":"ref4","article-title":"Deterministic policy gradient algorithms","author":"silver","year":"2014","journal-title":"Proceedings of the 31th International Conference on Machine Learning"},{"article-title":"Playing atari with deep reinforcement learning","year":"2013","author":"mnih","key":"ref3"},{"key":"ref6","first-page":"6379","article-title":"Multi-agent actor-critic for mixed cooperative-competitive environments","author":"lowe","year":"2017","journal-title":"Advances in neural information processing systems"},{"article-title":"Episodic exploration for deep deterministic policies: An application to starcraft micromanagement tasks","year":"2016","author":"usunier","key":"ref5"},{"key":"ref8","first-page":"4190","article-title":"A unified game-theoretic approach to multiagent reinforcement learning","author":"lanctot","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/B978-1-55860-307-3.50049-6"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/SSCI.2018.8628889"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8461233"},{"key":"ref9","first-page":"746","article-title":"The dynamics of reinforcement learning in cooperative multiagent systems","author":"claus","year":"1998","journal-title":"Proceedings of the 15th National\/10th Conference on Artificial Intelligence\/Innovative Applications of Artificial Intelligence"}],"event":{"name":"2019 IEEE Symposium Series on Computational Intelligence (SSCI)","start":{"date-parts":[[2019,12,6]]},"location":"Xiamen, China","end":{"date-parts":[[2019,12,9]]}},"container-title":["2019 IEEE Symposium Series on Computational Intelligence (SSCI)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8975711\/9002648\/09002811.pdf?arnumber=9002811","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,17]],"date-time":"2022-07-17T21:51:39Z","timestamp":1658094699000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9002811\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,12]]},"references-count":15,"URL":"https:\/\/doi.org\/10.1109\/ssci44817.2019.9002811","relation":{},"subject":[],"published":{"date-parts":[[2019,12]]}}}