{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,17]],"date-time":"2026-03-17T18:38:25Z","timestamp":1773772705594,"version":"3.50.1"},"reference-count":45,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,5,30]]},"DOI":"10.1109\/icra48506.2021.9561463","type":"proceedings-article","created":{"date-parts":[[2021,10,19]],"date-time":"2021-10-19T20:28:35Z","timestamp":1634675315000},"page":"4509-4515","source":"Crossref","is-referenced-by-count":23,"title":["Anytime Game-Theoretic Planning with Active Reasoning About Humans\u2019 Latent States for Human-Centered Robots"],"prefix":"10.1109","author":[{"given":"Ran","family":"Tian","sequence":"first","affiliation":[]},{"given":"Liting","family":"Sun","sequence":"additional","affiliation":[]},{"given":"Masayoshi","family":"Tomizuka","sequence":"additional","affiliation":[]},{"given":"David","family":"Isele","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2019.8916944"},{"key":"ref38","first-page":"1433","article-title":"Maximum entropy inverse reinforcement learning","volume":"8","author":"ziebart","year":"2008","journal-title":"AAAI"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-08-042375-3.50010-X"},{"key":"ref32","doi-asserted-by":"crossref","first-page":"34","DOI":"10.1126\/science.153.3731.34","article-title":"Dynamic programming","volume":"153","author":"bellman","year":"1966","journal-title":"Science"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.1974.1100635"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781139344203"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ITSC.2019.8916982"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2012.6425906"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.2514\/6.2009-5876"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1145\/584091.584093"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.23919\/ACC.2018.8430842"},{"key":"ref40","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v35i7.16750","article-title":"Bounded risk-sensitive markov games: Forward policy design and inverse reward learning with iterative reasoning and cumulative prospect theory","author":"tian","year":"2021","journal-title":"AAAI Conference on Artificial Intelligence"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2018.8619275"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CDC40024.2019.9029646"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1017\/9781139061759"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/BF00935561"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1111\/1468-0262.00239"},{"key":"ref16","first-page":"1025","article-title":"Point-based value iteration: An anytime algorithm for pomdps","volume":"3","author":"pineau","year":"2003","journal-title":"IJCAI"},{"key":"ref17","first-page":"2329","article-title":"Point-based value iteration for continuous pomdps","volume":"7","author":"porta","year":"2006","journal-title":"Journal of Machine Learning Research"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2008.IV.009"},{"key":"ref19","article-title":"Open-loop plans in multi-robot pomdps","author":"yu","year":"2005","journal-title":"Technical report Stanford CS Dept Tech Rep"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1006\/game.1995.1023"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1111\/j.1468-0262.2007.00810.x"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/j.geb.2017.09.009"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1257\/aer.91.5.1402"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2016.7759036"},{"key":"ref29","article-title":"Trust-aware decision making for human-robot collaboration: Model learning and planning","volume":"9","author":"chen","year":"2020","journal-title":"Human Robot Interaction"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/2600057.2602907"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8794007"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2016.XII.029"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1820676116"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.2307\/j.ctvjsf522"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.23919\/ECC.2019.8795627"},{"key":"ref20","doi-asserted-by":"crossref","first-page":"1436","DOI":"10.1609\/aaai.v27i1.8547","article-title":"Open-loop planning in large-scale stochastic domains","author":"weinstein","year":"2013","journal-title":"Proceedings of the Twenty-seventh AAAI Conference on Artificial Intelligence"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CACSD.2010.5612665"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33017941"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/2739480.2754811"},{"key":"ref24","article-title":"Sparse tree search optimality guarantees in pomdps with continuous observation spaces","author":"lim","year":"2019"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1257\/aer.96.5.1737"},{"key":"ref23","first-page":"2164","article-title":"Monte-carlo planning in large pomdps","author":"silver","year":"2010","journal-title":"Advances in neural information processing systems"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.23919\/ACC45564.2020.9147974"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/0167-2681(94)90103-1"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/IVS.2015.7225830"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1162\/0033553041502225"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1162\/JEEA.2009.7.2-3.365"}],"event":{"name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","location":"Xi'an, China","start":{"date-parts":[[2021,5,30]]},"end":{"date-parts":[[2021,6,5]]}},"container-title":["2021 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9560720\/9560666\/09561463.pdf?arnumber=9561463","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,12]],"date-time":"2023-01-12T17:53:34Z","timestamp":1673546014000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9561463\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,5,30]]},"references-count":45,"URL":"https:\/\/doi.org\/10.1109\/icra48506.2021.9561463","relation":{},"subject":[],"published":{"date-parts":[[2021,5,30]]}}}