{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,17]],"date-time":"2026-05-17T20:07:15Z","timestamp":1779048435596,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":12,"publisher":"ACM","license":[{"start":{"date-parts":[[2009,6,14]],"date-time":"2009-06-14T00:00:00Z","timestamp":1244937600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2009,6,14]]},"DOI":"10.1145\/1553374.1553383","type":"proceedings-article","created":{"date-parts":[[2009,6,16]],"date-time":"2009-06-16T09:34:36Z","timestamp":1245144876000},"page":"65-72","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Predictive representations for policy gradient in POMDPs"],"prefix":"10.1145","author":[{"given":"Abdeslam","family":"Boularias","sequence":"first","affiliation":[{"name":"Laval University, Quebec, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Brahim","family":"Chaib-draa","sequence":"additional","affiliation":[{"name":"Laval University, Quebec, Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2009,6,14]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.5555\/645531.655827"},{"key":"e_1_3_2_1_2_1","volume-title":"Proc. 11th Int. Conf. Artificial Intelligence and Statistics.","author":"Aberdeen D.","year":"2007","unstructured":"Aberdeen, D., Buffet, O., &amp; Thomas, O. (2007). Policy-Gradients for PSRs and POMDPs. Proc. 11th Int. Conf. Artificial Intelligence and Statistics."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.5555\/645529.757773"},{"key":"e_1_3_2_1_4_1","first-page":"229","volume":"15","author":"Casella G.","year":"1996","unstructured":"Casella, G., &amp; Robert, C. P. (1996). Raoblackwellisation of Sampling Schemes. Biometrika, 15, 229--235.","journal-title":"Raoblackwellisation of Sampling Schemes. Biometrika"},{"key":"e_1_3_2_1_5_1","volume-title":"Predictive Representations of State. Advances in Neural Information Processing Systems 14 (pp. 1555--1561)","author":"Littman M.","year":"2002","unstructured":"Littman, M., Sutton, R., &amp; Singh, S. (2002). Predictive Representations of State. Advances in Neural Information Processing Systems 14 (pp. 1555--1561)."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/1390156.1390236"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.5555\/2073796.2073845"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.5555\/936007"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2006.282564"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.5555\/935509"},{"key":"e_1_3_2_1_11_1","volume-title":"Policy Gradient Methods for Reinforcement Learning with Function Approximation. Advances in Neural Information Processing Systems 12 (pp. 1057--1063)","author":"Sutton R. S.","year":"2000","unstructured":"Sutton, R. S., Mcallester, D., Singh, S., &amp; Mansour, Y. (2000). Policy Gradient Methods for Reinforcement Learning with Function Approximation. Advances in Neural Information Processing Systems 12 (pp. 1057--1063)."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/1102351.1102473"}],"event":{"name":"ICML '09: The 26th Annual International Conference on Machine Learning held in conjunction with the 2007 International Conference on Inductive Logic Programming","location":"Montreal Quebec Canada","acronym":"ICML '09","sponsor":["MITACS","Microsoft Research Microsoft Research","NSF"]},"container-title":["Proceedings of the 26th Annual International Conference on Machine Learning"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1553374.1553383","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1553374.1553383","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,17]],"date-time":"2026-05-17T19:51:57Z","timestamp":1779047517000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1553374.1553383"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,6,14]]},"references-count":12,"alternative-id":["10.1145\/1553374.1553383","10.1145\/1553374"],"URL":"https:\/\/doi.org\/10.1145\/1553374.1553383","relation":{},"subject":[],"published":{"date-parts":[[2009,6,14]]},"assertion":[{"value":"2009-06-14","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}