{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T14:03:51Z","timestamp":1730297031747,"version":"3.28.0"},"reference-count":9,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012,4]]},"DOI":"10.1109\/siu.2012.6204703","type":"proceedings-article","created":{"date-parts":[[2012,6,1]],"date-time":"2012-06-01T14:52:14Z","timestamp":1338562334000},"page":"1-4","source":"Crossref","is-referenced-by-count":0,"title":["Importance sampling for model-based reinforcement learning"],"prefix":"10.1109","author":[{"given":"Orhan","family":"Sonmez","sequence":"first","affiliation":[]},{"given":"A. Taylan","family":"Cemgil","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"3","first-page":"387","article-title":"Introduction to Machine Learning","volume":"56","author":"alpaydin","year":"2004","journal-title":"Machine Learning"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.2200\/S00268ED1V01Y201005AIM009"},{"key":"1","article-title":"Dynamic Programming and Optimal Control 3rd Edition","volume":"1 2","author":"bertsekas","year":"2007","journal-title":"Athena Scientific Series in Optimization and Neural Computation"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-23780-5_41"},{"key":"6","first-page":"221","article-title":"Efficient Inference in Markov Control Problems","author":"furmston","year":"2011","journal-title":"Proceedings of the Twenty-Seventh Conference Annual Conference on Uncertainty in Artificial Intelligence (UAI-11)"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1145\/1143844.1143963"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.2.271"},{"key":"9","article-title":"New inference strategies for solving Markov Decision Processes using reversible jump MCMC","author":"hoffman","year":"2009","journal-title":"Conference on Uncertainty in Artificial Intelligence"},{"key":"8","first-page":"1","article-title":"Trans-dimensional MCMC for Bayesian Policy Learning","volume":"20","author":"hoffman","year":"2008","journal-title":"Neural Information Processing Systems"}],"event":{"name":"2012 20th Signal Processing and Communications Applications Conference (SIU)","start":{"date-parts":[[2012,4,18]]},"location":"Mugla, Turkey","end":{"date-parts":[[2012,4,20]]}},"container-title":["2012 20th Signal Processing and Communications Applications Conference (SIU)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/6200808\/6204410\/06204703.pdf?arnumber=6204703","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,21]],"date-time":"2017-03-21T10:36:13Z","timestamp":1490092573000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6204703\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,4]]},"references-count":9,"URL":"https:\/\/doi.org\/10.1109\/siu.2012.6204703","relation":{},"subject":[],"published":{"date-parts":[[2012,4]]}}}