{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,29]],"date-time":"2025-08-29T10:09:11Z","timestamp":1756462151613},"reference-count":18,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009,5]]},"DOI":"10.1109\/robot.2009.5152707","type":"proceedings-article","created":{"date-parts":[[2009,8,24]],"date-time":"2009-08-24T11:04:04Z","timestamp":1251111844000},"page":"2125-2132","source":"Crossref","is-referenced-by-count":9,"title":["Smoothed Sarsa: Reinforcement learning for robot delivery tasks"],"prefix":"10.1109","author":[{"given":"Deepak","family":"Ramachandran","sequence":"first","affiliation":[]},{"given":"Rakesh","family":"Gupta","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","article-title":"FastSLAM: A factored solution to the simultaneous localization and mapping problem","author":"montemerlo","year":"2002","journal-title":"Proceedings of the AAAI National Conference on Artificial Intelligence"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1177\/0278364904048962"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4757-3437-9"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(98)00023-X"},{"key":"ref14","first-page":"317","article-title":"The player\/stage project: Tools for multi-robot and distributed sensor systems","author":"gerkey","year":"2003","journal-title":"Proceedings of the 11th International Conference on Advanced Robotics"},{"article-title":"People detection in 3-dimensions on STAIR","year":"2008","author":"goodfellow","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/1349822.1349855"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ROMAN.2008.4600738"},{"key":"ref18","first-page":"442","article-title":"Planning and learning in environments with delayed feedback","author":"walsh","year":"2007","journal-title":"ECML-07"},{"article-title":"On-line $q$-learning using connectionist systems","year":"1994","author":"rummery","key":"ref4"},{"journal-title":"Reinforcement Learning","year":"1998","author":"sutton","key":"ref3"},{"key":"ref6","first-page":"91","article-title":"Xavier: A robot navigation architecture based on partially observable markov decision process models","author":"koenig","year":"1998","journal-title":"Artificial Intelligence Based Mobile Robotics Case Studies of Successful Robot Systems"},{"key":"ref5","article-title":"Approximate planning in POMDPs with macro-actions","author":"theocharous","year":"2004","journal-title":"Advances in Neural Information Processing Systems 16 (NIPS)"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2004.1307420"},{"key":"ref7","first-page":"1080","article-title":"Probabilistic robot navigation in partially observable environments","author":"simmons","year":"1995","journal-title":"Proceedings of the International Joint Conference on Artificial Intelligence (IJCAI)"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/S0921-8890(02)00381-0"},{"key":"ref1","doi-asserted-by":"crossref","DOI":"10.1109\/ROBOT.1998.680906","article-title":"Hybrid, high-precision localization for mail distribution mobile system robot mops","author":"arras","year":"1998","journal-title":"Proceedings of the IEEE International Conference on Robotics and Automation (ICRA)"},{"key":"ref9","article-title":"PEGASUS: A policy search method for large MDPs and POMDPs","author":"ng","year":"2000","journal-title":"Proceedings of the Sixteenth Conference in Uncertainty in Artificial Intelligence (UAI)"}],"event":{"name":"2009 IEEE International Conference on Robotics and Automation (ICRA)","start":{"date-parts":[[2009,5,12]]},"location":"Kobe","end":{"date-parts":[[2009,5,17]]}},"container-title":["2009 IEEE International Conference on Robotics and Automation"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/5076472\/5152175\/05152707.pdf?arnumber=5152707","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,18]],"date-time":"2017-06-18T19:05:15Z","timestamp":1497812715000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/5152707\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,5]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/robot.2009.5152707","relation":{},"subject":[],"published":{"date-parts":[[2009,5]]}}}