{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,29]],"date-time":"2025-10-29T19:03:46Z","timestamp":1761764626846,"version":"3.28.0"},"reference-count":18,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1109\/robot.2005.1570759","type":"proceedings-article","created":{"date-parts":[[2006,1,18]],"date-time":"2006-01-18T18:42:54Z","timestamp":1137609774000},"page":"4164-4169","source":"Crossref","is-referenced-by-count":15,"title":["Learning Sensory Feedback to CPG with Policy Gradient for Biped Locomotion"],"prefix":"10.1109","author":[{"given":"T.","family":"Matsubara","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Jun Morimoto","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Jun Nakanishi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"M.","family":"Sato","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"K.","family":"Doya","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"year":"0","key":"17"},{"key":"18","first-page":"623","article-title":"Reinforcement learning for a CPG-driven biped robot","author":"mori","year":"2004","journal-title":"Proceedings of the Nineteenth National Conference on Artificial Intelligence (AAAI'04)"},{"year":"0","key":"15"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.1998.677288"},{"key":"13","article-title":"Reinforcement learning for humanoid robotics","author":"peters","year":"2003","journal-title":"Humanoids2003 Third IEEE-RAS International Conference on Humanoid Robots"},{"key":"14","first-page":"329","article-title":"Autobalancer: An online dynamic balance compensation scheme for humanoid robots","author":"kagami","year":"2001","journal-title":"Algorithmic and Computational Robotics New Directions"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2003.1248926"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1162\/089976600300015961"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2004.1307523"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1007\/BF00198086"},{"key":"1","doi-asserted-by":"publisher","DOI":"10.1007\/BF00449593"},{"year":"0","key":"10"},{"key":"7","first-page":"278","article-title":"An analysis of actor\/critic algorithms using eligibility traces: Reinforcement learning with imperfect value function","author":"kimura","year":"1998","journal-title":"Internatinal Conference on Machine Learning"},{"key":"6","first-page":"777","article-title":"Reinforcement learning for biped locomotion","author":"sato","year":"2002","journal-title":"International Conference on Artificial Neural Networks"},{"key":"5","doi-asserted-by":"publisher","DOI":"10.1537\/ase.106.327"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1177\/0278364903022003004"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1137\/S036301299731669X"},{"key":"8","first-page":"1057","article-title":"Policy gradient methods for reinforcement learning with function approximation","volume":"12","author":"sutton","year":"2000","journal-title":"Advances in neural information processing systems"}],"event":{"name":"2005 IEEE International Conference on Robotics and Automation","location":"Barcelona, Spain"},"container-title":["Proceedings of the 2005 IEEE International Conference on Robotics and Automation"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/10495\/33250\/01570759.pdf?arnumber=1570759","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,14]],"date-time":"2017-03-14T17:04:49Z","timestamp":1489511089000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/1570759\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/robot.2005.1570759","relation":{},"subject":[]}}