{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,27]],"date-time":"2026-05-27T19:21:58Z","timestamp":1779909718125,"version":"3.53.1"},"reference-count":24,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"10","license":[{"start":{"date-parts":[[2023,10,1]],"date-time":"2023-10-01T00:00:00Z","timestamp":1696118400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Robot. Autom. Lett."],"published-print":{"date-parts":[[2023,10]]},"DOI":"10.1109\/lra.2023.3303786","type":"journal-article","created":{"date-parts":[[2023,8,9]],"date-time":"2023-08-09T17:35:01Z","timestamp":1691602501000},"page":"6243-6250","source":"Crossref","is-referenced-by-count":7,"title":["Reinforcement Learning With Energy-Exchange Dynamics for Spring-Loaded Biped Robot Walking"],"prefix":"10.1109","volume":"8","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3085-0343","authenticated-orcid":false,"given":"Cheng-Yu","family":"Kuo","sequence":"first","affiliation":[{"name":"Graduate School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0265-3710","authenticated-orcid":false,"given":"Hirofumi","family":"Shin","sequence":"additional","affiliation":[{"name":"Honda R&amp;D, Ltd., Saitama, Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3545-4814","authenticated-orcid":false,"given":"Takamitsu","family":"Matsubara","sequence":"additional","affiliation":[{"name":"Graduate School of Science and Technology, Nara Institute of Science and Technology, Nara, Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9811962"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TRO.2022.3228713"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/Humanoids53995.2022.9999741"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/Humanoids53995.2022.10000225"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9811541"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/s10472-015-9463-9"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2021.3066833"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561814"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812154"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9560769"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553403"},{"key":"ref12","first-page":"1701","article-title":"Data-efficient reinforcement learning with probabilistic model predictive control","volume-title":"Proc. Int. Conf. Artif. Intell. Statist.","author":"Kamthe","year":"2018"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1561\/2200000086"},{"key":"ref14","first-page":"II829","article-title":"Learning complex neural network policies with trajectory optimization","volume-title":"Proc. 31st Int. Conf. Int. Conf. Mach. Learn.","author":"Levine","year":"2014"},{"key":"ref15","first-page":"1539","article-title":"Minimax differential dynamic programming: An application to robust biped walking","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Morimoto","year":"2002"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6385955"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1002\/rob.21990"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9197449"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/Humanoids53995.2022.10000180"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2021.3065271"},{"key":"ref21","first-page":"465","article-title":"PILCO: A model-based and data-efficient approach to policy search","volume-title":"Proc. 28th Int. Conf. Int. Conf. Mach. Learn.","author":"Deisenroth","year":"2011"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1561\/2300000038"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/3074.001.0001"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1038\/s41598-021-01694-5"}],"container-title":["IEEE Robotics and Automation Letters"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7083369\/10220574\/10214113.pdf?arnumber=10214113","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,13]],"date-time":"2024-03-13T22:53:54Z","timestamp":1710370434000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10214113\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10]]},"references-count":24,"journal-issue":{"issue":"10"},"URL":"https:\/\/doi.org\/10.1109\/lra.2023.3303786","relation":{},"ISSN":["2377-3766","2377-3774"],"issn-type":[{"value":"2377-3766","type":"electronic"},{"value":"2377-3774","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,10]]}}}