{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,23]],"date-time":"2026-01-23T21:40:12Z","timestamp":1769204412897,"version":"3.49.0"},"reference-count":30,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,11]]},"DOI":"10.1109\/humanoids.2018.8625045","type":"proceedings-article","created":{"date-parts":[[2019,1,25]],"date-time":"2019-01-25T02:51:38Z","timestamp":1548384698000},"page":"270-276","source":"Crossref","is-referenced-by-count":20,"title":["Learning Whole-Body Motor Skills for Humanoids"],"prefix":"10.1109","author":[{"given":"Chuanyu","family":"Yang","sequence":"first","affiliation":[]},{"given":"Kai","family":"Yuan","sequence":"additional","affiliation":[]},{"given":"Wolfgang","family":"Merkt","sequence":"additional","affiliation":[]},{"given":"Taku","family":"Komura","sequence":"additional","affiliation":[]},{"given":"Sethu","family":"Vijayakumar","sequence":"additional","affiliation":[]},{"given":"Zhibin","family":"Li","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICHR.2010.5686288"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICHR.2006.321375"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICHR.2006.321385"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TBME.2005.851530"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/Humanoids.2011.6100894"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8461101"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/HUMANOIDS.2017.8246970"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/HUMANOIDS.2017.8239534"},{"key":"ref17","article-title":"Stabilizing humanoids on slopes using terrain inclination estimation","author":"li","year":"2013","journal-title":"IROS"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/HUMANOIDS.2016.7803247"},{"key":"ref19","article-title":"Emergence of locomotion behaviours in rich environments","author":"heess","year":"2017","journal-title":"arXiv 1707 02286"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3099564.3099567"},{"key":"ref4","article-title":"Proximal policy optimization algorithms","author":"schulman","year":"2017","journal-title":"arXiv 1707 06347"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/HUMANOIDS.2017.8246900"},{"key":"ref3","article-title":"Continuous control with deep reinforcement learning","author":"lillicrap","year":"2015","journal-title":"arXiv 1509 02971"},{"key":"ref6","doi-asserted-by":"crossref","DOI":"10.1145\/3072959.3073602","article-title":"DeepLoco: Dynamic locomotion skills using hierarchical deep reinforcement learning","author":"peng","year":"2017","journal-title":"Transactions on Graphics"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2006.04.007"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-95972-6_29"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICHR.2007.4813931"},{"key":"ref7","article-title":"Learning symmetry and low-energy locomotion","author":"yu","year":"2018","journal-title":"arXiv 1801 08093"},{"key":"ref2","article-title":"Trust region policy optimization","author":"schulman","year":"0","journal-title":"ICML 2015"},{"key":"ref9","article-title":"Humanoid balancing behavior featured by underactuated foot motion","author":"li","year":"2017","journal-title":"T-RO"},{"key":"ref1","article-title":"An improved formulation for model predictive control of leggedrobots for gait planning and feedback control","author":"yuan","year":"2018","journal-title":"IROS"},{"key":"ref20","article-title":"Generative adversarial imitation learning","author":"ho","year":"2016","journal-title":"NIPS"},{"key":"ref22","article-title":"Deepmimic: Example-guided deep reinforcement learning of physics-based character skills","author":"peng","year":"2018","journal-title":"arXiv 1804 02717"},{"key":"ref21","article-title":"Learning human behaviors from motion capture by adversarial imitation","author":"merel","year":"2017","journal-title":"arXiv 1707 02201"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1002\/rob.21560"},{"key":"ref23","author":"coumans","year":"0","journal-title":"Pybullet physics engine"},{"key":"ref26","article-title":"High-dimensional continuous control using generalized advantage estimation","author":"schulman","year":"2015","journal-title":"arXiv 1506 02438 [cs]"},{"key":"ref25","author":"abadi","year":"2015","journal-title":"TensorFlow Large-Scale Machine Learning on Heterogeneous Systems"}],"event":{"name":"2018 IEEE-RAS 18th International Conference on Humanoid Robots (Humanoids)","location":"Beijing, China","start":{"date-parts":[[2018,11,6]]},"end":{"date-parts":[[2018,11,9]]}},"container-title":["2018 IEEE-RAS 18th International Conference on Humanoid Robots (Humanoids)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8596719\/8624912\/08625045.pdf?arnumber=8625045","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,26]],"date-time":"2022-01-26T22:43:59Z","timestamp":1643237039000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8625045\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/humanoids.2018.8625045","relation":{},"subject":[],"published":{"date-parts":[[2018,11]]}}}