{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T15:28:45Z","timestamp":1774538925350,"version":"3.50.1"},"reference-count":41,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,12,12]],"date-time":"2023-12-12T00:00:00Z","timestamp":1702339200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,12,12]],"date-time":"2023-12-12T00:00:00Z","timestamp":1702339200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,12,12]]},"DOI":"10.1109\/humanoids57100.2023.10375154","type":"proceedings-article","created":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T19:32:51Z","timestamp":1704137571000},"page":"1-8","source":"Crossref","is-referenced-by-count":33,"title":["Learning Torque Control for Quadrupedal Locomotion"],"prefix":"10.1109","author":[{"given":"Shuxiao","family":"Chen","sequence":"first","affiliation":[{"name":"University of California,Department of Mechanical Engineering,Berkeley,CA,USA,94720"}]},{"given":"Bike","family":"Zhang","sequence":"additional","affiliation":[{"name":"University of California,Department of Mechanical Engineering,Berkeley,CA,USA,94720"}]},{"given":"Mark W.","family":"Mueller","sequence":"additional","affiliation":[{"name":"University of California,Department of Mechanical Engineering,Berkeley,CA,USA,94720"}]},{"given":"Akshara","family":"Rai","sequence":"additional","affiliation":[{"name":"Meta AI,CA,USA,94025"}]},{"given":"Koushil","family":"Sreenath","sequence":"additional","affiliation":[{"name":"University of California,Department of Mechanical Engineering,Berkeley,CA,USA,94720"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1177\/0956797612446346"},{"key":"ref2","article-title":"Reinforcement learning for pivoting task","author":"Antonova","year":"2017","journal-title":"arXiv preprint"},{"key":"ref3","article-title":"Robust quadruped jumping via deep reinforcement learning","author":"Bellegarda","year":"2020","journal-title":"arXiv preprint"},{"key":"ref4","article-title":"Robust high-speed running for quadruped robots via deep reinforcement learning","year":"2021","journal-title":"arXiv preprint"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1126\/scirobotics.ade2256"},{"key":"ref6","first-page":"883","article-title":"Learning a contact-adaptive controller for robust, efficient legged locomotion","volume-title":"Conference on Robot Learning","author":"Da"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8594448"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/tro.2022.3172469"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1111\/desc.13069"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1126\/scirobotics.aau5872"},{"key":"ref11","article-title":"Mnn: A universal and efficient inference engine","author":"Jiang","year":"2020","journal-title":"MLSys"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561731"},{"key":"ref13","first-page":"769","article-title":"Hierarchical apprenticeship learning with application to quadruped locomotion","volume-title":"Advances in Neural Information Processing Systems","author":"Kolter","year":"2008"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2021.XVII.011"},{"key":"ref15","article-title":"Robust recovery controller for a quadrupedal robot using deep reinforcement learning","author":"Lee","year":"2019","journal-title":"arXiv preprint"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1126\/scirobotics.abc5986"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9196642"},{"key":"ref18","article-title":"Continuous control with deep reinforce-ment learning","author":"Lillicrap","year":"2015","journal-title":"arXiv preprint"},{"key":"ref19","article-title":"Isaac gym: High performance gpu-based physics simulation for robot learning","author":"Makoviychuk","year":"2021","journal-title":"arXiv preprint"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1126\/scirobotics.abk2822"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460528"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2020.xvi.064"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3099564.3099567"},{"key":"ref24","first-page":"2817","article-title":"Robust adversar-ial reinforcement learning","volume-title":"International Conference on Machine Learning","author":"Pinto"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.3182\/20080706-5-KR-1001.01833"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/MEX.1986.4307016"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3424636.3426907"},{"key":"ref28","first-page":"91","article-title":"Learning to walk in minutes using massively parallel deep reinforcement learning","volume-title":"Conference on Robot Learning","author":"Rudin"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.29007\/czvx"},{"key":"ref30","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017","journal-title":"arXiv preprint"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3145495"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561814"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812166"},{"key":"ref34","article-title":"A walk in the park: Learning to walk in 20 minutes with model-free reinforcement learning","author":"Smith","year":"2022","journal-title":"arXiv preprint"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2021.3108510"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2018.XIV.010"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/IROS40897.2019.8967946"},{"key":"ref38","article-title":"Day-dreamer: World models for physical robot learning","author":"Wu","year":"2022","journal-title":"arXiv preprint"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9560837"},{"key":"ref40","first-page":"773","article-title":"Fast and efficient locomotion via learned gait transitions","volume-title":"Conference on Robot Learning","author":"Yang"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160836"}],"event":{"name":"2023 IEEE-RAS 22nd International Conference on Humanoid Robots (Humanoids)","location":"Austin, TX, USA","start":{"date-parts":[[2023,12,12]]},"end":{"date-parts":[[2023,12,14]]}},"container-title":["2023 IEEE-RAS 22nd International Conference on Humanoid Robots (Humanoids)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10375141\/10374561\/10375154.pdf?arnumber=10375154","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,12]],"date-time":"2024-01-12T23:52:39Z","timestamp":1705103559000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10375154\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12,12]]},"references-count":41,"URL":"https:\/\/doi.org\/10.1109\/humanoids57100.2023.10375154","relation":{},"subject":[],"published":{"date-parts":[[2023,12,12]]}}}