{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,14]],"date-time":"2026-04-14T11:41:26Z","timestamp":1776166886036,"version":"3.50.1"},"reference-count":31,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100003453","name":"Guangdong Provincial Natural Science Foundation","doi-asserted-by":"publisher","award":["2024A1515012637"],"award-info":[{"award-number":["2024A1515012637"]}],"id":[{"id":"10.13039\/501100003453","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Advanced Engineering Informatics"],"published-print":{"date-parts":[[2026,9]]},"DOI":"10.1016\/j.aei.2026.104659","type":"journal-article","created":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T13:16:54Z","timestamp":1775567814000},"page":"104659","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"PA","title":["Concurrent training of teacher-student networks and state estimator with a single optimizer for dynamic wheeled bipedal robots locomotion"],"prefix":"10.1016","volume":"74","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7581-6774","authenticated-orcid":false,"given":"Yanbiao","family":"Zou","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0005-2568-9961","authenticated-orcid":false,"given":"Yizan","family":"Qiu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9716-3970","authenticated-orcid":false,"given":"Tie","family":"Zhang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0008-1608-7362","authenticated-orcid":false,"given":"Xuming","family":"Guo","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.aei.2026.104659_b0005","series-title":"2019 International Conference on Robotics and Automation (ICRA)","first-page":"7515","article-title":"Ascento: a two-wheeled jumping robot","author":"Klemm","year":"2019"},{"key":"10.1016\/j.aei.2026.104659_b0010","doi-asserted-by":"crossref","first-page":"607","DOI":"10.1007\/s42235-023-00468-1","article-title":"Development of wheel-legged biped robots: a review","volume":"21","author":"Liu","year":"2024","journal-title":"J. Bionic Eng."},{"key":"10.1016\/j.aei.2026.104659_b0015","series-title":"Proceedings of 1993 IEEE\/Tsukuba International Workshop on Advanced Robotics","first-page":"109","article-title":"Leg-wheel robot: a futuristic mobile platform for forestry industry","author":"Eiji","year":"1993"},{"key":"10.1016\/j.aei.2026.104659_b0020","series-title":"2019 IEEE-RAS 19th International Conference on Humanoid Robots (Humanoids)","first-page":"1","article-title":"Model decoupling and control of the wheeled humanoid robot moving in sagittal plane","author":"Zhou","year":"2019"},{"key":"10.1016\/j.aei.2026.104659_b0025","series-title":"2019 IEEE International Conference on Robotics and Biomimetics (ROBIO)","first-page":"1875","article-title":"Dynamic height balance control for bipedal wheeled robot based on ROS-gazebo","author":"Liu","year":"2019"},{"key":"10.1016\/j.aei.2026.104659_b0030","doi-asserted-by":"crossref","first-page":"3745","DOI":"10.1109\/LRA.2020.2979625","article-title":"LQR-assisted whole-body control of a wheeled bipedal robot with kinematic loops","volume":"5","author":"Klemm","year":"2020","journal-title":"IEEE Robot. Autom. Lett."},{"key":"10.1016\/j.aei.2026.104659_b0035","series-title":"2021 IEEE International Conference on Robotics and Automation (ICRA)","first-page":"6782","article-title":"Balance control of a novel wheel-legged robot: design and experiments","author":"Wang","year":"2021"},{"key":"10.1016\/j.aei.2026.104659_b0040","series-title":"2020 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","first-page":"3892","article-title":"Online dynamic motion planning and control for wheeled biped robots","author":"Xin","year":"2020"},{"key":"10.1016\/j.aei.2026.104659_b0045","doi-asserted-by":"crossref","first-page":"7881","DOI":"10.1109\/LRA.2023.3322084","article-title":"Modeling and MPC-based pose tracking for wheeled bipedal robot","volume":"8","author":"Yu","year":"2023","journal-title":"IEEE Robot. Autom. Lett."},{"key":"10.1016\/j.aei.2026.104659_b0050","doi-asserted-by":"crossref","first-page":"180630","DOI":"10.1109\/ACCESS.2019.2959333","article-title":"Speed and acceleration control for a two wheel-leg robot based on distributed dynamic model and whole-body control","volume":"7","author":"Xin","year":"2019","journal-title":"IEEE Access"},{"key":"10.1016\/j.aei.2026.104659_b0055","doi-asserted-by":"crossref","DOI":"10.1016\/j.apm.2024.115737","article-title":"A novel adaptive dynamic optimal balance control method for wheel-legged robot","volume":"137","author":"Liu","year":"2025","journal-title":"App. Math. Model."},{"key":"10.1016\/j.aei.2026.104659_b0060","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2022.101787","article-title":"Robotics in construction: a critical review of the reinforcement learning and imitation learning paradigms","volume":"54","author":"Manuel Davila Delgado","year":"2022","journal-title":"Adv. Eng. Inf."},{"key":"10.1016\/j.aei.2026.104659_b0065","doi-asserted-by":"crossref","first-page":"26","DOI":"10.1109\/MSP.2017.2743240","article-title":"Deep reinforcement learning: a brief survey","volume":"34","author":"Arulkumaran","year":"2017","journal-title":"IEEE Signal Process Mag."},{"key":"10.1016\/j.aei.2026.104659_b0070","doi-asserted-by":"crossref","DOI":"10.1126\/scirobotics.aau5872","article-title":"Learning agile and dynamic motor skills for legged robots","volume":"4","author":"Hwangbo","year":"2019","journal-title":"Sci. Robot."},{"key":"10.1016\/j.aei.2026.104659_b0075","doi-asserted-by":"crossref","DOI":"10.1126\/scirobotics.abc5986","article-title":"Learning quadrupedal locomotion over challenging terrain","volume":"5","author":"Lee","year":"2020","journal-title":"Sci. Robot."},{"key":"10.1016\/j.aei.2026.104659_b0080","doi-asserted-by":"crossref","unstructured":"A. Kumar, Z. Fu, D. Pathak, J. Malik, RMA: Rapid Motor Adaptation for Legged Robots, in: Robotics: Science and Systems XVII, Robotics: Science and Systems Foundation, 2021. https:\/\/doi.org\/10.15607\/RSS.2021.XVII.011.","DOI":"10.15607\/RSS.2021.XVII.011"},{"key":"10.1016\/j.aei.2026.104659_b0085","doi-asserted-by":"crossref","first-page":"4630","DOI":"10.1109\/LRA.2022.3151396","article-title":"Concurrent training of a control policy and a state estimator for dynamic and robust legged locomotion","volume":"7","author":"Ji","year":"2022","journal-title":"IEEE Robot. Autom. Lett."},{"key":"10.1016\/j.aei.2026.104659_b0090","doi-asserted-by":"crossref","DOI":"10.1126\/scirobotics.abk2822","article-title":"Learning robust perceptive locomotion for quadrupedal robots in the wild","volume":"7","author":"Miki","year":"2022","journal-title":"Sci. Robot."},{"key":"10.1016\/j.aei.2026.104659_b0095","unstructured":"N. Rudin, D. Hoeller, P. Reist, M. Hutter, Learning to Walk in Minutes Using Massively Parallel Deep Reinforcement Learning, (2022). http:\/\/arxiv.org\/abs\/2109.11978 (accessed October 17, 2024)."},{"key":"10.1016\/j.aei.2026.104659_b0100","series-title":"2023 IEEE International Conference on Robotics and Automation (ICRA)","first-page":"5078","article-title":"DreamWaQ: learning robust quadrupedal locomotion with implicit terrain imagination via deep reinforcement learning","author":"Aswin Nahrendra","year":"2023"},{"key":"10.1016\/j.aei.2026.104659_b0105","doi-asserted-by":"crossref","first-page":"4019","DOI":"10.1109\/LRA.2024.3375086","article-title":"MorAL: learning morphologically adaptive locomotion controller for quadrupedal robots on challenging terrains","volume":"9","author":"Luo","year":"2024","journal-title":"IEEE Robot. Autom. Lett."},{"key":"10.1016\/j.aei.2026.104659_b0110","doi-asserted-by":"crossref","first-page":"7667","DOI":"10.1109\/LRA.2021.3100269","article-title":"Learning-based balance control of wheel-legged robots","volume":"6","author":"Cui","year":"2021","journal-title":"IEEE Robot. Autom. Lett."},{"key":"10.1016\/j.aei.2026.104659_b0115","series-title":"2024 IEEE International Conference on Robotics and Automation (ICRA)","first-page":"8081","article-title":"Reinforcement learning for blind stair climbing with legged and wheeled-legged robots","author":"Chamorro","year":"2024"},{"key":"10.1016\/j.aei.2026.104659_b0120","unstructured":"J. Schulman, F. Wolski, P. Dhariwal, A. Radford, O. Klimov, Proximal policy optimization algorithms, (2017). http:\/\/arxiv.org\/abs\/1707.06347 (accessed October 24, 2024)."},{"key":"10.1016\/j.aei.2026.104659_b0125","series-title":"Arm-Constrained Curriculum Learning for Loco-Manipulation of a Wheel-Legged Robot","first-page":"10770","author":"Wang","year":"2024"},{"key":"10.1016\/j.aei.2026.104659_b0130","first-page":"23","article-title":"Domain randomization for transferring deep neural networks from simulation to the real world","volume":"2017","author":"Tobin","year":"2017","journal-title":"IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"},{"key":"10.1016\/j.aei.2026.104659_b0135","series-title":"Robotics: Science and Systems XIV","article-title":"Sim-to-real: learning agile locomotion for quadruped robots","author":"Tan","year":"2018"},{"key":"10.1016\/j.aei.2026.104659_b0140","series-title":"Dynamics Randomization Revisited: A Case Study for Quadrupedal Locomotion","first-page":"4955","author":"Xie","year":"2021"},{"key":"10.1016\/j.aei.2026.104659_b0145","doi-asserted-by":"crossref","first-page":"9191","DOI":"10.1109\/LRA.2024.3457379","article-title":"CTS: concurrent teacher-student reinforcement learning for legged locomotion","volume":"9","author":"Wang","year":"2024","journal-title":"IEEE Robot. Autom. Lett."},{"key":"10.1016\/j.aei.2026.104659_b0150","doi-asserted-by":"crossref","DOI":"10.1016\/j.robot.2023.104550","article-title":"Stable skill improvement of quadruped robot based on privileged information and curriculum guidance","volume":"170","author":"Jiang","year":"2023","journal-title":"Rob. Auton. Syst."},{"key":"10.1016\/j.aei.2026.104659_b0155","unstructured":"V. Makoviychuk, L. Wawrzyniak, Y. Guo, M. Lu, K. Storey, M. Macklin, D. Hoeller, N. Rudin, A. Allshire, A. Handa, G. State, Isaac Gym: High Performance GPU-Based Physics Simulation For Robot Learning, (2021). https:\/\/doi.org\/10.48550\/arXiv.2108.10470."}],"container-title":["Advanced Engineering Informatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1474034626003514?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1474034626003514?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,4,14]],"date-time":"2026-04-14T10:36:12Z","timestamp":1776162972000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1474034626003514"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,9]]},"references-count":31,"alternative-id":["S1474034626003514"],"URL":"https:\/\/doi.org\/10.1016\/j.aei.2026.104659","relation":{},"ISSN":["1474-0346"],"issn-type":[{"value":"1474-0346","type":"print"}],"subject":[],"published":{"date-parts":[[2026,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Concurrent training of teacher-student networks and state estimator with a single optimizer for dynamic wheeled bipedal robots locomotion","name":"articletitle","label":"Article Title"},{"value":"Advanced Engineering Informatics","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.aei.2026.104659","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Ltd. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"104659"}}