{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T01:40:56Z","timestamp":1777945256788,"version":"3.51.4"},"reference-count":28,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Robotics and Autonomous Systems"],"published-print":{"date-parts":[[2026,7]]},"DOI":"10.1016\/j.robot.2026.105428","type":"journal-article","created":{"date-parts":[[2026,3,18]],"date-time":"2026-03-18T17:23:58Z","timestamp":1773854638000},"page":"105428","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["A deep reinforcement learning based hierarchical obstacle crossing planner for multi-robot cooperative transportation"],"prefix":"10.1016","volume":"201","author":[{"given":"Wenzhe","family":"Yin","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3816-935X","authenticated-orcid":false,"given":"Guowei","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhibo","family":"Pang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/j.robot.2026.105428_b1","doi-asserted-by":"crossref","first-page":"222","DOI":"10.1016\/j.rcim.2017.12.003","article-title":"Automated material handling in composite manufacturing using pick-and-place systems\u2013a review","volume":"51","author":"Bj\u00f6rnsson","year":"2018","journal-title":"Robot. Comput.-Integr. Manuf."},{"key":"10.1016\/j.robot.2026.105428_b2","series-title":"2017 25th Mediterranean Conference on Control and Automation","first-page":"701","article-title":"A review on multi-robot systems categorised by application domain","author":"Darmanin","year":"2017"},{"issue":"1","key":"10.1016\/j.robot.2026.105428_b3","first-page":"21","article-title":"A review of task allocation and motion planning for multi-robot in major equipment manufacturing","volume":"50","author":"Zhen-Guo","year":"2024","journal-title":"Acta Automat. Sinica"},{"issue":"1","key":"10.1016\/j.robot.2026.105428_b4","doi-asserted-by":"crossref","first-page":"205","DOI":"10.1146\/annurev-control-042920-095844","article-title":"Multirobot control strategies for collective transport","volume":"5","author":"Farivarnejad","year":"2022","journal-title":"Annu. Rev. Control. Robot. Auton. Syst."},{"key":"10.1016\/j.robot.2026.105428_b5","doi-asserted-by":"crossref","first-page":"34","DOI":"10.1016\/j.robot.2016.08.010","article-title":"Advanced approaches for multi-robot coordination in logistic scenarios","volume":"90","author":"Farinelli","year":"2017","journal-title":"Robot. Auton. Syst."},{"issue":"9","key":"10.1016\/j.robot.2026.105428_b6","doi-asserted-by":"crossref","first-page":"1000","DOI":"10.1177\/0278364917719333","article-title":"Multi-robot formation control and object transport in dynamic environments via constrained optimization","volume":"36","author":"Alonso-Mora","year":"2017","journal-title":"Int. J. Robot. Res."},{"key":"10.1016\/j.robot.2026.105428_b7","doi-asserted-by":"crossref","DOI":"10.1016\/j.robot.2024.104773","article-title":"A decoupled solution to heterogeneous multi-formation planning and coordination for object transportation","volume":"180","author":"Zhang","year":"2024","journal-title":"Robot. Auton. Syst."},{"key":"10.1016\/j.robot.2026.105428_b8","doi-asserted-by":"crossref","DOI":"10.1109\/LRA.2025.3597895","article-title":"Multi-robot cooperative transportation of irregular objects by multi-objective optimization with distributed control","author":"Tian","year":"2025","journal-title":"IEEE Robot. Autom. Lett."},{"issue":"1","key":"10.1016\/j.robot.2026.105428_b9","doi-asserted-by":"crossref","first-page":"343","DOI":"10.1007\/s40747-023-01178-1","article-title":"A discrete-time distributed optimization algorithm for cooperative transportation of multi-robot system","volume":"10","author":"Meng","year":"2024","journal-title":"Complex & Intell. Syst."},{"issue":"4","key":"10.1016\/j.robot.2026.105428_b10","doi-asserted-by":"crossref","first-page":"7027","DOI":"10.1109\/TASE.2023.3336076","article-title":"Distributed multi-vehicle task assignment and motion planning in dense environments","volume":"21","author":"Xu","year":"2023","journal-title":"IEEE Trans. Autom. Sci. Eng."},{"key":"10.1016\/j.robot.2026.105428_b11","doi-asserted-by":"crossref","DOI":"10.1016\/j.robot.2021.103993","article-title":"Cooperative distributed nonlinear model predictive control of a formation of differentially-driven mobile robots","volume":"150","author":"Rosenfelder","year":"2022","journal-title":"Robot. Auton. Syst."},{"issue":"8","key":"10.1016\/j.robot.2026.105428_b12","doi-asserted-by":"crossref","first-page":"11811","DOI":"10.1109\/TITS.2021.3107336","article-title":"Learning-based multi-robot formation control with obstacle avoidance","volume":"23","author":"Bai","year":"2021","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"10.1016\/j.robot.2026.105428_b13","doi-asserted-by":"crossref","DOI":"10.1016\/j.rcim.2023.102570","article-title":"Hierarchical multi-robot navigation and formation in unknown environments via deep reinforcement learning and distributed optimization","volume":"83","author":"Chang","year":"2023","journal-title":"Robot. Comput.-Integr. Manuf."},{"key":"10.1016\/j.robot.2026.105428_b14","doi-asserted-by":"crossref","first-page":"61","DOI":"10.1016\/j.neunet.2023.11.063","article-title":"Distributed deep reinforcement learning based on bi-objective framework for multi-robot formation","volume":"171","author":"Li","year":"2024","journal-title":"Neural Netw."},{"key":"10.1016\/j.robot.2026.105428_b15","doi-asserted-by":"crossref","DOI":"10.1109\/TIE.2025.3581265","article-title":"Deep reinforcement learning-based cooperative control for multimobile robots with obstacle avoidance","author":"Fu","year":"2025","journal-title":"IEEE Trans. Ind. Electron."},{"key":"10.1016\/j.robot.2026.105428_b16","series-title":"2025 37th Chinese Control and Decision Conference","first-page":"2179","article-title":"Distributed shape formation and obstacle avoidance method for multi-agent systems based on graph","author":"Xiao","year":"2025"},{"key":"10.1016\/j.robot.2026.105428_b17","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2024.125900","article-title":"Multirobot unknown environment exploration and obstacle avoidance based on a Voronoi diagram and reinforcement learning","volume":"264","author":"Zhao","year":"2025","journal-title":"Expert Syst. Appl."},{"issue":"5","key":"10.1016\/j.robot.2026.105428_b18","doi-asserted-by":"crossref","first-page":"4346","DOI":"10.1109\/TITS.2023.3330183","article-title":"Safe reinforcement learning-based motion planning for functional mobile robots suffering uncontrollable mobile robots","volume":"25","author":"Cao","year":"2023","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"10.1016\/j.robot.2026.105428_b19","series-title":"Why does hierarchy (sometimes) work so well in reinforcement learning?","author":"Nachum","year":"2019"},{"key":"10.1016\/j.robot.2026.105428_b20","article-title":"Data-efficient hierarchical reinforcement learning","volume":"31","author":"Nachum","year":"2018","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.robot.2026.105428_b21","unstructured":"A. Levy, G. Konidaris, R. Platt, K. Saenko, Learning multi-level hierarchies with hindsight, in: Proceedings of International Conference on Learning Representations, 2019."},{"key":"10.1016\/j.robot.2026.105428_b22","doi-asserted-by":"crossref","unstructured":"P.-L. Bacon, J. Harb, D. Precup, The option-critic architecture, in: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 31, 2017.","DOI":"10.1609\/aaai.v31i1.10916"},{"key":"10.1016\/j.robot.2026.105428_b23","series-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017"},{"key":"10.1016\/j.robot.2026.105428_b24","series-title":"2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems","first-page":"3052","article-title":"Motion planning among dynamic, decision-making agents with deep reinforcement learning","author":"Everett","year":"2018"},{"key":"10.1016\/j.robot.2026.105428_b25","series-title":"High-dimensional continuous control using generalized advantage estimation","author":"Schulman","year":"2015"},{"key":"10.1016\/j.robot.2026.105428_b26","series-title":"2012 IEEE\/RSJ International Conference on Intelligent Robots and Systems","first-page":"5026","article-title":"Mujoco: A physics engine for model-based control","author":"Todorov","year":"2012"},{"key":"10.1016\/j.robot.2026.105428_b27","unstructured":"L. Engstrom, A. Ilyas, S. Santurkar, D. Tsipras, F. Janoos, L. Rudolph, A. Madry, Implementation matters in deep rl: A case study on ppo and trpo, in: International Conference on Learning Representations, 2019."},{"key":"10.1016\/j.robot.2026.105428_b28","doi-asserted-by":"crossref","first-page":"714","DOI":"10.1109\/TRO.2023.3339989","article-title":"A novel graph-based motion planner of multi-mobile robot systems with formation and obstacle constraints","volume":"40","author":"Liu","year":"2023","journal-title":"IEEE Trans. Robot."}],"container-title":["Robotics and Autonomous Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0921889026001016?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0921889026001016?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T10:38:59Z","timestamp":1777718339000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0921889026001016"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,7]]},"references-count":28,"alternative-id":["S0921889026001016"],"URL":"https:\/\/doi.org\/10.1016\/j.robot.2026.105428","relation":{},"ISSN":["0921-8890"],"issn-type":[{"value":"0921-8890","type":"print"}],"subject":[],"published":{"date-parts":[[2026,7]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"A deep reinforcement learning based hierarchical obstacle crossing planner for multi-robot cooperative transportation","name":"articletitle","label":"Article Title"},{"value":"Robotics and Autonomous Systems","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.robot.2026.105428","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier B.V. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"105428"}}