{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,16]],"date-time":"2026-06-16T15:12:29Z","timestamp":1781622749564,"version":"3.54.5"},"reference-count":33,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,5,13]],"date-time":"2024-05-13T00:00:00Z","timestamp":1715558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,5,13]],"date-time":"2024-05-13T00:00:00Z","timestamp":1715558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,5,13]]},"DOI":"10.1109\/icra57147.2024.10611573","type":"proceedings-article","created":{"date-parts":[[2024,8,8]],"date-time":"2024-08-08T17:51:05Z","timestamp":1723139465000},"page":"5155-5161","source":"Crossref","is-referenced-by-count":6,"title":["MAexp: A Generic Platform for RL-based Multi-Agent Exploration"],"prefix":"10.1109","author":[{"given":"Shaohao","family":"Zhu","sequence":"first","affiliation":[{"name":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jiacheng","family":"Zhou","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Anjun","family":"Chen","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mingming","family":"Bai","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jiming","family":"Chen","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jinming","family":"Xu","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1002\/rob.21597"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.3390\/s22051824"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561328"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2006.1641761"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2016.2520560"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3224667"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19842-7_29"},{"key":"ref8","author":"Samvelyan","year":"2019","journal-title":"The starcraft multi-agent challenge"},{"key":"ref9","author":"Baker","year":"2019","journal-title":"Emergent tool use from multi-agent autocurricula"},{"key":"ref10","author":"Wang","year":"2021","journal-title":"Collaborative visual navigation"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICUAS57906.2023.10156452"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/AGENTS.2019.8929192"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812344"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3146912"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.3390\/e21030294"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICPADS51040.2020.00032"},{"key":"ref17","article-title":"Multi-agent actor-critic for mixed cooperative-competitive environments","volume":"30","author":"Lowe","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref18","article-title":"Habitat 2.0: Training home assistants to rearrange their habitat","author":"Szot","year":"2021","journal-title":"Advances in Neural Information Processing Systems (NeurIPS)"},{"key":"ref19","author":"Hu","year":"2022","journal-title":"Marllib: Extending rllib for multi-agent reinforcement learning"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10161030"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10161129"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM.2019.8737442"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2019.2915221"},{"key":"ref24","article-title":"Stpls3d: A large-scale synthetic and real aerial photogrammetry 3d point cloud dataset","volume-title":"33rd British Machine Vision Conference 2022, BMVC 2022, London, UK, November 21-24, 2022","author":"Chen"},{"key":"ref25","author":"Schulman","year":"2017","journal-title":"Proximal policy optimization algorithms"},{"key":"ref26","first-page":"1928","article-title":"Asynchronous methods for deep reinforcement learning","volume-title":"International conference on machine learning","author":"Mnih"},{"key":"ref27","first-page":"1889","article-title":"Trust region policy optimization","volume-title":"International conference on machine learning","author":"Schulman"},{"key":"ref28","author":"de Witt","year":"2020","journal-title":"Is independent learning all you need in the starcraft multi-agent challenge?"},{"key":"ref29","first-page":"12 208","article-title":"Facmac: Factored multi-agent centralised policy gradients","volume":"34","author":"Peng","year":"2021","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref30","first-page":"24 611","article-title":"The surprising effectiveness of ppo in cooperative multi-agent games","volume":"35","author":"Yu","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.23860\/diss-li-hepfeng-2023"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CAC57257.2022.10054763"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i13.17353"}],"event":{"name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","location":"Yokohama, Japan","start":{"date-parts":[[2024,5,13]]},"end":{"date-parts":[[2024,5,17]]}},"container-title":["2024 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10609961\/10609862\/10611573.pdf?arnumber=10611573","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,11]],"date-time":"2024-08-11T04:19:06Z","timestamp":1723349946000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10611573\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,13]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/icra57147.2024.10611573","relation":{},"subject":[],"published":{"date-parts":[[2024,5,13]]}}}