{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,24]],"date-time":"2026-04-24T23:11:58Z","timestamp":1777072318073,"version":"3.51.4"},"reference-count":42,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"4","license":[{"start":{"date-parts":[[2023,12,1]],"date-time":"2023-12-01T00:00:00Z","timestamp":1701388800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,12,1]],"date-time":"2023-12-01T00:00:00Z","timestamp":1701388800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,12,1]],"date-time":"2023-12-01T00:00:00Z","timestamp":1701388800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100010664","name":"EU H2020- FET RoboRoyale","doi-asserted-by":"publisher","award":["964492"],"award-info":[{"award-number":["964492"]}],"id":[{"id":"10.13039\/100010664","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001824","name":"Czech Science Foundation","doi-asserted-by":"publisher","award":["20-27034J"],"award-info":[{"award-number":["20-27034J"]}],"id":[{"id":"10.13039\/501100001824","id-type":"DOI","asserted-by":"publisher"}]},{"name":"OP VVV","award":["CZ.02.101\/0.0\/0.0\/16_019\/0000765 RCI"],"award-info":[{"award-number":["CZ.02.101\/0.0\/0.0\/16_019\/0000765 RCI"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Cogn. Dev. Syst."],"published-print":{"date-parts":[[2023,12]]},"DOI":"10.1109\/tcds.2023.3239815","type":"journal-article","created":{"date-parts":[[2023,1,25]],"date-time":"2023-01-25T18:44:33Z","timestamp":1674672273000},"page":"2122-2131","source":"Crossref","is-referenced-by-count":48,"title":["Federated Reinforcement Learning for Collective Navigation of Robotic Swarms"],"prefix":"10.1109","volume":"15","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7787-6930","authenticated-orcid":false,"given":"Seongin","family":"Na","sequence":"first","affiliation":[{"name":"Department of Electrical and Electronic Engineering, The University of Manchester, Manchester, U.K."}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3598-1630","authenticated-orcid":false,"given":"Tom\u00e1\u0161","family":"Rou\u010dek","sequence":"additional","affiliation":[{"name":"AIC, FEE, Czech Technical University in Prague, Prague, Czechia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9754-6728","authenticated-orcid":false,"given":"Ji\u0159\u00ed","family":"Ulrich","sequence":"additional","affiliation":[{"name":"AIC, FEE, Czech Technical University in Prague, Prague, Czechia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jan","family":"Pikman","sequence":"additional","affiliation":[{"name":"AIC, FEE, Czech Technical University in Prague, Prague, Czechia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4408-7916","authenticated-orcid":false,"given":"Tom\u00e1\u0161","family":"Krajn\u00edk","sequence":"additional","affiliation":[{"name":"AIC, FEE, Czech Technical University in Prague, Prague, Czechia"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0905-8324","authenticated-orcid":false,"given":"Barry","family":"Lennox","sequence":"additional","affiliation":[{"name":"Department of Electrical and Electronic Engineering, The University of Manchester, Manchester, U.K."}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7950-3193","authenticated-orcid":false,"given":"Farshad","family":"Arvin","sequence":"additional","affiliation":[{"name":"Department of Computer Science, Swarm and Computational Intelligence Laboratory, Durham University, Durham, U.K."}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.swevo.2020.100762"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/s11721-012-0075-2"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0151834"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1126\/scirobotics.abe4385"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/j.gfs.2019.04.011"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1126\/scirobotics.abf1628"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1126\/scirobotics.abf1538"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.3389\/frobt.2016.00029"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-74528-2"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-74089-6_3"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.3389\/frobt.2019.00059"},{"key":"ref12","volume-title":"Reinforcement Learning: An Introduction","author":"Sutton","year":"2018"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.3034800"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2022.3145346"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2017.8202312"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/tnnls.2022.3191021"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2021.3054625"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1177\/0278364920916531"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2019.2928811"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICCRE51898.2021.9435666"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11794"},{"key":"ref22","first-page":"6382","article-title":"Multi-agent actor-critic for mixed cooperative-competitive environments","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"30","author":"Lowe"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-43890-6_22"},{"key":"ref24","first-page":"1273","article-title":"Communication-efficient learning of deep networks from decentralized data","volume-title":"Proc. 20th Int. Conf. Artif. Intell. Statist. (AISTATS)","volume":"54","author":"McMahan"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.01.1900525"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1038\/s41598-020-69250-1"},{"key":"ref27","article-title":"Federated deep reinforcement learning","author":"Zhuo","year":"2020","journal-title":"arXiv:1901.08277[cs.LG]"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2020.2986803"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2019.2931179"},{"key":"ref30","article-title":"Continuous control with deep reinforcement learning","volume-title":"Proc. 4th Int. Conf. Learn. Represent. (ICLR)","author":"Lillicrap"},{"key":"ref31","first-page":"1","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017","journal-title":"arXiv:1707.06347"},{"key":"ref32","first-page":"1582","article-title":"Addressing function approximation error in actor-critic methods","volume-title":"Proc. Int. Conf. Mach. Learn. (PMLR)","author":"Fujimoto"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/JSAC.2018.2864373"},{"key":"ref35","first-page":"10707","article-title":"Shared experience actor-critic for multi-agent reinforcement learning","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"33","author":"Christianos"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/3477314.3507043"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3161534.3161537"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/s10846-014-0041-x"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.55417\/fr.2022055"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2020.3013265"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.3389\/frobt.2022.791921"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.2965416"}],"container-title":["IEEE Transactions on Cognitive and Developmental Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7274989\/10360134\/10025836.pdf?arnumber=10025836","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,12]],"date-time":"2024-01-12T01:57:46Z","timestamp":1705024666000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10025836\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12]]},"references-count":42,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1109\/tcds.2023.3239815","relation":{},"ISSN":["2379-8920","2379-8939"],"issn-type":[{"value":"2379-8920","type":"print"},{"value":"2379-8939","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,12]]}}}