{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T18:13:57Z","timestamp":1755800037020,"version":"3.44.0"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,8,26]],"date-time":"2025-08-26T00:00:00Z","timestamp":1756166400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,8,26]],"date-time":"2025-08-26T00:00:00Z","timestamp":1756166400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,8,26]]},"DOI":"10.1109\/cog64752.2025.11114167","type":"proceedings-article","created":{"date-parts":[[2025,8,19]],"date-time":"2025-08-19T18:06:42Z","timestamp":1755626802000},"page":"1-8","source":"Crossref","is-referenced-by-count":0,"title":["A Continual Offline Reinforcement Learning Benchmark for Navigation Tasks"],"prefix":"10.1109","author":[{"given":"Anthony","family":"Kobanda","sequence":"first","affiliation":[{"name":"Inria, Univ. Lille, CNRS, UMR 9198-CRIStAL,Centrale Lille,Lille,France,F-59000"}]},{"given":"Odalric-Ambrym","family":"Maillard","sequence":"additional","affiliation":[{"name":"Inria, Univ. Lille, CNRS, UMR 9198-CRIStAL,Centrale Lille,Lille,France,F-59000"}]},{"given":"R\u00e9my","family":"Portelas","sequence":"additional","affiliation":[{"name":"Ubisoft La Forge,Bordeaux,France"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Reinforcement Learning: An Introduction, Second Edition","author":"Sutton","year":"2018","journal-title":"MIT Press"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2017.2743240"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1.13673"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2024.3367329"},{"key":"ref5","article-title":"Goalconditioned imitation learning","author":"Ding","year":"2019","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2022\/770"},{"volume-title":"Offline reinforcement learning: Tutorial, review, and perspectives on open problems","year":"2020","author":"Levine","key":"ref7"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CoG57401.2023.10333201"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CoG47356.2020.9231705"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CoG60054.2024.10645657"},{"journal-title":"Godot","article-title":"Godot game engine","year":"2020","key":"ref11"},{"key":"ref12","article-title":"The atari grand challenge dataset","author":"Kurin","year":"2017","journal-title":"arXiv preprint arXiv"},{"key":"ref13","first-page":"2048","article-title":"Leveraging procedural generation to benchmark reinforcement learning","volume-title":"International conference on machine learning","author":"Cobbe","year":"2020"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CIG.2016.7860433"},{"volume-title":"Don\u2019t forget, there is more than forgetting: new metrics for continual learning","year":"2018","author":"D\u00edaz-Rodr\u00edguez","key":"ref15"},{"key":"ref16","article-title":"Continual offline reinforcement learning via diffusionbased dual generative replay","author":"Liu","year":"2024","journal-title":"arxiv"},{"volume-title":"Continual world: A robotic benchmark for continual reinforcement learning","year":"2021","author":"Wolczyk","key":"ref17"},{"key":"ref18","article-title":"Cora: Benchmarks, baselines, and metrics as a platform for continual reinforcement learning agents","volume-title":"Conference on Lifelong Learning Agents, PMLR","author":"Powers","year":"2022"},{"key":"ref19","article-title":"Experience replay for continual learning","author":"Rolnick","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9560793"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1611835114"},{"volume-title":"Maintaining plasticity in continual learning via regenerative regularization","year":"2023","author":"Kumar","key":"ref22"},{"key":"ref23","article-title":"Progressive neural networks","author":"Rusu","year":"2016","journal-title":"arxiv preprint"},{"key":"ref24","article-title":"Hierarchical subspaces of policies for continual offline reinforcement learning","author":"Kobanda","year":"2024","journal-title":"arXiv preprint arXiv"},{"key":"ref25","article-title":"Efficient active imitation learning with random network distillation","author":"Bir\u00e9","year":"2024","journal-title":"arXiv preprint arXiv"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11651"},{"key":"ref27","article-title":"Relay policy learning: Solving long-horizon tasks via imitation and reinforcement learning","author":"Gupta","year":"2019","journal-title":"arXiv preprint arXiv"},{"key":"ref28","article-title":"Learning neural network subspaces","volume-title":"International Conference on Machine Learning","author":"Wortsman","year":"2021"},{"key":"ref29","article-title":"Reinforcement learning from passive data via latent intentions","volume-title":"International Conference on Machine Learning, PMLR","author":"Ghosh","year":"2023"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref31","article-title":"Layer normalization","author":"Ba","year":"2016","journal-title":"arXiv preprint arXiv"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-021-10033-z"}],"event":{"name":"2025 IEEE Conference on Games (CoG)","start":{"date-parts":[[2025,8,26]]},"location":"Lisbon, Portugal","end":{"date-parts":[[2025,8,29]]}},"container-title":["2025 IEEE Conference on Games (CoG)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11113832\/11113841\/11114167.pdf?arnumber=11114167","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,20]],"date-time":"2025-08-20T06:19:46Z","timestamp":1755670786000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11114167\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,26]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/cog64752.2025.11114167","relation":{},"subject":[],"published":{"date-parts":[[2025,8,26]]}}}