{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,10]],"date-time":"2026-03-10T11:21:34Z","timestamp":1773141694671,"version":"3.50.1"},"reference-count":70,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2025,12,1]],"date-time":"2025-12-01T00:00:00Z","timestamp":1764547200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Cogn. Dev. Syst."],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1109\/tcds.2025.3569352","type":"journal-article","created":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T13:45:49Z","timestamp":1747057549000},"page":"1503-1519","source":"Crossref","is-referenced-by-count":3,"title":["H-GRAIL: A Robotic Motivational Architecture to Tackle Open-Ended Learning Challenges"],"prefix":"10.1109","volume":"17","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0507-8320","authenticated-orcid":false,"given":"Alejandro","family":"Romero","sequence":"first","affiliation":[{"name":"Integrated Group for Engineering Research (GII), CITIC Research Center, Universidade da Coru&#x00F1;a, Ferrol (A Coru&#x00F1;a), Spain"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1277-4447","authenticated-orcid":false,"given":"Gianluca","family":"Baldassarre","sequence":"additional","affiliation":[{"name":"Institute of Cognitive Sciences and Technologies (ISTC), National Research Council of Italy (CNR), Rome, Italy"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6807-524X","authenticated-orcid":false,"given":"Richard J.","family":"Duro","sequence":"additional","affiliation":[{"name":"Integrated Group for Engineering Research (GII), CITIC Research Center, Universidade da Coru&#x00F1;a, Ferrol (A Coru&#x00F1;a), Spain"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8748-9632","authenticated-orcid":false,"given":"Vieri Giuliano","family":"Santucci","sequence":"additional","affiliation":[{"name":"Institute of Cognitive Sciences and Technologies (ISTC), National Research Council of Italy (CNR), Rome, Italy"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2024.128073"},{"key":"ref2","article-title":"From machine learning to robotics: Challenges and opportunities for embodied intelligence","author":"Roy","year":"2021"},{"key":"ref3","article-title":"Open-ended learning leads to generally capable agents","author":"Team","year":"2021"},{"key":"ref4","article-title":"A definition of open-ended learning problems for goal-conditioned agents","author":"Sigaud","year":"2023"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/tcds.2023.3270081"},{"key":"ref6","article-title":"Open-endedness is essential for artificial superhuman intelligence","author":"Hughes","year":"2024"},{"key":"ref7","first-page":"131","article-title":"A definition of continual reinforcement learning","volume":"36","author":"Abel","year":"2024","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2019.01.012"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1080\/09540090310001655110"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1142\/S0219843604000149"},{"key":"ref11","volume-title":"Reinforcement Learning: An Introduction","author":"Sutton","year":"2018"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-32375-1"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.3389\/978-2-88963-485-9"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.3389\/fpsyg.2013.00907"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TAMD.2010.2056368"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2017.70"},{"key":"ref17","article-title":"Go-explore: A new approach for hard-exploration problems","author":"Ecoffet","year":"2019"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2020.3042938"},{"key":"ref19","article-title":"Never give up: Learning directed exploration strategies","author":"Badia","year":"2020"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2016.2538961"},{"key":"ref21","article-title":"Diversity is all you need: Learning skills without a reward function","volume-title":"Proc. 7th Int. Conf. Learn. Represent. (ICLR)","author":"Eysenbach","year":"2019"},{"key":"ref22","first-page":"3761","article-title":"Language as a cognitive tool to imagine goals in curiosity driven exploration","volume":"33","author":"Colas","year":"2020","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref23","first-page":"7783","article-title":"Skew-fit: State-covering self-supervised reinforcement learning","volume-title":"Proc. 37th Int. Conf. on Mach. Learn.","author":"Pong","year":"2020"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2021.3087733"},{"key":"ref25","first-page":"20516","article-title":"Interesting object, curious agent: Learning task-agnostic exploration","volume":"34","author":"Parisi","year":"2021","journal-title":"Adv. Neur. Inf. Process. Syst."},{"key":"ref26","first-page":"131","article-title":"Regularity as intrinsic reward for free play","volume-title":"Adv. Neural Inf. Proc. Syst.","volume":"36","author":"Sancaktar","year":"2024"},{"key":"ref27","first-page":"112","article-title":"Intrinsically motivated learning of hierarchical collections of skills","volume-title":"Proc. 3rd Int. Conf. Develop. Learn.","author":"Barto","year":"2004"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2013.00022"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2012.05.008"},{"key":"ref30","first-page":"1514","article-title":"Automatic goal generation for reinforcement learning agents","volume-title":"Proc. 35th Int. Conf. on Mach. Learn","author":"Florensa","year":"2018"},{"key":"ref31","first-page":"18474","article-title":"Autonomous reinforcement learning via subgoal curricula","volume":"34","author":"Sharma","year":"2021","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref32","first-page":"131","article-title":"Control what you can: Intrinsically motivated task-planning agent","volume":"32","author":"Blaes","year":"2019","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICAR53236.2021.9659371"},{"issue":"1","key":"ref34","first-page":"6818","article-title":"Intrinsically motivated goal exploration processes with automatic curriculum learning","volume":"23","author":"Forestier","year":"2022","journal-title":"J. Mach. Learn. Res."},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICDL53763.2022.9962200"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2018.00059"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN54540.2023.10191570"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.3389\/frobt.2022.762051"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2021.3057758"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2022.3231731"},{"key":"ref41","first-page":"205","article-title":"Augmenting autotelic agents with large language models","volume-title":"Proc. Conf. Lifelong Learn. Agents","author":"Colas","year":"2023"},{"key":"ref42","article-title":"A path towards autonomous machine intelligence version 0.9. 2, 2022-06-27","volume":"62","author":"LeCun","year":"2022","journal-title":"Open Rev."},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.3390\/s23031611"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.3233\/ICA-200633"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2019.10.124"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/DEVLRN.2019.8850713"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/DevLrn.2012.6400835"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1.13554"},{"key":"ref49","first-page":"3074","article-title":"Rotting bandits","volume":"34","author":"Levine","year":"2017","journal-title":"Adv. Neur. Inf. Process. Syst."},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/3453160"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.3233\/faia200373"},{"key":"ref52","first-page":"2547","article-title":"Learning multiple tasks with non-stationary interdependencies in autonomous robots","volume-title":"Proc. Int. Conf. Auton. Agents Multiagent Syst.","author":"Romero","year":"2023"},{"key":"ref53","first-page":"135","article-title":"Unsupervised learning of goal spaces for intrinsically motivated goal exploration","volume-title":"Proc. 6th Int. Conf. Learn. Representations (ICLR)","author":"P\u00e9r\u00e9","year":"2018"},{"key":"ref54","first-page":"134","article-title":"When should agents explore?","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Pislar","year":"2021"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8593799"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9560922"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.2011.5949955"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/TEVC.2017.2704781"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1016\/j.bica.2016.07.003"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/TCDS.2023.3270081"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1016\/S0065-2407(08)60403-6"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2019.00098"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2018.00030"},{"key":"ref64","article-title":"Planning with neural networks and reinforcement learning","author":"Baldassarre","year":"2002"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/DEVLRN.2017.8329804"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/TAMD.2010.2062511"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/DEVLRN.2017.8329807"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2019.00045"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2020.103710"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10295"}],"container-title":["IEEE Transactions on Cognitive and Developmental Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/7274989\/11288412\/11002551.pdf?arnumber=11002551","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,16]],"date-time":"2025-12-16T18:33:12Z","timestamp":1765909992000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11002551\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12]]},"references-count":70,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tcds.2025.3569352","relation":{},"ISSN":["2379-8920","2379-8939"],"issn-type":[{"value":"2379-8920","type":"print"},{"value":"2379-8939","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12]]}}}