{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,19]],"date-time":"2026-05-19T15:47:56Z","timestamp":1779205676568,"version":"3.51.4"},"reference-count":70,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,5,13]],"date-time":"2024-05-13T00:00:00Z","timestamp":1715558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,5,13]],"date-time":"2024-05-13T00:00:00Z","timestamp":1715558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,5,13]]},"DOI":"10.1109\/icra57147.2024.10611448","type":"proceedings-article","created":{"date-parts":[[2024,8,8]],"date-time":"2024-08-08T17:51:05Z","timestamp":1723139465000},"page":"515-522","source":"Crossref","is-referenced-by-count":7,"title":["Lifelong Robot Library Learning: Bootstrapping Composable and Generalizable Skills for Embodied Control with Language Models"],"prefix":"10.1109","author":[{"given":"Georgios","family":"Tziafas","sequence":"first","affiliation":[{"name":"University of Groningen,Department of Artificial Intelligence,the Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hamidreza","family":"Kasaei","sequence":"additional","affiliation":[{"name":"University of Groningen,Department of Artificial Intelligence,the Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Ai2-thor: An interactive 3d environment for visual ai","author":"Kolve","year":"2017"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00447"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00943"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1146\/annurev-control-101119-071628"},{"key":"ref5","article-title":"Rt-2: Vision-language-action models transfer web knowledge to robotic control","author":"Brohan","year":"2023"},{"key":"ref6","article-title":"Palm-e: An embodied multimodal language model","volume-title":"International Conference on Machine Learning","author":"Driess"},{"key":"ref7","article-title":"Vima: General robot manipulation with multimodal prompts","author":"Jiang","year":"2022"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/lra.2023.3295255"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2019.12.004"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2019.01.012"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2024.3367329\/mm1"},{"key":"ref12","article-title":"Language models are few-shot learners","author":"Brown","year":"2020"},{"key":"ref13","article-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023"},{"key":"ref14","article-title":"Palm: Scaling language modeling with pathways","author":"Chowdhery","year":"2022"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160591"},{"key":"ref16","article-title":"Instruct2act: Mapping multi-modality instructions to robotic actions with large language model","author":"Huang","year":"2023"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10161317"},{"key":"ref18","article-title":"Chatgpt for robotics: Design principles and model abilities","author":"Vemprala","year":"2023"},{"key":"ref19","article-title":"Voxposer: Composable 3d value maps for robotic manipulation with language models","author":"Huang","year":"2023"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1126\/science.7761831"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3453483.3454080"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1177\/0278364915602060"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460699"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2018.XIV.028"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2021.XVII.020"},{"key":"ref26","article-title":"Bc-z: Zero-shot task generalization with robotic imitation learning","author":"Jang","year":"2022"},{"key":"ref27","article-title":"Cliport: What and where pathways for robotic manipulation","author":"Shridhar","year":"2021"},{"key":"ref28","article-title":"Learning to interpret natural language commands through human-robot dialog","volume-title":"International Joint Conference on Artificial Intelligence","author":"Thomason"},{"key":"ref29","article-title":"Programmatically grounded, compositionally generalizable robotic manipulation","author":"Wang","year":"2023"},{"key":"ref30","author":"Tziafas","year":"2022","journal-title":"Enhancing interpretability and interactivity in robot manipulation: A neurosymbolic approach"},{"key":"ref31","article-title":"Language models as zero-shot planners: Extracting actionable knowledge for embodied agents","author":"Huang","year":"2022"},{"key":"ref32","article-title":"Do as i can, not as i say: Grounding language in robotic affordances","author":"Ahn","year":"2022","journal-title":"Conference on Robot Learning"},{"key":"ref33","article-title":"Inner monologue: Embodied reasoning through planning with language models","author":"Huang","year":"2022","journal-title":"Conference on Robot Learning"},{"key":"ref34","article-title":"Socratic models: Composing zero-shot multimodal reasoning with language","author":"Zeng","year":"2022"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2019\/880"},{"key":"ref36","article-title":"Pixl2r: Guiding reinforcement learning using natural language by mapping pixels to rewards","author":"Goyal","year":"2020"},{"key":"ref37","article-title":"Language as an abstraction for hierarchical deep reinforcement learning","author":"Jiang","year":"2019","journal-title":"Neural Information Processing Systems"},{"key":"ref38","article-title":"Language-conditioned imitation learning for robot manipulation tasks","author":"Stepputtis","year":"2020"},{"key":"ref39","article-title":"Learning language-conditioned robot behavior from offline data and crowd-sourced annotation","author":"Nair","year":"2021","journal-title":"Conference on Robot Learning"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1197"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2022.XVIII.065"},{"key":"ref42","article-title":"Embodiedgpt: Vision-language pre-training via embodied chain of thought","author":"Mu","year":"2023"},{"key":"ref43","article-title":"Learning transferable visual models from natural language supervision","volume-title":"International Conference on Machine Learning","author":"Radford"},{"key":"ref44","article-title":"Open-vocabulary object detection via vision and language knowledge distillation","volume-title":"International Conference on Learning Representations","author":"Gu"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00180"},{"key":"ref46","article-title":"React: Synergizing reasoning and acting in language models","author":"Yao","year":"2022"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.naacl-long.463"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.495"},{"key":"ref49","article-title":"Webgpt: Browser-assisted question-answering with human feedback","author":"Nakano","year":"2021"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606763"},{"key":"ref51","article-title":"Voyager: An open-ended embodied agent with large language models","author":"Wang","year":"2023"},{"key":"ref52","article-title":"Assistgpt: A general multi-modal assistant that can plan, execute, inspect, and learn","author":"Gao","year":"2023"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1177\/0278364917706418"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1145\/3568162.3578623"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/IROS47612.2022.9981810"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10161068"},{"key":"ref57","article-title":"Language to rewards for robotic skill synthesis","author":"Yu","year":"2023"},{"key":"ref58","article-title":"Scaling up and distilling down: Language-guided robot skill acquisition","author":"Ha","year":"2023"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1410"},{"key":"ref60","volume-title":"New and improved embedding model, openai","year":"2022"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1145\/290941.291025"},{"key":"ref62","article-title":"Chain of thought prompting elicits reasoning in large language models","author":"Wei","year":"2022"},{"key":"ref63","volume-title":"Introducing chatgpt, openai","year":"2022"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.59287\/icaens.1127"},{"key":"ref65","volume-title":"Pybullet gymperium","year":"2019"},{"key":"ref66","article-title":"Transporter networks: Rearranging the visual world for robotic manipulation","author":"Zeng","year":"2020","journal-title":"Conference on Robot Learning"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9340777"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2004.1389727"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.33540\/2168"},{"key":"ref70","article-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023"}],"event":{"name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","location":"Yokohama, Japan","start":{"date-parts":[[2024,5,13]]},"end":{"date-parts":[[2024,5,17]]}},"container-title":["2024 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10609961\/10609862\/10611448.pdf?arnumber=10611448","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,11]],"date-time":"2024-08-11T04:17:53Z","timestamp":1723349873000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10611448\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,13]]},"references-count":70,"URL":"https:\/\/doi.org\/10.1109\/icra57147.2024.10611448","relation":{},"subject":[],"published":{"date-parts":[[2024,5,13]]}}}