{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,2]],"date-time":"2025-11-02T04:45:45Z","timestamp":1762058745184,"version":"build-2065373602"},"reference-count":45,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,5,23]],"date-time":"2022-05-23T00:00:00Z","timestamp":1653264000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,5,23]],"date-time":"2022-05-23T00:00:00Z","timestamp":1653264000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,5,23]]},"DOI":"10.1109\/icra46639.2022.9811575","type":"proceedings-article","created":{"date-parts":[[2022,7,12]],"date-time":"2022-07-12T19:36:40Z","timestamp":1657654600000},"page":"6351-6357","source":"Crossref","is-referenced-by-count":15,"title":["Search-Based Task Planning with Learned Skill Effect Models for Lifelong Robotic Manipulation"],"prefix":"10.1109","author":[{"given":"Jacky","family":"Liang","sequence":"first","affiliation":[{"name":"Robotics Institute, Carnegie Mellon University"}]},{"given":"Mohit","family":"Sharma","sequence":"additional","affiliation":[{"name":"Robotics Institute, Carnegie Mellon University"}]},{"given":"Alex","family":"LaGrassa","sequence":"additional","affiliation":[{"name":"Robotics Institute, Carnegie Mellon University"}]},{"given":"Shivam","family":"Vats","sequence":"additional","affiliation":[{"name":"Robotics Institute, Carnegie Mellon University"}]},{"given":"Saumya","family":"Saxena","sequence":"additional","affiliation":[{"name":"Robotics Institute, Carnegie Mellon University"}]},{"given":"Oliver","family":"Kroemer","sequence":"additional","affiliation":[{"name":"Robotics Institute, Carnegie Mellon University"}]}],"member":"263","reference":[{"key":"ref39","article-title":"C-learning: Horizon-aware cumulative accessibility estimation","author":"naderian","year":"0","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2019.07.003"},{"key":"ref33","article-title":"Interaction networks for learning about objects, relations and physics","author":"battaglia","year":"2016","journal-title":"Advances in neural information processing systems"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(99)00052-1"},{"key":"ref31","doi-asserted-by":"crossref","first-page":"440","DOI":"10.1609\/icaps.v30i1.6739","article-title":"Pddlstream: Integrating symbolic planners and blackbox samplers via optimistic adaptive planning","volume":"30","author":"garrett","year":"0","journal-title":"Proceedings of the International Conference on Automated Planning and Scheduling"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1177\/02783649211004615"},{"key":"ref37","article-title":"Fast graph representation learning with PyTorch Geometric","author":"fey","year":"0","journal-title":"ICLR Workshop on Representation Learning on Graphs and Manifolds"},{"key":"ref36","article-title":"Object and relation centric representations for push effect prediction","author":"tekden","year":"2021","journal-title":"ArXiv Preprint"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2018.2859448"},{"key":"ref34","article-title":"Reasoning about physical interactions with object-oriented prediction and planning","author":"janner","year":"0","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref10","first-page":"4732","article-title":"Universal planning networks: Learning generalizable representations for visuo-motor control","author":"srinivas","year":"0","journal-title":"International Conference on Machine Learning"},{"key":"ref40","article-title":"gamma-models: Generative temporal difference learning for infinite-horizon prediction","author":"janner","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref11","article-title":"Broadly-exploring, local-policy trees for long-horizon task planning","author":"ichter","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1613\/jair.5575"},{"key":"ref13","article-title":"A long horizon planning framework for manipulating rigid pointcloud objects","author":"simeonov","year":"0","journal-title":"Conference on Robot Learning (CoRL)"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9560782"},{"key":"ref15","article-title":"Deep affordance foresight: Planning through what can be done in the future","author":"xu","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10226"},{"key":"ref17","article-title":"Deep reinforcement learning in parameterized action space","author":"hausknecht","year":"0","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref18","article-title":"Parametrized deep q-networks learning: Reinforcement learning with discrete-continuous hybrid action space","author":"xiong","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989468"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8594313"},{"key":"ref4","article-title":"Skill transfer via partially amortized hierarchical planning","author":"xie","year":"0","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2015.7139553"},{"key":"ref3","article-title":"Reset-free lifelong learning with skill-space planning","author":"lu","year":"0","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref6","article-title":"Planning with goal-conditioned policies","author":"nasiriany","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9341182"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2021.3062342"},{"key":"ref8","article-title":"Planning under uncertainty to goal distributions","author":"conkey","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9196935"},{"key":"ref2","article-title":"Dynamics-aware unsupervised discovery of skills","author":"sharma","year":"0","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9561402"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/0921-8890(95)00004-Y"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9341532"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1016\/j.jco.2020.101483"},{"journal-title":"Skill discovery for exploration and planning using deep skill graphs","year":"2020","author":"bagaria","key":"ref22"},{"key":"ref21","doi-asserted-by":"crossref","first-page":"734","DOI":"10.1609\/icaps.v29i1.3542","article-title":"Pomhdp: Search-based belief space planning using multiple heuristics","volume":"29","author":"kim","year":"0","journal-title":"Proceedings of the International Conference on Automated Planning and Scheduling"},{"journal-title":"Isaac gym","year":"0","key":"ref42"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2011.5980391"},{"key":"ref41","article-title":"Learning accurate long-term dynamics for model-based reinforcement learning","author":"lambert","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2014.6942570"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511546877"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.3389\/frobt.2019.00123"},{"key":"ref43","article-title":"Gpu-accelerated robotic simulation for distributed reinforcement learning","author":"liang","year":"0","journal-title":"Conference on Robot Learning (CoRL)"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1177\/0278364913484072"}],"event":{"name":"2022 IEEE International Conference on Robotics and Automation (ICRA)","start":{"date-parts":[[2022,5,23]]},"location":"Philadelphia, PA, USA","end":{"date-parts":[[2022,5,27]]}},"container-title":["2022 International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9811522\/9811357\/09811575.pdf?arnumber=9811575","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,29]],"date-time":"2024-09-29T00:04:35Z","timestamp":1727568275000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9811575\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,5,23]]},"references-count":45,"URL":"https:\/\/doi.org\/10.1109\/icra46639.2022.9811575","relation":{},"subject":[],"published":{"date-parts":[[2022,5,23]]}}}