{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,13]],"date-time":"2026-03-13T14:57:42Z","timestamp":1773413862654,"version":"3.50.1"},"reference-count":76,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,5,19]],"date-time":"2025-05-19T00:00:00Z","timestamp":1747612800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,5,19]],"date-time":"2025-05-19T00:00:00Z","timestamp":1747612800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"NSF","doi-asserted-by":"publisher","award":["2024778,2149585"],"award-info":[{"award-number":["2024778,2149585"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,5,19]]},"DOI":"10.1109\/icra55743.2025.11127935","type":"proceedings-article","created":{"date-parts":[[2025,9,2]],"date-time":"2025-09-02T17:28:56Z","timestamp":1756834136000},"page":"1208-1216","source":"Crossref","is-referenced-by-count":1,"title":["Points2Plans: From Point Clouds to Long-Horizon Plans with Composable Relational Dynamics"],"prefix":"10.1109","author":[{"given":"Yixuan","family":"Huang","sequence":"first","affiliation":[{"name":"Stanford University"}]},{"given":"Christopher","family":"Agia","sequence":"additional","affiliation":[{"name":"Stanford University"}]},{"given":"Jimmy","family":"Wu","sequence":"additional","affiliation":[{"name":"Princeton University"}]},{"given":"Tucker","family":"Hermans","sequence":"additional","affiliation":[{"name":"University of Utah"}]},{"given":"Jeannette","family":"Bohg","sequence":"additional","affiliation":[{"name":"Stanford University"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Do as i can, not as i say: Grounding language in robotic affordances","author":"Ahn","year":"2022","journal-title":"arXiv preprint"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160934"},{"key":"ref3","first-page":"1930","article-title":"Logic-geometric programming: An optimization-based approach to combined task and motion planning","author":"Toussaint","year":"2015","journal-title":"IJCAI"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1609\/icaps.v30i1.6739"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1146\/annurev-control-091420-084139"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48506.2021.9560841"},{"key":"ref7","first-page":"21847","article-title":"Accelerating robotic reinforcement learning via parameterized action primitives","volume":"34","author":"Dalal","year":"2021","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref8","first-page":"2262","article-title":"Skill-based model-based reinforcement learning","volume-title":"Proceedings of The 6th Conference on Robot Learning, ser. Proceedings of Machine Learning Research","volume":"205","author":"Shi","year":"2023"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160220"},{"key":"ref10","first-page":"2905","article-title":"Generative skill chaining: Long-horizon skill planning with diffusion models","volume-title":"Conference on Robot Learning.","author":"Mishra","year":"2023"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/s10514-023-10131-7"},{"key":"ref12","first-page":"4","article-title":"Planning for Multi-Object Manipulation with Graph Neural Network Relational Classifiers","volume-title":"IEEE International Conference on Robotics and Automation (ICRA)","author":"Huang","year":"2023"},{"key":"ref13","first-page":"5","article-title":"Latent Space Planning for Multi-Object Manipulation with EnvironmentAware Relational Classifiers","volume-title":"IEEE Transactions on Robotics (T-RO)","author":"Huang","year":"2024"},{"key":"ref14","first-page":"701","article-title":"Learning neuro-symbolic skills for bilevel planning","volume-title":"Proceedings of The 6th Conference on Robot Learning, ser. Proceedings of Machine Learning Research","volume":"205","author":"Silver","year":"2023"},{"key":"ref15","article-title":"On the opportunities and risks of foundation models","author":"Bommasani","year":"2021","journal-title":"arXiv preprint"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2008.10.024"},{"key":"ref17","first-page":"1443","article-title":"Learning parameterized skills","volume-title":"Proceedings of the 29th International Coference on International Conference on Machine Learning","author":"Da Silva","year":"2012"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2012.11.010"},{"key":"ref19","first-page":"651","article-title":"Scalable deep reinforcement learning for vision-based robotic manipulation","volume-title":"Conference on robot learning.","author":"Kalashnikov","year":"2018"},{"key":"ref20","article-title":"XSkill: Cross embodiment skill discovery","volume-title":"7th Annual Conference on Robot Learning","author":"Xu","year":"2023"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2023.XIX.031"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989109"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/iros40897.2019.8967761"},{"key":"ref24","first-page":"148","article-title":"Sornet: Spatial objectcentric representations for sequential manipulation","volume-title":"Conference on Robot Learning.","author":"Yuan","year":"2022"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2023.3308061"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2024.xx.040"},{"key":"ref27","first-page":"2","article-title":"Inner monologue: Embodied reasoning through planning with language models","volume-title":"6th Annual Conference on Robot Learning","author":"Huang","year":"2022"},{"key":"ref28","article-title":"Palme: an embodied multimodal language model","volume-title":"Proceedings of the 40th International Conference on Machine Learning, ser. ICML\u201923.","author":"Driess","year":"2023"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10160591"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA48891.2023.10161317"},{"key":"ref31","article-title":"Regression planning networks","volume":"32","author":"Xu","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3186635"},{"key":"ref33","article-title":"Pddl planning with pretrained large language models","volume-title":"NeurIPS 2022 foundation models for decision making workshop","author":"Silver","year":"2022"},{"key":"ref34","article-title":"Llm+ p: Empowering large language models with optimal planning proficiency","author":"Liu","year":"2023","journal-title":"arXiv preprint"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10610455"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(99)00052-1"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v31i1.10916"},{"key":"ref38","article-title":"Data-efficient hierarchical reinforcement learning","volume":"31","author":"Nachum","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10226"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9196958"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812140"},{"key":"ref42","first-page":"2","article-title":"Generalization with lossy affordances: Leveraging broad offline data for learning visuomotor tasks","volume-title":"6th Annual Conference on Robot Learning","author":"Fang","year":"2022"},{"key":"ref43","first-page":"2","article-title":"Value function spaces: Skill-centric state abstractions for long-horizon reasoning","volume-title":"International Conference on Learning Representations","author":"Shah","year":"2022"},{"key":"ref44","first-page":"2","article-title":"Skill-based model-based reinforcement learning","volume-title":"6th Annual Conference on Robot Learning","author":"Shi","year":"2022"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460689"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00876"},{"key":"ref47","first-page":"2","article-title":"Sequential dexterity: Chaining dexterous policies for long-horizon manipulation","volume-title":"7th Annual Conference on Robot Learning","author":"Chen","year":"2023"},{"key":"ref48","first-page":"2","article-title":"Adversarial skill chaining for long-horizon robot manipulation via terminal state regularization","volume-title":"5th Annual Conference on Robot Learning","author":"Lee","year":"2021"},{"key":"ref49","first-page":"5","article-title":"Predicting stable configurations for semantic placement of novel objects","volume-title":"5 th Annual Conference on Robot Learning","author":"Paxton","year":"2021"},{"key":"ref50","article-title":"Visual foresight: Model-based deep reinforcement learning for vision-based robotic control","author":"Ebert","year":"2018","journal-title":"arXiv preprint"},{"key":"ref51","first-page":"2555","article-title":"Learning latent dynamics for planning from pixels","volume-title":"International conference on machine learning.","author":"Hafner","year":"2019"},{"key":"ref52","first-page":"2","article-title":"Dream to control: Learning behaviors by latent imagination","volume-title":"International Conference on Learning Representations","author":"Hafner","year":"2020"},{"key":"ref53","first-page":"2","article-title":"Learning sequential acquisition policies for robot-assisted feeding","volume-title":"7th Annual Conference on Robot Learning","author":"Sundaresan","year":"2023"},{"key":"ref54","first-page":"112","article-title":"3d neural scene representations for visuomotor control","volume-title":"Conference on Robot Learning.","author":"Li","year":"2022"},{"key":"ref55","first-page":"2","article-title":"Robocook: Longhorizon elasto-plastic object manipulation with diverse tools","volume-title":"7th Annual Conference on Robot Learning","author":"Shi","year":"2023"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1177\/02783649231219020"},{"key":"ref57","first-page":"2","article-title":"A compositional object-based approach to learning physical dynamics","volume-title":"International Conference on Learning Representations","author":"Chang","year":"2017"},{"key":"ref58","article-title":"Interaction networks for learning about objects, relations and physics","volume":"29","author":"Battaglia","year":"2016","journal-title":"Advances in neural information processing systems"},{"key":"ref59","first-page":"4470","article-title":"Graph networks as learnable physics engines for inference and control","volume-title":"International conference on machine learning.","author":"Sanchez-Gonzalez","year":"2018"},{"key":"ref60","first-page":"2688","article-title":"Neural relational inference for interacting systems","volume-title":"International conference on machine learning.","author":"Kipf","year":"2018"},{"key":"ref61","first-page":"1755","article-title":"Learning multi-object dynamics with compositional neural radiance fields","volume-title":"Conference on robot learning.","author":"Driess","year":"2023"},{"key":"ref62","first-page":"1582","article-title":"A long horizon planning framework for manipulating rigid pointcloud objects","volume-title":"Conference on Robot Learning.","author":"Simeonov","year":"2021"},{"key":"ref63","article-title":"Diffskill: Skill abstraction from differentiable physics for deformable object manipulations with tools","volume-title":"International Conference on Learning Representation (ICLR)","author":"Lin","year":"2022"},{"key":"ref64","first-page":"2","article-title":"Planning with spatial-temporal abstraction from point clouds for deformable object manipulation","volume-title":"6th Annual Conference on Robot Learning","author":"Lin","year":"2022"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10610240"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i10.26429"},{"key":"ref67","article-title":"From reals to logic and back: Inventing symbolic vocabularies, actions and models for planning from raw data","author":"Shah","year":"2024","journal-title":"arXiv preprint"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"ref69","first-page":"3","article-title":"Open-vocabulary object detection via vision and language knowledge distillation","volume-title":"International Conference on Learning Representations","author":"Gu","year":"2022"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2011.5980391"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2020.xvi.003"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00985"},{"key":"ref73","first-page":"8024","article-title":"Pytorch: An imperative style, highperformance deep learning library","volume-title":"Advances in Neural Information Processing Systems 32.","author":"Paszke","year":"2019"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1023\/A:1010091220143"},{"key":"ref75","article-title":"Isaac gym: High performance GPU based physics simulation for robot learning","volume-title":"Thirty-fifth Conference on Neural Information Processing Systems Datasets and Benchmarks Track (Round 2)","author":"Makoviychuk","year":"2021"},{"key":"ref76","article-title":"Gpt-4 technical report","author":"Achiam","year":"2023","journal-title":"arXiv preprint"}],"event":{"name":"2025 IEEE International Conference on Robotics and Automation (ICRA)","location":"Atlanta, GA, USA","start":{"date-parts":[[2025,5,19]]},"end":{"date-parts":[[2025,5,23]]}},"container-title":["2025 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11127273\/11127223\/11127935.pdf?arnumber=11127935","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,3]],"date-time":"2025-09-03T06:06:20Z","timestamp":1756879580000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11127935\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,19]]},"references-count":76,"URL":"https:\/\/doi.org\/10.1109\/icra55743.2025.11127935","relation":{},"subject":[],"published":{"date-parts":[[2025,5,19]]}}}