{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,28]],"date-time":"2026-05-28T06:01:57Z","timestamp":1779948117247,"version":"3.53.1"},"reference-count":85,"publisher":"IEEE","license":[{"start":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T00:00:00Z","timestamp":1773964800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T00:00:00Z","timestamp":1773964800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001804","name":"Canada Research Chair","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001804","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100021202","name":"Digital Research Alliance of Canada","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100021202","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026,3,20]]},"DOI":"10.1109\/3dv69130.2026.00056","type":"proceedings-article","created":{"date-parts":[[2026,5,27]],"date-time":"2026-05-27T19:40:49Z","timestamp":1779910849000},"page":"520-531","source":"Crossref","is-referenced-by-count":0,"title":["iTACO: Interactable Digital Twins of Articulated Objects from Casually Captured RGBD Videos"],"prefix":"10.1109","author":[{"given":"Weikun","family":"Peng","sequence":"first","affiliation":[{"name":"Simon Fraser University"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jun","family":"Lv","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Cewu","family":"Lu","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Manolis","family":"Savva","sequence":"additional","affiliation":[{"name":"Simon Fraser University"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/1276377.1276467"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00703"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51701.2025.00856"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2024.xx.124"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3721238.3730743"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3641519.3657463"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/358669.358692"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51701.2025.00581"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00425"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.00323"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19842-7_24"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00553"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.52202\/079017-3576"},{"key":"ref14","article-title":"Robot See Robot Do: Imitating Articulated Object Manipulation with Monocular 4D Reconstruction","volume-title":"8th Annual Conference on Robot Learning (CoRL)","author":"Kerr"},{"key":"ref15","article-title":"Adam: A Method for Stochastic Optimization","volume-title":"International Conference on Learning Representations (ICLR)","author":"Diederik"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00166"},{"key":"ref18","article-title":"Articulate-Anything: Automatic Modeling of Articulated Objects via a Vision-Language Foundation Model","volume-title":"International Conference on Learning Representations (ICLR)","author":"Le"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/3450626.3459852"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00376"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.00981"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.01591"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3731149"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00039"},{"key":"ref25","article-title":"SINGAPO: Single Image Controlled Generation of Articulated Parts in Object","volume-title":"International Conference on Learning Representations (ICLR)","author":"Liu"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51701.2025.00905"},{"key":"ref27","article-title":"Building Interactable Replicas of Complex Articulated Objects via Gaussian Splatting","volume-title":"International Conference on Learning Representations (ICLR)","author":"Liu"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/3DV62453.2024.00044"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9811859"},{"key":"ref30","article-title":"Real2code: Reconstruct articulated objects via code generation","volume-title":"International Conference on Learning Representations (ICLR)","author":"Mandi"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52729.2023.02120"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2022.3198480"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2019.00100"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01276"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298631"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/IROS55552.2023.10342135"},{"key":"ref37","article-title":"Polycam","year":"2025","journal-title":"Polycam"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01018"},{"key":"ref39","article-title":"SAM 2: Segment Anything in Images and Videos","author":"Ravi","year":"2024","journal-title":"arXiv preprint arXiv"},{"key":"ref40","article-title":"Record3D","year":"2025","journal-title":"Record3d"},{"key":"ref41","author":"Ren","year":"2025","journal-title":"Grounded SAM 2: Ground and Track Anything in Videos"},{"key":"ref42","author":"Ren","year":"2024","journal-title":"Grounded SAM: Assembling Open-World Models for Diverse Visual Tasks"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00280"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00515"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.01491"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00881"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.01972"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/3dv62453.2024.00100"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/1531326.1531377"},{"key":"ref50","article-title":"Aether: GeometricAware Unified World Modeling","volume-title":"Proceedings of the IEEE International Conference on Computer Vision (ICCV)","author":"Team"},{"key":"ref51","article-title":"Gemini: A Family of Highly Capable Multimodal Models","author":"Team","year":"2023","journal-title":"arXiv preprint arXiv"},{"key":"ref52","article-title":"DROID-SLAM: Deep Visual SLAM for Monocular, Stereo, and RGB-D Cameras","author":"Teed","year":"2021","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.15607\/rss.2024.xx.015"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9812272"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-49409-8_53"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51701.2025.00901"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.00983"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01956"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v39i8.32847"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00908"},{"key":"ref61","article-title":"Articulated Object Manipulation using Online Axis Estimation with SAM2-Based Tracking","author":"Wang","year":"2024","journal-title":"arXiv preprint arXiv"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01536"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01296"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00303"},{"key":"ref65","article-title":"Articulated Object Estimation in the Wild","volume-title":"1st Workshop on Egocentric Perception and Action for Robot Learning","author":"Werby"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01920"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01111"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-96-0972-7_17"},{"key":"ref69","author":"Xu","year":"2024","journal-title":"DAS3R: Dynamics-Aware Gaussian Splatting for Static Scene Reconstruction"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1145\/3386569.3392379"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1145\/3550469.3555390"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1145\/2897824.2925938"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1145\/3197517.3201396"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1145\/3355089.3356573"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1145\/3618327"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00709"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01572"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00288"},{"key":"ref79","article-title":"SAMPart3D: Segment Any Part in 3D Objects","author":"Yang","year":"2024","journal-title":"arXiv preprint arXiv"},{"key":"ref80","article-title":"Real-time Photorealistic Dynamic Scene Representation and Rendering with 4D Gaussian Splatting","volume-title":"International Conference on Learning Representations (ICLR)","author":"Yang"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10610652"},{"key":"ref82","article-title":"MonST3R: A Simple Approach for Estimating Geometry in the Presence of Motion","volume-title":"International Conference on Learning Representations (ICLR)","author":"Zhang"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1145\/3730930"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19827-4_2"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51701.2025.00823"}],"event":{"name":"2026 International Conference on 3D Vision (3DV)","location":"Vancouver, BC, Canada","start":{"date-parts":[[2026,3,20]]},"end":{"date-parts":[[2026,3,23]]}},"container-title":["2026 International Conference on 3D Vision (3DV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11533157\/11533158\/11533314.pdf?arnumber=11533314","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,28]],"date-time":"2026-05-28T05:02:52Z","timestamp":1779944572000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11533314\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,20]]},"references-count":85,"URL":"https:\/\/doi.org\/10.1109\/3dv69130.2026.00056","relation":{},"subject":[],"published":{"date-parts":[[2026,3,20]]}}}