{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T08:01:07Z","timestamp":1772006467493,"version":"3.50.1"},"reference-count":44,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"4","license":[{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Guangdong Provincial Educational Science Planning Project","award":["2025GXJK0629"],"award-info":[{"award-number":["2025GXJK0629"]}]},{"name":"Guangzhou Higher Education Teaching Research and Reform Project","award":["2024YBJG094"],"award-info":[{"award-number":["2024YBJG094"]}]},{"name":"Guangzhou Municipal Educational Science Planning Project","award":["202316577"],"award-info":[{"award-number":["202316577"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Robot. Autom. Lett."],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1109\/lra.2026.3662647","type":"journal-article","created":{"date-parts":[[2026,2,9]],"date-time":"2026-02-09T21:09:14Z","timestamp":1770671354000},"page":"4235-4242","source":"Crossref","is-referenced-by-count":0,"title":["ManiVID-3D: Generalizable View-Invariant Reinforcement Learning for Robotic Manipulation via Disentangled 3D Representations"],"prefix":"10.1109","volume":"11","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-7182-444X","authenticated-orcid":false,"given":"Zheng","family":"Li","sequence":"first","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"}]},{"given":"Pei","family":"Qu","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-7590-9647","authenticated-orcid":false,"given":"Yufei","family":"Jia","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}]},{"given":"Shihui","family":"Zhou","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8388-7193","authenticated-orcid":false,"given":"Haizhou","family":"Ge","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4338-4414","authenticated-orcid":false,"given":"Jiahang","family":"Cao","sequence":"additional","affiliation":[{"name":"The University of Hong Kong, Hong Kong SAR, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7282-4541","authenticated-orcid":false,"given":"Jinni","family":"Zhou","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3894-9858","authenticated-orcid":false,"given":"Guyue","family":"Zhou","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9405-8232","authenticated-orcid":false,"given":"Jun","family":"Ma","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Grasping deformable objects via reinforcement learning with cross-modal attention to visuo-tactile inputs","author":"Lee","year":"2025"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2021.01.077"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v39i14.33599"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/IROS60139.2025.11246691"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2019.2898330"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10610710"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2023.3259681"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.02575"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/IROS60139.2025.11247559"},{"key":"ref10","first-page":"30613","article-title":"Multi-view masked world models for visual robotic manipulation","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Seo","year":"2023"},{"key":"ref11","article-title":"RoboUniView: Visual-language model with unified view representation for robotic manipulation","author":"Liu","year":"2024"},{"key":"ref12","article-title":"Fast and robust: Task sampling with posterior and diversity synergies for adaptive decision-makers in randomized environments","author":"Qu","year":"2025"},{"key":"ref13","article-title":"RoboTwin 2.0: A scalable data generator and benchmark with strong domain randomization for robust bimanual robotic manipulation","author":"Chen","year":"2025"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.00169"},{"key":"ref15","first-page":"1815","article-title":"Learning to manipulate anywhere: A visual generalizable framework for reinforcement learning","volume-title":"Proc. Conf. Robot Learn.","author":"Yuan","year":"2025"},{"key":"ref16","first-page":"1173","article-title":"View-invariant policy learning via zero-shot novel view synthesis","volume-title":"Proc. Conf. Robot Learn.","author":"Tian","year":"2025"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2024.XX.067"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/iros60139.2025.11246340"},{"key":"ref20","first-page":"21507","article-title":"MoVie: Visual model-based policy adaptation for view generalization","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"36","author":"Yang","year":"2023"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-025-02472-w"},{"key":"ref22","first-page":"209","article-title":"RoVi-Aug: Robot and viewpoint augmentation for cross-embodiment robot learning","volume-title":"Proc. Conf. Robot Learn.","author":"Chen","year":"2025"},{"key":"ref23","first-page":"20393","article-title":"Spectrum random masking for generalization in image-based reinforcement learning","volume-title":"Proc. Adv. Neural Inform. Process. Syst.","volume":"35","author":"Huang","year":"2022"},{"key":"ref24","article-title":"Learning view-invariant world models for visual robotic manipulation","volume-title":"Proc. 13th Int. Conf. Learn. Representations","author":"Pang","year":"2025"},{"key":"ref25","first-page":"694","article-title":"RVT: Robotic view transformer for 3D object manipulation","volume-title":"Proc. Conf. Robot Learn.","author":"Goyal","year":"2023"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2024.3420937"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/s00138-025-01728-2"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/WACV61041.2025.00351"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/WACV56688.2023.00158"},{"key":"ref30","first-page":"67459","article-title":"Towards a unified framework of contrastive learning for disentangled representations","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"36","author":"Matthes","year":"2023"},{"key":"ref31","article-title":"Representation learning with contrastive predictive coding","author":"Oord","year":"2018"},{"key":"ref32","article-title":"DisDP: Robust imitation learning via disentangled diffusion policies","volume-title":"Proc. Reinforcement Learn. Conf.","author":"Vanjani","year":"2025"},{"key":"ref33","article-title":"Merging and disentangling views in visual reinforcement learning for robotic manipulation","author":"Almuzairee","year":"2025"},{"key":"ref34","article-title":"Multi-view disentanglement for reinforcement learning with multiple cameras","volume-title":"Proc. Reinforcement Learn. Conf.","author":"Dunion","year":"2024"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1287\/opre.21.5.1071"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.5555\/3524938.3525087"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.52202\/079017-2473"},{"key":"ref38","first-page":"594","article-title":"DexPoint: Generalizable point cloud reinforcement learning for sim-to-real dexterous manipulation","volume-title":"Proc. Conf. Robot Learn.","author":"Qin","year":"2023"},{"key":"ref39","article-title":"PointNet : Deep hierarchical feature learning on point sets in a metric space","volume-title":"Proc. Adv. Neural Inform. Process. Syst.","volume":"30","author":"Qi","year":"2017,"},{"key":"ref40","article-title":"ManiSkill3: GPU parallelized robotics simulation and rendering for generalizable embodied AI","author":"Tao","year":"2024"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6386109"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01111"},{"key":"ref43","article-title":"Spatial transformer networks","volume-title":"Proc. Adv. Neural Inform. Process. Syst.","volume":"28","author":"Jaderberg"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3070341"}],"container-title":["IEEE Robotics and Automation Letters"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/7083369\/11400564\/11386866.pdf?arnumber=11386866","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T07:04:55Z","timestamp":1772003095000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11386866\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4]]},"references-count":44,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.1109\/lra.2026.3662647","relation":{},"ISSN":["2377-3766","2377-3774"],"issn-type":[{"value":"2377-3766","type":"electronic"},{"value":"2377-3774","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,4]]}}}