{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,15]],"date-time":"2026-01-15T22:44:01Z","timestamp":1768517041541,"version":"3.49.0"},"reference-count":38,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,5,13]],"date-time":"2024-05-13T00:00:00Z","timestamp":1715558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,5,13]],"date-time":"2024-05-13T00:00:00Z","timestamp":1715558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,5,13]]},"DOI":"10.1109\/icra57147.2024.10610376","type":"proceedings-article","created":{"date-parts":[[2024,8,8]],"date-time":"2024-08-08T17:51:05Z","timestamp":1723139465000},"page":"12436-12442","source":"Crossref","is-referenced-by-count":4,"title":["CrossVideo: Self-supervised Cross-modal Contrastive Learning for Point Cloud Video Understanding"],"prefix":"10.1109","author":[{"given":"Yunze","family":"Liu","sequence":"first","affiliation":[{"name":"Tsinghua University"}]},{"given":"Changxi","family":"Chen","sequence":"additional","affiliation":[{"name":"Tsinghua University"}]},{"given":"Zifan","family":"Wang","sequence":"additional","affiliation":[{"name":"Tsinghua University"}]},{"given":"Li","family":"Yi","sequence":"additional","affiliation":[{"name":"Tsinghua University"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01398"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19818-2_2"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01154"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00114"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01694"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.02034"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00319"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00934"},{"key":"ref9","article-title":"Pointnet++: Deep hierarchical feature learning on point sets in a metric space","volume":"30","author":"Qi","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref10","article-title":"Pstnet: Point spatio-temporal convolution on point cloud sequences","author":"Fan","year":"2022"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00975"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"ref13","article-title":"Contrastive self-supervised sequential recommendation with robust augmentation","author":"Liu","year":"2021"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20086-1_35"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01871"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00836"},{"key":"ref17","article-title":"P4contrast: Contrastive learning with pairs of point-pixel pairs for rgb-d scene understanding","author":"Liu","year":"2020"},{"key":"ref18","first-page":"6027","article-title":"Learning physical graph representations from visual scenes","volume":"33","author":"Bear","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00964"},{"key":"ref20","first-page":"27061","article-title":"Point-m2ae: multi-scale masked autoencoders for hierarchical point cloud pre-training","volume":"35","author":"Zhang","year":"2022","journal-title":"Advances in neural information processing systems"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58580-8_34"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/iccv48922.2021.00327"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01009"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00827"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01533"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19824-3_32"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00647"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.73"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01101"},{"key":"ref30","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"International conference on machine learning","author":"Radford"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01229"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19836-6_36"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00967"},{"key":"ref34","article-title":"VideoMAE: Masked autoencoders are data-efficient learners for self-supervised video pretraining","author":"Tong","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00369"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3021756"},{"key":"ref37","article-title":"Asformer: Transformer for action segmentation","author":"Yi","year":"2021"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"}],"event":{"name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","location":"Yokohama, Japan","start":{"date-parts":[[2024,5,13]]},"end":{"date-parts":[[2024,5,17]]}},"container-title":["2024 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10609961\/10609862\/10610376.pdf?arnumber=10610376","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,10]],"date-time":"2024-08-10T05:48:19Z","timestamp":1723268899000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10610376\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,13]]},"references-count":38,"URL":"https:\/\/doi.org\/10.1109\/icra57147.2024.10610376","relation":{},"subject":[],"published":{"date-parts":[[2024,5,13]]}}}