{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T17:32:27Z","timestamp":1777656747104,"version":"3.51.4"},"publisher-location":"Cham","reference-count":113,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031198380","type":"print"},{"value":"9783031198397","type":"electronic"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-19839-7_25","type":"book-chapter","created":{"date-parts":[[2022,10,22]],"date-time":"2022-10-22T11:40:06Z","timestamp":1666438806000},"page":"424-443","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":45,"title":["Motion Inspired Unsupervised Perception and\u00a0Prediction in\u00a0Autonomous Driving"],"prefix":"10.1007","author":[{"given":"Mahyar","family":"Najibi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jingwei","family":"Ji","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yin","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Charles R.","family":"Qi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xinchen","family":"Yan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Scott","family":"Ettinger","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dragomir","family":"Anguelov","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,10,23]]},"reference":[{"key":"25_CR1","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1007\/978-3-642-15552-9_3","volume-title":"Computer Vision \u2013 ECCV 2010","author":"S Agarwal","year":"2010","unstructured":"Agarwal, S., Snavely, N., Seitz, S.M., Szeliski, R.: Bundle adjustment in the large. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010. LNCS, vol. 6312, pp. 29\u201342. Springer, Heidelberg (2010). https:\/\/doi.org\/10.1007\/978-3-642-15552-9_3"},{"key":"25_CR2","doi-asserted-by":"crossref","unstructured":"Bansal, M., Krizhevsky, A., Ogale, A.: ChauffeurNet: learning to drive by imitating the best and synthesizing the worst. arXiv preprint arXiv:1812.03079 (2018)","DOI":"10.15607\/RSS.2019.XV.031"},{"key":"25_CR3","unstructured":"Bau, D., et al.: GAN dissection: visualizing and understanding generative adversarial networks. In: ICLR (2019)"},{"key":"25_CR4","unstructured":"Besl, P.J., McKay, N.D.: Method for registration of 3-D shapes. In: Schenker, P.S. (eds.) Sensor Fusion IV: Ccontrol Paradigms and data Structures. vol. 1611, pp. 586\u2013606. SPIE, Bellingham Wash (1992)"},{"key":"25_CR5","unstructured":"Bewley, A., Sun, P., Mensink, T., Anguelov, D., Sminchisescu, C.: Range conditioned dilated convolutions for scale invariant 3D object detection (2020)"},{"key":"25_CR6","doi-asserted-by":"crossref","unstructured":"Caesar, H., et al.: Nuscenes: a multimodal dataset for autonomous driving. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01164"},{"key":"25_CR7","unstructured":"Caine, B., et al.: Pseudo-labeling for scalable 3D object detection. arXiv preprint arXiv:2103.02093 (2021)"},{"key":"25_CR8","unstructured":"Casas, S., Luo, W., Urtasun, R.: IntentNet: learning to predict intention from raw sensor data. In: CoRL (2018)"},{"key":"25_CR9","doi-asserted-by":"crossref","unstructured":"Cen, J., Yun, P., Cai, J., Wang, M.Y., Liu, M.: Open-set 3D object detection. In: 3DV (2021)","DOI":"10.1109\/3DV53792.2021.00095"},{"key":"25_CR10","unstructured":"Chai, Y., Sapp, B., Bansal, M., Anguelov, D.: Multipath: Multiple probabilistic anchor trajectory hypotheses for behavior prediction. In: CoRL (2019)"},{"key":"25_CR11","doi-asserted-by":"crossref","unstructured":"Chang, M.F., et al.: Argoverse: 3D tracking and forecasting with rich maps. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.00895"},{"key":"25_CR12","doi-asserted-by":"crossref","unstructured":"Chen, Y., Liu, S., Shen, X., Jia, J.: Fast point r-CNN. In: ICCV (2019)","DOI":"10.1109\/ICCV.2019.00987"},{"issue":"3","key":"25_CR13","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1016\/0262-8856(92)90066-C","volume":"10","author":"Y Chen","year":"1992","unstructured":"Chen, Y., Medioni, G.: Object modelling by registration of multiple range images. Image Vis. Comput. 10(3), 145\u2013155 (1992)","journal-title":"Image Vis. Comput."},{"key":"25_CR14","doi-asserted-by":"crossref","unstructured":"Chen, Y., et al.: GeoSim: realistic video simulation via geometry-aware composition for self-driving. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00715"},{"key":"25_CR15","doi-asserted-by":"crossref","unstructured":"Cho, M., Kwak, S., Schmid, C., Ponce, J.: Unsupervised object discovery and localization in the wild: Part-based matching with bottom-up region proposals. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298724"},{"key":"25_CR16","doi-asserted-by":"crossref","unstructured":"Cui, H., et al.: Multimodal trajectory predictions for autonomous driving using deep convolutional networks. In: ICRA (2019)","DOI":"10.1109\/ICRA.2019.8793868"},{"key":"25_CR17","unstructured":"Deng, B., Qi, C.R., Najibi, M., Funkhouser, T., Zhou, Y., Anguelov, D.: Revisiting 3D object detection from an egocentric perspective. In: NeurIPS (2021)"},{"key":"25_CR18","doi-asserted-by":"crossref","unstructured":"Dewan, A., Caselitz, T., Tipaldi, G.D., Burgard, W.: Motion-based detection and tracking in 3D lidar scans. In: ICRA (2016)","DOI":"10.1109\/ICRA.2016.7487649"},{"key":"25_CR19","unstructured":"Djuric, N., et al.: Short-term motion prediction of traffic actors for autonomous driving using deep convolutional networks (2018)"},{"key":"25_CR20","doi-asserted-by":"crossref","unstructured":"Duggal, S., et al.: Mending neural implicit modeling for 3D vehicle reconstruction in the wild. In: WACV (2022)","DOI":"10.1109\/WACV51458.2022.00035"},{"key":"25_CR21","doi-asserted-by":"crossref","unstructured":"Engelcke, M., Rao, D., Wang, D.Z., Tong, C.H., Posner, I.: Vote3deep: fast object detection in 3D point clouds using efficient convolutional neural networks. In: ICRA (2017)","DOI":"10.1109\/ICRA.2017.7989161"},{"key":"25_CR22","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"219","DOI":"10.1007\/978-3-319-45886-1_18","volume-title":"Pattern Recognition","author":"F Engelmann","year":"2016","unstructured":"Engelmann, F., St\u00fcckler, J., Leibe, B.: Joint object pose estimation and shape reconstruction in urban street scenes using 3D shape priors. In: Rosenhahn, B., Andres, B. (eds.) GCPR 2016. LNCS, vol. 9796, pp. 219\u2013230. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-45886-1_18"},{"key":"25_CR23","doi-asserted-by":"crossref","unstructured":"Engelmann, F., St\u00fcckler, J., Leibe, B.: SAMP: shape and motion priors for 4d vehicle reconstruction. In: WACV (2017)","DOI":"10.1109\/WACV.2017.51"},{"key":"25_CR24","unstructured":"Ester, M., et al.: A density-based algorithm for discovering clusters in large spatial databases with noise. In: KDD (1996)"},{"key":"25_CR25","doi-asserted-by":"crossref","unstructured":"Ettinger, S., et al.: Large scale interactive motion forecasting for autonomous driving: the Waymo open motion dataset. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00957"},{"key":"25_CR26","doi-asserted-by":"crossref","unstructured":"Faktor, A., Irani, M.: \u201cClustering by composition\"-unsupervised discovery of image categories. In: ECCV (2012)","DOI":"10.1007\/978-3-642-33786-4_35"},{"key":"25_CR27","doi-asserted-by":"crossref","unstructured":"Fan, L., Xiong, X., Wang, F., Wang, N., Zhang, Z.: RangeDet: in defense of range view for lidar-based 3D object detection. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00291"},{"key":"25_CR28","doi-asserted-by":"crossref","unstructured":"Gao, J., et al.: Encoding HD maps and agent dynamics from vectorized representation. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01154"},{"key":"25_CR29","unstructured":"Grauman, K., Darrell, T.: Unsupervised learning of categories from sets of partially matching image features. In: CVPR (2006)"},{"key":"25_CR30","doi-asserted-by":"crossref","unstructured":"Gro\u00df, J., O\u0161ep, A., Leibe, B.: AlignNet-3D: fast point cloud registration of partially observed objects. In: 3DV (2019)","DOI":"10.1109\/3DV.2019.00074"},{"key":"25_CR31","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1007\/978-3-030-58558-7_17","volume-title":"Computer Vision \u2013 ECCV 2020","author":"J Gu","year":"2020","unstructured":"Gu, J., et al.: Weakly-supervised 3D shape completion in the wild. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12350, pp. 283\u2013299. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58558-7_17"},{"key":"25_CR32","doi-asserted-by":"crossref","unstructured":"Gu, J., Sun, C., Zhao, H.: DenseTNT: end-to-end trajectory prediction from dense goal sets. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.01502"},{"key":"25_CR33","doi-asserted-by":"crossref","unstructured":"Gu, X., Wang, Y., Wu, C., Lee, Y.J., Wang, P.: HplflowNet: hierarchical permutohedral lattice flowNet for scene flow estimation on large-scale point clouds. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.00337"},{"key":"25_CR34","doi-asserted-by":"crossref","unstructured":"He, C., Zeng, H., Huang, J., Hua, X.S., Zhang, L.: Structure aware single-stage 3D object detection from point cloud. In: CVPR, June 2020","DOI":"10.1109\/CVPR42600.2020.01189"},{"key":"25_CR35","doi-asserted-by":"crossref","unstructured":"Hong, J., Sapp, B., Philbin, J.: Rules of the road: Predicting driving behavior with a convolutional model of semantic interactions. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.00865"},{"key":"25_CR36","unstructured":"Houston, J., et al.: One thousand and one hours: Self-driving motion prediction dataset. arXiv preprint arXiv:2006.14480 (2020)"},{"key":"25_CR37","unstructured":"Insafutdinov, E., Dosovitskiy, A.: Unsupervised learning of shape and pose with differentiable point clouds. In: NeurIPS (2018)"},{"key":"25_CR38","doi-asserted-by":"crossref","unstructured":"Izadi, S., et al.: KinectFusion: real-time 3D reconstruction and interaction using a moving depth camera. In: Proceedings of the 24th Annual ACM Symposium on User Interface Software and Technology. pp. 559\u2013568 (2011)","DOI":"10.1145\/2047196.2047270"},{"key":"25_CR39","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1007\/978-3-319-46478-7_12","volume-title":"Computer Vision \u2013 ECCV 2016","author":"KR Jerripothula","year":"2016","unstructured":"Jerripothula, K.R., Cai, J., Yuan, J.: CATS: co-saliency activated tracklet selection for video co-localization. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9911, pp. 187\u2013202. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46478-7_12"},{"key":"25_CR40","doi-asserted-by":"crossref","unstructured":"Joulin, A., Bach, F., Ponce, J.: Discriminative clustering for image co-segmentation. In: CVPR (2010)","DOI":"10.1109\/CVPR.2010.5539868"},{"issue":"2","key":"25_CR41","doi-asserted-by":"publisher","first-page":"1589","DOI":"10.1109\/LRA.2021.3139542","volume":"7","author":"P Jund","year":"2022","unstructured":"Jund, P., Sweeney, C., Abdo, N., Chen, Z., Shlens, J.: Scalable scene flow from point clouds in the real world. IEEE Rob. Autom. Lett. 7(2), 1589\u20131596 (2022). https:\/\/doi.org\/10.1109\/LRA.2021.3139542","journal-title":"IEEE Rob. Autom. Lett."},{"key":"25_CR42","unstructured":"Kim, G., Torralba, A.: Unsupervised detection of regions of interest using iterative link analysis. In: NIPS (2009)"},{"key":"25_CR43","doi-asserted-by":"crossref","unstructured":"Lang, A.H., Vora, S., Caesar, H., Zhou, L., Yang, J., Beijbom, O.: Pointpillars: fast encoders for object detection from point clouds. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.01298"},{"key":"25_CR44","doi-asserted-by":"crossref","unstructured":"Lee, H., Grosse, R., Ranganath, R., Ng, A.Y.: Convolutional deep belief networks for scalable unsupervised learning of hierarchical representations. In: ICML (2009)","DOI":"10.1145\/1553374.1553453"},{"key":"25_CR45","unstructured":"Li, X., Pontes, J.K., Lucey, S.: Neural scene flow prior. In: NeurIPS (2021)"},{"key":"25_CR46","doi-asserted-by":"crossref","unstructured":"Li, Z., Wang, F., Wang, N.: Lidar r-CNN: An efficient and universal 3d object detector. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00746"},{"key":"25_CR47","doi-asserted-by":"crossref","unstructured":"Liu, X., Qi, C.R., Guibas, L.J.: Flownet3d: learning scene flow in 3d point clouds. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.00062"},{"key":"25_CR48","doi-asserted-by":"crossref","unstructured":"Liu, Y., et al.: Opening up open-world tracking. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.01846"},{"key":"25_CR49","doi-asserted-by":"crossref","unstructured":"Liu, Y., Zhang, J., Fang, L., Jiang, Q., Zhou, B.: Multimodal motion prediction with stacked transformers. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00749"},{"key":"25_CR50","doi-asserted-by":"crossref","unstructured":"Luo, C., Yang, X., Yuille, A.: Self-supervised pillar motion learning for autonomous driving. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00320"},{"key":"25_CR51","doi-asserted-by":"crossref","unstructured":"Luo, W., Yang, B., Urtasun, R.: Fast and furious: Real time end-to-end 3d detection, tracking and motion forecasting with a single convolutional net. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00376"},{"key":"25_CR52","doi-asserted-by":"crossref","unstructured":"Manivasagam, S., et al.: LiDARSim: realistic lidar simulation by leveraging the real world. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01118"},{"key":"25_CR53","doi-asserted-by":"crossref","unstructured":"Meyer, G.P., Laddha, A., Kee, E., Vallespi-Gonzalez, C., Wellington, C.K.: LaserNet: an efficient probabilistic 3D object detector for autonomous driving. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.01296"},{"key":"25_CR54","doi-asserted-by":"crossref","unstructured":"Misra, I., Girdhar, R., Joulin, A.: An end-to-end transformer model for 3D object detection. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00290"},{"key":"25_CR55","doi-asserted-by":"crossref","unstructured":"Mittal, H., Okorn, B., Held, D.: Just go with the flow: self-supervised scene flow estimation. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01119"},{"key":"25_CR56","doi-asserted-by":"crossref","unstructured":"Najibi, M., et al.: DOPS: learning to detect 3D objects and predict their 3D shapes. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01193"},{"key":"25_CR57","doi-asserted-by":"crossref","unstructured":"Pang, Z., Li, Z., Wang, N.: Model-free vehicle tracking and state estimation in point cloud sequences. In: IROS (2021)","DOI":"10.1109\/IROS51168.2021.9636202"},{"key":"25_CR58","doi-asserted-by":"crossref","unstructured":"Phan-Minh, T., Grigore, E.C., Boulton, F.A., Beijbom, O., Wolff, E.M.: CoverNet: Multimodal behavior prediction using trajectory sets. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01408"},{"key":"25_CR59","doi-asserted-by":"publisher","unstructured":"Pontes, J.K., Hays, J., Lucey, S.: Scene flow from point clouds with or without learning. In: 2020 International Conference on 3D Vision (3DV). pp. 261\u2013270 (2020). https:\/\/doi.org\/10.1109\/3DV50981.2020.00036","DOI":"10.1109\/3DV50981.2020.00036"},{"key":"25_CR60","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"527","DOI":"10.1007\/978-3-030-58604-1_32","volume-title":"Computer Vision \u2013 ECCV 2020","author":"G Puy","year":"2020","unstructured":"Puy, G., Boulch, A., Marlet, R.: FLOT: scene flow on point clouds guided by optimal transport. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12373, pp. 527\u2013544. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58604-1_32"},{"key":"25_CR61","doi-asserted-by":"crossref","unstructured":"Qi, C.R., Litany, O., He, K., Guibas, L.J.: Deep Hough voting for 3D object detection in point clouds. In: ICCV (2019)","DOI":"10.1109\/ICCV.2019.00937"},{"key":"25_CR62","doi-asserted-by":"crossref","unstructured":"Qi, C.R., et al.: Offboard 3D object detection from point cloud sequences. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00607"},{"key":"25_CR63","unstructured":"Radford, A., Metz, L., Chintala, S.: Unsupervised representation learning with deep convolutional generative adversarial networks. In: ICLR (2015)"},{"key":"25_CR64","unstructured":"Rusinkiewicz, S., Levoy, M.: Efficient variants of the ICP algorithm. In: Proceedings Third International Conference on 3-D Digital Imaging and Modeling, pp. 145\u2013152. IEEE (2001)"},{"key":"25_CR65","unstructured":"Russell, B.C., Freeman, W.T., Efros, A.A., Sivic, J., Zisserman, A.: Using multiple segmentations to discover objects and their extent in image collections. In: CVPR (2006)"},{"key":"25_CR66","doi-asserted-by":"crossref","unstructured":"Sch\u00f6nberger, J.L., Frahm, J.M.: Structure-from-motion revisited. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.445"},{"key":"25_CR67","doi-asserted-by":"crossref","unstructured":"Shi, S., et al.: PV-RCNN: point-voxel feature set abstraction for 3D object detection. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01054"},{"key":"25_CR68","doi-asserted-by":"crossref","unstructured":"Shi, S., Wang, X., Li, H.: PointRCNN : 3D object proposal generation and detection from point cloud. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.00086"},{"key":"25_CR69","doi-asserted-by":"crossref","unstructured":"Shi, W., Rajkumar, R.R.: Point-GNN: graph neural network for 3D object detection in a point cloud. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00178"},{"key":"25_CR70","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1007\/978-3-030-11009-3_11","volume-title":"Computer Vision \u2013 ECCV 2018 Workshops","author":"M Simon","year":"2019","unstructured":"Simon, M., Milz, S., Amende, K., Gross, H.-M.: Complex-YOLO: an Euler-region-proposal for real-time 3D object detection on point clouds. In: Leal-Taix\u00e9, L., Roth, S. (eds.) ECCV 2018. LNCS, vol. 11129, pp. 197\u2013209. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-11009-3_11"},{"key":"25_CR71","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"385","DOI":"10.1007\/978-3-642-03767-2_47","volume-title":"Computer Analysis of Images and Patterns","author":"S Xia","year":"2009","unstructured":"Xia, S., Hancock, E.R.: Graph-based object class discovery. In: Jiang, X., Petkov, N. (eds.) CAIP 2009. LNCS, vol. 5702, pp. 385\u2013393. Springer, Heidelberg (2009). https:\/\/doi.org\/10.1007\/978-3-642-03767-2_47"},{"key":"25_CR72","unstructured":"Sohn, K., Zhou, G., Lee, C., Lee, H.: Learning and selecting features jointly with point-wise gated boltzmann machines. In: ICML (2013)"},{"key":"25_CR73","doi-asserted-by":"crossref","unstructured":"Song, S., Xiao, J.: Deep sliding shapes for Amodal 3D object detection in RGB-D images images. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.94"},{"key":"25_CR74","doi-asserted-by":"crossref","unstructured":"Stutz, D., Geiger, A.: Learning 3d shape completion from laser scan data with weak supervision. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00209"},{"key":"25_CR75","doi-asserted-by":"crossref","unstructured":"Sun, P., et al.: Scalability in perception for autonomous driving: Waymo open dataset. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00252"},{"key":"25_CR76","doi-asserted-by":"crossref","unstructured":"Sun, P., et al.: RSN: range sparse net for efficient, accurate lidar 3d object detection. In: CVPR, pp. 5725\u20135734 (2021)","DOI":"10.1109\/CVPR46437.2021.00567"},{"key":"25_CR77","unstructured":"Tang, C., Tan, P.: Ba-Net: dense bundle adjustment network. In: ICLR (2019)"},{"key":"25_CR78","doi-asserted-by":"crossref","unstructured":"Tian, H., Chen, Y., Dai, J., Zhang, Z., Zhu, X.: Unsupervised object detection with lidar clues. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00590"},{"key":"25_CR79","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"298","DOI":"10.1007\/3-540-44480-7_21","volume-title":"Vision Algorithms: Theory and Practice","author":"B Triggs","year":"2000","unstructured":"Triggs, B., McLauchlan, P.F., Hartley, R.I., Fitzgibbon, A.W.: Bundle adjustment \u2014 a modern synthesis. In: Triggs, B., Zisserman, A., Szeliski, R. (eds.) IWVA 1999. LNCS, vol. 1883, pp. 298\u2013372. Springer, Heidelberg (2000). https:\/\/doi.org\/10.1007\/3-540-44480-7_21"},{"key":"25_CR80","doi-asserted-by":"crossref","unstructured":"Tulsiani, S., Efros, A.A., Malik, J.: Multi-view consistency as supervisory signal for learning shape and pose prediction. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00306"},{"key":"25_CR81","doi-asserted-by":"crossref","unstructured":"Tulsiani, S., Zhou, T., Efros, A.A., Malik, J.: Multi-view supervision for single-view reconstruction via differentiable ray consistency. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.30"},{"key":"25_CR82","doi-asserted-by":"crossref","unstructured":"Ummenhofer, B., et al.: Demon: depth and motion network for learning monocular stereo. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.596"},{"key":"25_CR83","doi-asserted-by":"crossref","unstructured":"Varadarajan, B., et al.: Multipath++: efficient information fusion and trajectory aggregation for behavior prediction. CoRR arXiv:2111.14973 (2021)","DOI":"10.1109\/ICRA46639.2022.9812107"},{"key":"25_CR84","doi-asserted-by":"crossref","unstructured":"Vo, H.V., et al.: Unsupervised image matching and object discovery as optimization. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.00848"},{"key":"25_CR85","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"779","DOI":"10.1007\/978-3-030-58592-1_46","volume-title":"Computer Vision \u2013 ECCV 2020","author":"HV Vo","year":"2020","unstructured":"Vo, H.V., P\u00e9rez, P., Ponce, J.: Toward unsupervised, multi-object discovery in large-scale image collections. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12368, pp. 779\u2013795. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58592-1_46"},{"key":"25_CR86","unstructured":"Vo, V.H., Sizikova, E., Schmid, C., P\u00e9rez, P., Ponce, J.: Large-scale unsupervised object discovery. In: NeurIPS (2021)"},{"key":"25_CR87","unstructured":"Wang, D.Z., Posner, I.: Voting for voting in online point cloud object detection. In: Proceedings of Robotics: Science and Systems. Rome, Italy, July 2015"},{"key":"25_CR88","doi-asserted-by":"crossref","unstructured":"Wang, R., Yang, N., St\u00fcckler, J., Cremers, D.: Directshape: direct photometric alignment of shape priors for visual vehicle pose and shape estimation. In: ICRA (2020)","DOI":"10.1109\/ICRA40945.2020.9197095"},{"key":"25_CR89","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1007\/978-3-030-58542-6_2","volume-title":"Computer Vision \u2013 ECCV 2020","author":"Y Wang","year":"2020","unstructured":"Wang, Y., et al.: Pillar-based object detection for autonomous driving. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12367, pp. 18\u201334. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58542-6_2"},{"key":"25_CR90","doi-asserted-by":"crossref","unstructured":"Wang, Y., Solomon, J.M.: Deep closest point: Learning representations for point cloud registration. In: ICCV (2019)","DOI":"10.1109\/ICCV.2019.00362"},{"key":"25_CR91","doi-asserted-by":"crossref","unstructured":"Wang, Z., Li, S., Howard-Jenkins, H., Prisacariu, V., Chen, M.: Flownet3d++: Geometric losses for deep scene flow estimation. In: WACV (2020)","DOI":"10.1109\/WACV45572.2020.9093302"},{"key":"25_CR92","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"230","DOI":"10.1007\/978-3-030-58452-8_14","volume-title":"Computer Vision \u2013 ECCV 2020","author":"X Wei","year":"2020","unstructured":"Wei, X., Zhang, Y., Li, Z., Fu, Y., Xue, X.: DeepSFM: structure from motion via deep bundle adjustment. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12346, pp. 230\u2013247. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_14"},{"key":"25_CR93","unstructured":"Weng, X., Kitani, K.: A baseline for 3D multi-object tracking. arXiv preprint arXiv:1907.03961 (2019)"},{"key":"25_CR94","unstructured":"Wong, K., Wang, S., Ren, M., Liang, M., Urtasun, R.: Identifying unknown instances for autonomous driving. In: CoRL. PMLR (2020)"},{"key":"25_CR95","doi-asserted-by":"crossref","unstructured":"Wu, P., Chen, S., Metaxas, D.N.: MotionNet: joint perception and motion prediction for autonomous driving based on bird\u2019s eye view maps. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01140"},{"key":"25_CR96","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"88","DOI":"10.1007\/978-3-030-58558-7_6","volume-title":"Computer Vision \u2013 ECCV 2020","author":"W Wu","year":"2020","unstructured":"Wu, W., Wang, Z.Y., Li, Z., Liu, W., Fuxin, L.: PointPWC-Net: cost volume on point clouds for (Self-)supervised scene flow estimation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12350, pp. 88\u2013107. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58558-7_6"},{"key":"25_CR97","doi-asserted-by":"crossref","unstructured":"Yan, X., et al.: Learning 6-DOF grasping interaction via deep geometry-aware 3D representations. In: ICRA (2018)","DOI":"10.1109\/ICRA.2018.8460609"},{"key":"25_CR98","unstructured":"Yan, X., Yang, J., Yumer, E., Guo, Y., Lee, H.: Perspective transformer nets: Learning single-view 3D object reconstruction without 3D supervision. In: NIPS (2016)"},{"key":"25_CR99","unstructured":"Yang, B., Bai, M., Liang, M., Zeng, W., Urtasun, R.: Auto4d: learning to label 4D objects from sequential point clouds. arXiv preprint arXiv:2101.06586 (2021)"},{"key":"25_CR100","doi-asserted-by":"crossref","unstructured":"Yang, B., Luo, W., Urtasun, R.: PIXOR: real-time 3D object detection from point clouds. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00798"},{"issue":"2","key":"25_CR101","doi-asserted-by":"publisher","first-page":"314","DOI":"10.1109\/TRO.2020.3033695","volume":"37","author":"H Yang","year":"2020","unstructured":"Yang, H., Shi, J., Carlone, L.: Teaser: fast and certifiable point cloud registration. IEEE Trans. Rob. 37(2), 314\u2013333 (2020)","journal-title":"IEEE Trans. Rob."},{"key":"25_CR102","doi-asserted-by":"crossref","unstructured":"Yang, Z., Sun, Y., Liu, S., Jia, J.: 3DSSD: point-based 3D single stage object detector. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01105"},{"key":"25_CR103","doi-asserted-by":"crossref","unstructured":"Ye, M., Xu, S., Cao, T.: HvNet: hybrid voxel network for lidar based 3d object detection. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00170"},{"key":"25_CR104","doi-asserted-by":"crossref","unstructured":"Ye, M., Cao, T., Chen, Q.: TPCN: temporal point cloud networks for motion forecasting. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.01116"},{"key":"25_CR105","unstructured":"Yuan, J., Liu, Z., Wu, Y.: Discriminative subvolume search for efficient action detection. In: CVPR (2009)"},{"key":"25_CR106","doi-asserted-by":"crossref","unstructured":"Yuan, Y., Weng, X., Ou, Y., Kitani, K.M.: AgentFormer: agent-aware transformers for socio-temporal multi-agent forecasting. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00967"},{"key":"25_CR107","doi-asserted-by":"crossref","unstructured":"Zakharov, S., Kehl, W., Bhargava, A., Gaidon, A.: Autolabeling 3D objects with differentiable rendering of SDF shape priors. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01224"},{"key":"25_CR108","doi-asserted-by":"crossref","unstructured":"Zeng, W., et al.: End-to-end interpretable neural motion planner. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.00886"},{"key":"25_CR109","doi-asserted-by":"crossref","unstructured":"Zheng, W., Tang, W., Jiang, L., Fu, C.W.: SE-SSD: self-ensembling single-stage object detector from point cloud. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.01426"},{"key":"25_CR110","doi-asserted-by":"crossref","unstructured":"Zhou, T., Brown, M., Snavely, N., Lowe, D.G.: Unsupervised learning of depth and ego-motion from video. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.700"},{"key":"25_CR111","unstructured":"Zhou, Y., et al.: End-to-end multi-view fusion for 3D object detection in lidar point clouds. In: CoRL (2020)"},{"key":"25_CR112","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Tuzel, O.: VoxelNet: end-to-end learning for point cloud based 3D object detection. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00472"},{"key":"25_CR113","doi-asserted-by":"crossref","unstructured":"Zhu, R., Kiani Galoogahi, H., Wang, C., Lucey, S.: Rethinking reprojection: closing the loop for pose-aware shape reconstruction from a single image. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.16"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2022"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-19839-7_25","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,7]],"date-time":"2024-03-07T12:25:57Z","timestamp":1709814357000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-19839-7_25"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031198380","9783031198397"],"references-count":113,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-19839-7_25","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"23 October 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Tel Aviv","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Israel","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 October 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 October 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2022.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5804","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1645","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"28% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.21","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.91","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}