{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T20:49:16Z","timestamp":1775076556343,"version":"3.50.1"},"publisher-location":"Cham","reference-count":87,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031730290","type":"print"},{"value":"9783031730306","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,11,24]],"date-time":"2024-11-24T00:00:00Z","timestamp":1732406400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,24]],"date-time":"2024-11-24T00:00:00Z","timestamp":1732406400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-73030-6_27","type":"book-chapter","created":{"date-parts":[[2024,11,25]],"date-time":"2024-11-25T16:58:35Z","timestamp":1732553915000},"page":"484-503","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["SAMFusion: Sensor-Adaptive Multimodal Fusion for\u00a03D Object Detection in\u00a0Adverse Weather"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-2948-5368","authenticated-orcid":false,"given":"Edoardo","family":"Palladin","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0006-1337-0205","authenticated-orcid":false,"given":"Roland","family":"Dietze","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0007-7097-6227","authenticated-orcid":false,"given":"Praveen","family":"Narayanan","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2676-9833","authenticated-orcid":false,"given":"Mario","family":"Bijelic","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8054-9823","authenticated-orcid":false,"given":"Felix","family":"Heide","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,24]]},"reference":[{"key":"27_CR1","doi-asserted-by":"crossref","unstructured":"Bai, X., et al.: TransFusion: robust lidar-camera fusion for 3D object detection with transformers. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1090\u20131099 (2022)","DOI":"10.1109\/CVPR52688.2022.00116"},{"key":"27_CR2","unstructured":"Baumann, N., et al.: CR3DT: camera-radar fusion for 3D detection and tracking. arXiv preprint arXiv:2403.15313 (2024)"},{"key":"27_CR3","doi-asserted-by":"crossref","unstructured":"Bijelic, M., et al.: Seeing through fog without seeing fog: deep multimodal sensor fusion in unseen adverse weather. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11682\u201311692 (2020)","DOI":"10.1109\/CVPR42600.2020.01170"},{"key":"27_CR4","doi-asserted-by":"crossref","unstructured":"Bijelic, M., Gruber, T., Ritter, W.: A benchmark for lidar sensors in fog: is detection breaking down? In: 2018 IEEE Intelligent Vehicles Symposium (IV), pp. 760\u2013767. IEEE (2018)","DOI":"10.1109\/IVS.2018.8500543"},{"key":"27_CR5","doi-asserted-by":"crossref","unstructured":"Bijelic, M., Gruber, T., Ritter, W.: Benchmarking image sensors under adverse weather conditions for autonomous driving. In: 2018 IEEE Intelligent Vehicles Symposium (IV), pp. 1773\u20131779. IEEE (2018)","DOI":"10.1109\/IVS.2018.8500659"},{"key":"27_CR6","doi-asserted-by":"crossref","unstructured":"Brazil, G., Liu, X.: M3D-RPN: monocular 3D region proposal network for object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9287\u20139296 (2019)","DOI":"10.1109\/ICCV.2019.00938"},{"key":"27_CR7","doi-asserted-by":"crossref","unstructured":"Broedermann, T., Sakaridis, C., Dai, D., Van\u00a0Gool, L.: HRFuser: a multi-resolution sensor fusion architecture for 2D object detection. In: IEEE International Conference on Intelligent Transportation Systems (ITSC) (2023)","DOI":"10.1109\/ITSC57777.2023.10422432"},{"key":"27_CR8","doi-asserted-by":"crossref","unstructured":"Caesar, H., et al.: nuScenes: a multimodal dataset for autonomous driving. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11621\u201311631 (2020)","DOI":"10.1109\/CVPR42600.2020.01164"},{"key":"27_CR9","unstructured":"Cai, H., Zhang, Z., Zhou, Z., Li, Z., Ding, W., Zhao, J.: BEVFusion4D: learning lidar-camera fusion under bird\u2019s-eye-view via cross-modality guidance and temporal aggregation. arXiv preprint arXiv:2303.17099 (2023)"},{"issue":"5","key":"27_CR10","doi-asserted-by":"publisher","first-page":"1483","DOI":"10.1109\/TPAMI.2019.2956516","volume":"43","author":"Z Cai","year":"2019","unstructured":"Cai, Z., Vasconcelos, N.: Cascade R-CNN: high quality object detection and instance segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 43(5), 1483\u20131498 (2019)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"27_CR11","doi-asserted-by":"publisher","first-page":"213","DOI":"10.1007\/978-3-030-58452-8_13","volume-title":"Computer Vision \u2013 ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part I","author":"N Carion","year":"2020","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) Computer Vision \u2013 ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part I, pp. 213\u2013229. Springer International Publishing, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_13"},{"key":"27_CR12","doi-asserted-by":"crossref","unstructured":"Chen, X., Ma, H., Wan, J., Li, B., Xia, T.: Multi-view 3D object detection network for autonomous driving. In: Proceedings of the IEEE conference on Computer Vision and Pattern Recognition, pp. 1907\u20131915 (2017)","DOI":"10.1109\/CVPR.2017.691"},{"key":"27_CR13","doi-asserted-by":"crossref","unstructured":"Chen, X., Zhang, T., Wang, Y., Wang, Y., Zhao, H.: FUTR3D: a unified sensor fusion framework for 3D detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 172\u2013181 (2023)","DOI":"10.1109\/CVPRW59228.2023.00022"},{"key":"27_CR14","doi-asserted-by":"crossref","unstructured":"Chen, Y., Li, Y., Zhang, X., Sun, J., Jia, J.: Focal sparse convolutional networks for 3D object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5428\u20135437 (2022)","DOI":"10.1109\/CVPR52688.2022.00535"},{"key":"27_CR15","doi-asserted-by":"crossref","unstructured":"Chen, Y., Liu, J., Zhang, X., Qi, X., Jia, J.: LargeKernel3D: scaling up kernels in 3D sparse CNNs. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13488\u201313498 (2023)","DOI":"10.1109\/CVPR52729.2023.01296"},{"key":"27_CR16","doi-asserted-by":"crossref","unstructured":"Chen, Y., Liu, J., Zhang, X., Qi, X., Jia, J.: VoxelNext: fully sparse VoxelNet for 3D object detection and tracking. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 21674\u201321683 (2023)","DOI":"10.1109\/CVPR52729.2023.02076"},{"key":"27_CR17","unstructured":"Contributors, M.: MMDetection3D: OpenMMLab next-generation platform for general 3D object detection. https:\/\/github.com\/open-mmlab\/mmdetection3d (2020)"},{"key":"27_CR18","doi-asserted-by":"crossref","unstructured":"Diaz-Ruiz, C.A., et\u00a0al.: Ithaca365: dataset and driving perception under repeated and challenging weather conditions. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 21383\u201321392 (2022)","DOI":"10.1109\/CVPR52688.2022.02069"},{"key":"27_CR19","doi-asserted-by":"crossref","unstructured":"Ge, C., et al.: MetaBEV: solving sensor failures for BEV detection and map segmentation. arXiv preprint arXiv:2304.09801 (2023)","DOI":"10.1109\/ICCV51070.2023.00801"},{"key":"27_CR20","doi-asserted-by":"crossref","unstructured":"Geiger, A., Lenz, P., Stiller, C., Urtasun, R.: Vision meets robotics: the KITTI dataset. Int. J. Robot. Res. (IJRR) (2013)","DOI":"10.1177\/0278364913491297"},{"key":"27_CR21","doi-asserted-by":"crossref","unstructured":"Geiger, A., Lenz, P., Urtasun, R.: Are we ready for autonomous driving? The KITTI vision benchmark suite. In: 2012 IEEE Conference on Computer Vision and Pattern Recognition, pp. 3354\u20133361. IEEE (2012)","DOI":"10.1109\/CVPR.2012.6248074"},{"issue":"2","key":"27_CR22","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1515\/aot-2014-0001","volume":"3","author":"Y Grauer","year":"2014","unstructured":"Grauer, Y.: Active gated imaging in driver assistance system. Adv. Optical Technol. 3(2), 151\u2013160 (2014)","journal-title":"Adv. Optical Technol."},{"key":"27_CR23","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., Girshick, R.: Mask R-CNN. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2961\u20132969 (2017)","DOI":"10.1109\/ICCV.2017.322"},{"key":"27_CR24","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"27_CR25","doi-asserted-by":"crossref","unstructured":"Hu, Y., et al.: Planning-oriented autonomous driving (2023)","DOI":"10.1109\/CVPR52729.2023.01712"},{"key":"27_CR26","unstructured":"Huang, J., Huang, G., Zhu, Z., Ye, Y., Du, D.: BEVDet: high-performance multi-camera 3D object detection in bird-eye-view. arXiv preprint arXiv:2112.11790 (2021)"},{"key":"27_CR27","unstructured":"Huang, L., et al.: Leveraging vision-centric multi-modal expertise for 3D object detection. In: Advances in Neural Information Processing Systems, vol. 36 (2024)"},{"key":"27_CR28","doi-asserted-by":"publisher","unstructured":"Hwang, J.J., et al.: CramNet: camera-radar fusion with ray-constrained cross-attention for robust 3D object detection. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds) European Conference on Computer Vision, pp. 388\u2013405. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-19839-7_23","DOI":"10.1007\/978-3-031-19839-7_23"},{"key":"27_CR29","doi-asserted-by":"crossref","unstructured":"Jiao, Y., Jie, Z., Chen, S., Chen, J., Ma, L., Jiang, Y.G.: MsmdFusion: fusing lidar and camera at multiple scales with multi-depth seeds for 3D object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 21643\u201321652 (2023)","DOI":"10.1109\/CVPR52729.2023.02073"},{"key":"27_CR30","doi-asserted-by":"crossref","unstructured":"Julca-Aguilar, F., Taylor, J., Bijelic, M., Mannan, F., Tseng, E., Heide, F.: Gated3D: monocular 3D object detection from temporal illumination cues. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 2938\u20132948 (2021)","DOI":"10.1109\/ICCV48922.2021.00293"},{"key":"27_CR31","doi-asserted-by":"crossref","unstructured":"Ku, J., Harakeh, A., Waslander, S.L.: In defense of classical image processing: Fast depth completion on the CPU. In: 2018 15th Conference on Computer and Robot Vision (CRV), pp. 16\u201322. IEEE (2018)","DOI":"10.1109\/CRV.2018.00013"},{"key":"27_CR32","doi-asserted-by":"crossref","unstructured":"Kuhn, H.W.: The Hungarian method for the assignment problem. Naval Res. Logistics (NRL) 52 (1955)","DOI":"10.1002\/nav.20053"},{"key":"27_CR33","doi-asserted-by":"crossref","unstructured":"Lang, A.H., Vora, S., Caesar, H., Zhou, L., Yang, J., Beijbom, O.: PointPillars: fast encoders for object detection from point clouds. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12697\u201312705 (2019)","DOI":"10.1109\/CVPR.2019.01298"},{"key":"27_CR34","doi-asserted-by":"crossref","unstructured":"Li, J., et al.: Practical stereo matching via cascaded recurrent network with adaptive correlation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16263\u201316272 (2022)","DOI":"10.1109\/CVPR52688.2022.01578"},{"key":"27_CR35","doi-asserted-by":"crossref","unstructured":"Li, P., Chen, X., Shen, S.: Stereo R-CNN based 3D object detection for autonomous driving. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7644\u20137652 (2019)","DOI":"10.1109\/CVPR.2019.00783"},{"key":"27_CR36","unstructured":"Li, Q., Wang, Y., Wang, Y., Zhao, H.: HDMapNet: an online HD map construction and evaluation framework. CoRR abs\/2107.06307 (2021)"},{"key":"27_CR37","first-page":"18442","volume":"35","author":"Y Li","year":"2022","unstructured":"Li, Y., Chen, Y., Qi, X., Li, Z., Sun, J., Jia, J.: Unifying voxel-based representation with transformer for 3D object detection. Adv. Neural. Inf. Process. Syst. 35, 18442\u201318455 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"27_CR38","doi-asserted-by":"crossref","unstructured":"Li, Y., et al.: BEVDepth: acquisition of reliable depth for multi-view 3d object detection. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol.\u00a037, pp. 1477\u20131485 (2023)","DOI":"10.1609\/aaai.v37i2.25233"},{"key":"27_CR39","doi-asserted-by":"crossref","unstructured":"Li, Z., et al.: BEVFormer: learning bird\u2019s-eye-view representation from multi-camera images via spatiotemporal transformers (2022)","DOI":"10.1007\/978-3-031-20077-9_1"},{"key":"27_CR40","doi-asserted-by":"crossref","unstructured":"Liang, M., Yang, B., Chen, Y., Hu, R., Urtasun, R.: Multi-task multi-sensor fusion for 3D object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7345\u20137353 (2019)","DOI":"10.1109\/CVPR.2019.00752"},{"key":"27_CR41","first-page":"10421","volume":"35","author":"T Liang","year":"2022","unstructured":"Liang, T., et al.: BEVFusion: a simple and robust lidar-camera fusion framework. Adv. Neural. Inf. Process. Syst. 35, 10421\u201310434 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"27_CR42","doi-asserted-by":"crossref","unstructured":"Lin, Z., et al.: RCBEVDet: radar-camera fusion in bird\u2019s eye view for 3D object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14928\u201314937 (2024)","DOI":"10.1109\/CVPR52733.2024.01414"},{"key":"27_CR43","doi-asserted-by":"crossref","unstructured":"Liu, X., Zheng, C., Cheng, K.B., Xue, N., Qi, G.J., Wu, T.: Monocular 3D object detection with bounding box denoising in 3D by perceiver. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6436\u20136446 (2023)","DOI":"10.1109\/ICCV51070.2023.00592"},{"key":"27_CR44","doi-asserted-by":"crossref","unstructured":"Liu, Y., et al.: PETRv2: a unified framework for 3D perception from multi-camera images. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3262\u20133272 (2023)","DOI":"10.1109\/ICCV51070.2023.00302"},{"key":"27_CR45","doi-asserted-by":"crossref","unstructured":"Liu, Z., Wu, Z., T\u00f3th, R.: Smoke: Single-stage monocular 3D object detection via keypoint estimation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, pp. 996\u2013997 (2020)","DOI":"10.1109\/CVPRW50498.2020.00506"},{"key":"27_CR46","doi-asserted-by":"crossref","unstructured":"Liu, Z., et al.: BEVFusion: multi-task multi-sensor fusion with unified bird\u2019s-eye view representation. In: 2023 IEEE International Conference on Robotics and Automation (ICRA), pp. 2774\u20132781. IEEE (2023)","DOI":"10.1109\/ICRA48891.2023.10160968"},{"key":"27_CR47","doi-asserted-by":"publisher","first-page":"311","DOI":"10.1007\/978-3-030-58601-0_19","volume-title":"Computer Vision \u2013 ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XIII","author":"X Ma","year":"2020","unstructured":"Ma, X., Liu, S., Xia, Z., Zhang, H., Zeng, X., Ouyang, W.: Rethinking Pseudo-LiDAR representation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) Computer Vision \u2013 ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XIII, pp. 311\u2013327. Springer International Publishing, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58601-0_19"},{"key":"27_CR48","unstructured":"Meyer, M., Kuschk, G.: Automotive radar dataset for deep learning based 3D object detection. In: 2019 16th European Radar Conference (EuRAD), pp. 129\u2013132. IEEE (2019)"},{"key":"27_CR49","doi-asserted-by":"crossref","unstructured":"Mirza, M.J., et al.: Robustness of object detectors in degrading weather conditions. In: 2021 IEEE International Intelligent Transportation Systems Conference (ITSC), pp. 2719\u20132724. IEEE (2021)","DOI":"10.1109\/ITSC48978.2021.9564505"},{"key":"27_CR50","doi-asserted-by":"crossref","unstructured":"Nabati, R., Qi, H.: CenterFusion: center-based radar and camera fusion for 3D object detection. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 1527\u20131536 (2021)","DOI":"10.1109\/WACV48630.2021.00157"},{"key":"27_CR51","unstructured":"Paszke, A., et al.: Automatic differentiation in PyTorch. In: NIPS 2017 Workshop on Autodiff (2017). https:\/\/openreview.net\/forum?id=BJJsrmfCZ"},{"key":"27_CR52","doi-asserted-by":"crossref","unstructured":"Peng, L., Chen, Z., Fu, Z., Liang, P., Cheng, E.: BEVSegFormer: bird\u2019s eye view semantic segmentation from arbitrary camera rigs (2022)","DOI":"10.1109\/WACV56688.2023.00588"},{"key":"27_CR53","doi-asserted-by":"crossref","unstructured":"Qi, C.R., Liu, W., Wu, C., Su, H., Guibas, L.J.: Frustum PointNets for 3D object detection from RGB-D data. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 918\u2013927 (2018)","DOI":"10.1109\/CVPR.2018.00102"},{"key":"27_CR54","unstructured":"Qi, C.R., Yi, L., Su, H., Guibas, L.J.: PointNet++: deep hierarchical feature learning on point sets in a metric space. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"key":"27_CR55","doi-asserted-by":"crossref","unstructured":"Ranftl, R., Bochkovskiy, A., Koltun, V.: Vision transformers for dense prediction. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 12179\u201312188 (2021)","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"27_CR56","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster R-CNN: towards real-time object detection with region proposal networks. In: Advances in Neural Information Processing Systems, vol. 28 (2015)"},{"key":"27_CR57","doi-asserted-by":"crossref","unstructured":"Shi, S., et al.: PV-RCNN: point-voxel feature set abstraction for 3D object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10529\u201310538 (2020)","DOI":"10.1109\/CVPR42600.2020.01054"},{"key":"27_CR58","doi-asserted-by":"crossref","unstructured":"Shi, S., Wang, X., Li, H.: PointRCNN: 3D object proposal generation and detection from point cloud. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 770\u2013779 (2019)","DOI":"10.1109\/CVPR.2019.00086"},{"issue":"8","key":"27_CR59","first-page":"2647","volume":"43","author":"S Shi","year":"2020","unstructured":"Shi, S., Wang, Z., Shi, J., Wang, X., Li, H.: From points to parts: 3D object detection from point cloud with part-aware and part-aggregation network. IEEE Trans. Pattern Anal. Mach. Intell. 43(8), 2647\u20132664 (2020)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"27_CR60","doi-asserted-by":"crossref","unstructured":"Simonelli, A., Bulo, S.R., Porzi, L., L\u00f3pez-Antequera, M., Kontschieder, P.: Disentangling monocular 3D object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 1991\u20131999 (2019)","DOI":"10.1109\/ICCV.2019.00208"},{"key":"27_CR61","doi-asserted-by":"crossref","unstructured":"Sindagi, V.A., Zhou, Y., Tuzel, O.: MVX-Net: multimodal VoxelNet for 3D object detection. In: 2019 International Conference on Robotics and Automation (ICRA), pp. 7276\u20137282. IEEE (2019)","DOI":"10.1109\/ICRA.2019.8794195"},{"key":"27_CR62","unstructured":"Sun, J., Cao, Y., Chen, Q.A., Mao, Z.M.: Towards robust $$\\{$$LiDAR-based$$\\}$$ perception in autonomous driving: General black-box adversarial sensor attack and countermeasures. In: 29th USENIX Security Symposium (USENIX Security 20), pp. 877\u2013894 (2020)"},{"key":"27_CR63","doi-asserted-by":"crossref","unstructured":"Uric\u00e1r, M., et al.: Desoiling dataset: restoring soiled areas on automotive fisheye cameras. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision Workshops (2019)","DOI":"10.1109\/ICCVW.2019.00526"},{"key":"27_CR64","doi-asserted-by":"crossref","unstructured":"Vora, S., Lang, A.H., Helou, B., Beijbom, O.: PointPainting: sequential fusion for 3D object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4604\u20134612 (2020)","DOI":"10.1109\/CVPR42600.2020.00466"},{"key":"27_CR65","doi-asserted-by":"crossref","unstructured":"Walia, A., et al.: Gated2Gated: self-supervised depth estimation from gated images. In: 2022 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2801\u20132811 (2021)","DOI":"10.1109\/CVPR52688.2022.00283"},{"key":"27_CR66","doi-asserted-by":"crossref","unstructured":"Walz, S., Bijelic, M., Ramazzina, A., Walia, A., Mannan, F., Heide, F.: Gated Stereo: joint depth estimation from gated and wide-baseline active stereo cues. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13252\u201313262 (2023)","DOI":"10.1109\/CVPR52729.2023.01273"},{"key":"27_CR67","doi-asserted-by":"crossref","unstructured":"Wang, C., Ma, C., Zhu, M., Yang, X.: PointAugmenting: cross-modal augmentation for 3D object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11794\u201311803 (2021)","DOI":"10.1109\/CVPR46437.2021.01162"},{"key":"27_CR68","doi-asserted-by":"crossref","unstructured":"Wang, H., et al.: UNITR: a unified and efficient multi-modal transformer for bird\u2019s-eye-view representation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6792\u20136802 (2023)","DOI":"10.1109\/ICCV51070.2023.00625"},{"key":"27_CR69","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1007\/978-3-030-58607-2_24","volume-title":"Computer Vision \u2013 ECCV 2020","author":"J Wang","year":"2020","unstructured":"Wang, J., Lan, S., Gao, M., Davis, L.S.: InfoFocus: 3D object detection for autonomous driving with dynamic information modeling. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12355, pp. 405\u2013420. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58607-2_24"},{"key":"27_CR70","doi-asserted-by":"crossref","unstructured":"Wang, S., Caesar, H., Nan, L., Kooij, J.F.: UniBEV: multi-modal 3D object detection with uniform BEV encoders for robustness against missing sensor modalities. arXiv preprint arXiv:2309.14516 (2023)","DOI":"10.1109\/IV55156.2024.10588783"},{"key":"27_CR71","doi-asserted-by":"crossref","unstructured":"Wang, T., Zhu, X., Pang, J., Lin, D.: FCOS3D: fully convolutional one-stage monocular 3D object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 913\u2013922 (2021)","DOI":"10.1109\/ICCVW54120.2021.00107"},{"key":"27_CR72","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1007\/978-3-030-58542-6_2","volume-title":"Computer Vision \u2013 ECCV 2020","author":"Y Wang","year":"2020","unstructured":"Wang, Y., et al.: Pillar-based object detection for autonomous driving. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12367, pp. 18\u201334. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58542-6_2"},{"key":"27_CR73","unstructured":"Wang, Y., Guizilini, V.C., Zhang, T., Wang, Y., Zhao, H., Solomon, J.: DETR3D: 3D object detection from multi-view images via 3D-to-2D queries. In: Conference on Robot Learning, pp. 180\u2013191. PMLR (2022)"},{"issue":"6","key":"27_CR74","doi-asserted-by":"publisher","first-page":"2425","DOI":"10.1007\/s00371-022-02672-2","volume":"39","author":"P Wu","year":"2023","unstructured":"Wu, P., et al.: PV-RCNN++: semantical point-voxel feature interaction for 3D object detection. Vis. Comput. 39(6), 2425\u20132440 (2023)","journal-title":"Vis. Comput."},{"key":"27_CR75","doi-asserted-by":"crossref","unstructured":"Xie, Y., et al.: SparseFusion: fusing multi-modal sparse representations for multi-sensor 3D object detection (2023)","DOI":"10.1109\/ICCV51070.2023.01613"},{"key":"27_CR76","doi-asserted-by":"crossref","unstructured":"Xu, S., Zhou, D., Fang, J., Yin, J., Bin, Z., Zhang, L.: FusionPainting: multimodal fusion with adaptive attention for 3D object detection. In: 2021 IEEE International Intelligent Transportation Systems Conference (ITSC), pp. 3047\u20133054. IEEE (2021)","DOI":"10.1109\/ITSC48978.2021.9564951"},{"key":"27_CR77","doi-asserted-by":"crossref","unstructured":"Yan, J., et al.: Cross modal transformer: towards fast and robust 3D object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 18268\u201318278 (2023)","DOI":"10.1109\/ICCV51070.2023.01675"},{"issue":"10","key":"27_CR78","doi-asserted-by":"publisher","first-page":"3337","DOI":"10.3390\/s18103337","volume":"18","author":"Y Yan","year":"2018","unstructured":"Yan, Y., Mao, Y., Li, B.: SECOND: sparsely embedded convolutional detection. Sensors 18(10), 3337 (2018)","journal-title":"Sensors"},{"key":"27_CR79","doi-asserted-by":"crossref","unstructured":"Yang, B., Luo, W., Urtasun, R.: PIXOR: real-time 3D object detection from point clouds. In: Proceedings of the IEEE conference on Computer Vision and Pattern Recognition, pp. 7652\u20137660 (2018)","DOI":"10.1109\/CVPR.2018.00798"},{"key":"27_CR80","doi-asserted-by":"crossref","unstructured":"Yang, Z., Sun, Y., Liu, S., Jia, J.: 3DSSD: point-based 3D single stage object detector. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11040\u201311048 (2020)","DOI":"10.1109\/CVPR42600.2020.01105"},{"key":"27_CR81","first-page":"1992","volume":"35","author":"Z Yang","year":"2022","unstructured":"Yang, Z., Chen, J., Miao, Z., Li, W., Zhu, X., Zhang, L.: DeepInteraction: 3D object detection via modality interaction. Adv. Neural. Inf. Process. Syst. 35, 1992\u20132005 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"27_CR82","doi-asserted-by":"crossref","unstructured":"Yin, T., Zhou, X., Krahenbuhl, P.: Center-based 3D object detection and tracking. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11784\u201311793 (2021)","DOI":"10.1109\/CVPR46437.2021.01161"},{"key":"27_CR83","first-page":"16494","volume":"34","author":"T Yin","year":"2021","unstructured":"Yin, T., Zhou, X., Kr\u00e4henb\u00fchl, P.: Multimodal virtual point 3D detection. Adv. Neural. Inf. Process. Syst. 34, 16494\u201316507 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"27_CR84","doi-asserted-by":"publisher","unstructured":"Yoo, J.H., Kim, Y., Kim, J., Choi, J.W.: 3D-CVF: generating joint camera and lidar features using cross-view spatial feature fusion for 3D object detection. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XXVII 16, pp. 720\u2013736. Springer (2020). https:\/\/doi.org\/10.1007\/978-3-030-58583-9_43","DOI":"10.1007\/978-3-030-58583-9_43"},{"key":"27_CR85","doi-asserted-by":"crossref","unstructured":"Zhang, J., Singh, S.: Visual-lidar odometry and mapping: low-drift, robust, and fast. In: 2015 IEEE International Conference on Robotics and Automation (ICRA), pp. 2174\u20132181. IEEE (2015)","DOI":"10.1109\/ICRA.2015.7139486"},{"key":"27_CR86","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Tuzel, O.: VoxelNet: end-to-end learning for point cloud based 3D object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4490\u20134499 (2018)","DOI":"10.1109\/CVPR.2018.00472"},{"key":"27_CR87","unstructured":"Zhu, X., Su, W., Lu, L., Li, B., Wang, X., Dai, J.: Deformable $$\\{$$detr$$\\}$$: deformable transformers for end-to-end object detection. In: International Conference on Learning Representations (2021)"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-73030-6_27","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,25]],"date-time":"2024-11-25T17:20:26Z","timestamp":1732555226000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-73030-6_27"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,24]]},"ISBN":["9783031730290","9783031730306"],"references-count":87,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-73030-6_27","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,24]]},"assertion":[{"value":"24 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}