{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T21:31:45Z","timestamp":1778275905638,"version":"3.51.4"},"publisher-location":"Cham","reference-count":42,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031726545","type":"print"},{"value":"9783031726552","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,12,6]],"date-time":"2024-12-06T00:00:00Z","timestamp":1733443200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,12,6]],"date-time":"2024-12-06T00:00:00Z","timestamp":1733443200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72655-2_12","type":"book-chapter","created":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T10:12:24Z","timestamp":1733393544000},"page":"203-220","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":25,"title":["Stream Query Denoising for\u00a0Vectorized HD-Map Construction"],"prefix":"10.1007","author":[{"given":"Shuo","family":"Wang","sequence":"first","affiliation":[]},{"given":"Fan","family":"Jia","sequence":"additional","affiliation":[]},{"given":"Weixin","family":"Mao","sequence":"additional","affiliation":[]},{"given":"Yingfei","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Yucheng","family":"Zhao","sequence":"additional","affiliation":[]},{"given":"Zehui","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Tiancai","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Chi","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Xiangyu","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Feng","family":"Zhao","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,12,6]]},"reference":[{"key":"12_CR1","doi-asserted-by":"crossref","unstructured":"Antonello, M., Carraro, M., Pierobon, M., Menegatti, E.: Fast and robust detection of fallen people from a mobile robot. In: 2017 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 4159\u20134166. IEEE (2017)","DOI":"10.1109\/IROS.2017.8206276"},{"key":"12_CR2","doi-asserted-by":"crossref","unstructured":"Bekir, E.: Introduction to Modern Navigation Systems. World Scientific (2007)","DOI":"10.1142\/9789812708755"},{"key":"12_CR3","doi-asserted-by":"crossref","unstructured":"Caesar, H., et al.: nuScenes: a multimodal dataset for autonomous driving. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11621\u201311631 (2020)","DOI":"10.1109\/CVPR42600.2020.01164"},{"key":"12_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"213","DOI":"10.1007\/978-3-030-58452-8_13","volume-title":"Computer Vision \u2013 ECCV 2020","author":"N Carion","year":"2020","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12346, pp. 213\u2013229. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_13"},{"key":"12_CR5","doi-asserted-by":"crossref","unstructured":"Chang, J., Wang, S., Xu, H.M., Chen, Z., Yang, C., Zhao, F.: DETRDistill: a universal knowledge distillation framework for DETR-families. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6898\u20136908 (2023)","DOI":"10.1109\/ICCV51070.2023.00635"},{"key":"12_CR6","doi-asserted-by":"crossref","unstructured":"Chen, Z., Li, Z., Wang, S., Fu, D., Zhao, F.: Learning from noisy data for semi-supervised 3d object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6929\u20136939 (2023)","DOI":"10.1109\/ICCV51070.2023.00638"},{"key":"12_CR7","unstructured":"Chung, J., Gulcehre, C., Cho, K., Bengio, Y.: Empirical evaluation of gated recurrent neural networks on sequence modeling. arXiv preprint arXiv:1412.3555 (2014)"},{"key":"12_CR8","doi-asserted-by":"crossref","unstructured":"Ding, W., Qiao, L., Qiu, X., Zhang, C.: PivotNet: vectorized pivot learning for end-to-end HD map construction. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3672\u20133682 (2023)","DOI":"10.1109\/ICCV51070.2023.00340"},{"key":"12_CR9","doi-asserted-by":"crossref","unstructured":"Fu, T., Wang, X., Yu, H., Niu, K., Li, B., Xue, X.: Denoising-MOT: towards multiple object tracking with severe occlusions. In: Proceedings of the 31st ACM International Conference on Multimedia, pp. 2734\u20132743 (2023)","DOI":"10.1145\/3581783.3611728"},{"key":"12_CR10","doi-asserted-by":"crossref","unstructured":"Han, C., et al.: Exploring recurrent long-term temporal fusion for multi-view 3D perception. arXiv preprint arXiv:2303.05970 (2023)","DOI":"10.1109\/LRA.2024.3401172"},{"issue":"2","key":"12_CR11","first-page":"943","volume":"3","author":"AM Hasan","year":"2009","unstructured":"Hasan, A.M., Samsudin, K., Ramli, A.R., Azmir, R., Ismaeel, S.: A review of navigation systems (integration and algorithms). Aust. J. Basic Appl. Sci. 3(2), 943\u2013959 (2009)","journal-title":"Aust. J. Basic Appl. Sci."},{"key":"12_CR12","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"12_CR13","unstructured":"Huang, J., Huang, G.: BEVDet4D: exploit temporal cues in multi-camera 3D object detection. arXiv preprint arXiv:2203.17054 (2022)"},{"key":"12_CR14","doi-asserted-by":"crossref","unstructured":"Lee, Y., Hwang, J.w., Lee, S., Bae, Y., Park, J.: An energy and GPU-computation efficient backbone network for real-time object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops (2019)","DOI":"10.1109\/CVPRW.2019.00103"},{"key":"12_CR15","doi-asserted-by":"crossref","unstructured":"Li, F., Zhang, H., Liu, S., Guo, J., Ni, L.M., Zhang, L.: DN-DETR: accelerate DETR training by introducing query denoising. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13619\u201313627 (2022)","DOI":"10.1109\/CVPR52688.2022.01325"},{"key":"12_CR16","doi-asserted-by":"crossref","unstructured":"Li, F., et al.: Mask DINO: towards a unified transformer-based framework for object detection and segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3041\u20133050 (2023)","DOI":"10.1109\/CVPR52729.2023.00297"},{"key":"12_CR17","doi-asserted-by":"crossref","unstructured":"Li, Q., Wang, Y., Wang, Y., Zhao, H.: HDMapNet: an online HD map construction and evaluation framework. In: 2022 International Conference on Robotics and Automation (ICRA), pp. 4628\u20134634. IEEE (2022)","DOI":"10.1109\/ICRA46639.2022.9812383"},{"key":"12_CR18","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-3-031-20077-9_1","volume-title":"Computer Vision \u2013 ECCV 2022","author":"Z Li","year":"2022","unstructured":"Li, Z., et al.: BEVFormer: learning bird\u2019s-eye-view representation from multi-camera images via spatiotemporal transformers. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022. LNCS, vol. 13669, pp. 1\u201318. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-20077-9_1"},{"key":"12_CR19","unstructured":"Liao, B., et al.: MapTR: structured modeling and learning for online vectorized HD map construction. arXiv preprint arXiv:2208.14437 (2022)"},{"key":"12_CR20","unstructured":"Lin, X., Lin, T., Pei, Z., Huang, L., Su, Z.: Sparse4D v2: recurrent temporal fusion with sparse model. arXiv preprint arXiv:2305.14018 (2023)"},{"key":"12_CR21","unstructured":"Liu, S., et al.: DAB-DETR: dynamic anchor boxes are better queries for DETR. arXiv preprint arXiv:2201.12329 (2022)"},{"key":"12_CR22","unstructured":"Liu, Y., Yuan, T., Wang, Y., Wang, Y., Zhao, H.: VectorMapNet: end-to-end vectorized HD map learning. In: International Conference on Machine Learning, pp. 22352\u201322369. PMLR (2023)"},{"key":"12_CR23","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"531","DOI":"10.1007\/978-3-031-19812-0_31","volume-title":"Computer Vision \u2013 ECCV 2022","author":"Y Liu","year":"2022","unstructured":"Liu, Y., Wang, T., Zhang, X., Sun, J.: PETR: position embedding transformation for multi-view 3D object detection. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022. LNCS, vol. 13687, pp. 531\u2013548. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19812-0_31"},{"key":"12_CR24","doi-asserted-by":"crossref","unstructured":"Liu, Y., et al.: PETRv2: a unified framework for 3D perception from multi-camera images. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3262\u20133272 (2023)","DOI":"10.1109\/ICCV51070.2023.00302"},{"key":"12_CR25","unstructured":"Loshchilov, I., Hutter, F.: Fixing weight decay regularization in Adam (2018)"},{"key":"12_CR26","doi-asserted-by":"crossref","unstructured":"Park, D., Ambrus, R., Guizilini, V., Li, J., Gaidon, A.: Is pseudo-lidar needed for monocular 3D object detection? In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3142\u20133152 (2021)","DOI":"10.1109\/ICCV48922.2021.00313"},{"key":"12_CR27","doi-asserted-by":"crossref","unstructured":"Peng, L., Chen, Z., Fu, Z., Liang, P., Cheng, E.: BEVSegFormer: bird\u2019s eye view semantic segmentation from arbitrary camera rigs. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 5935\u20135943 (2023)","DOI":"10.1109\/WACV56688.2023.00588"},{"key":"12_CR28","doi-asserted-by":"crossref","unstructured":"Qiao, L., Ding, W., Qiu, X., Zhang, C.: End-to-end vectorized HD-map construction with piecewise Bezier curve. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13218\u201313228 (2023)","DOI":"10.1109\/CVPR52729.2023.01270"},{"key":"12_CR29","doi-asserted-by":"crossref","unstructured":"Qin, Z., Chen, J., Chen, C., Chen, X., Li, X.: UniFusion: unified multi-view fusion transformer for spatial-temporal representation in bird\u2019s-eye-view. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 8690\u20138699 (2023)","DOI":"10.1109\/ICCV51070.2023.00798"},{"key":"12_CR30","doi-asserted-by":"crossref","unstructured":"Shan, T., Englot, B.: LeGO-LOAM: lightweight and ground-optimized lidar odometry and mapping on variable terrain. In: 2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 4758\u20134765. IEEE (2018)","DOI":"10.1109\/IROS.2018.8594299"},{"key":"12_CR31","doi-asserted-by":"crossref","unstructured":"Wang, S., Liu, Y., Wang, T., Li, Y., Zhang, X.: Exploring object-centric temporal modeling for efficient multi-view 3D object detection. arXiv preprint arXiv:2303.11926 (2023)","DOI":"10.1109\/ICCV51070.2023.00335"},{"key":"12_CR32","doi-asserted-by":"crossref","unstructured":"Wang, S., et al.: Towards domain generalization for multi-view 3D object detection in bird-eye-view. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13333\u201313342 (2023)","DOI":"10.1109\/CVPR52729.2023.01281"},{"key":"12_CR33","doi-asserted-by":"crossref","unstructured":"Wang, Y., et al.: Multi-modal 3D object detection in autonomous driving: a survey. Int. J. Comput. Vision 1\u201331 (2023)","DOI":"10.2139\/ssrn.4398254"},{"key":"12_CR34","unstructured":"Wilson, B., et\u00a0al.: Argoverse 2: next generation datasets for self-driving perception and forecasting. arXiv preprint arXiv:2301.00493 (2023)"},{"key":"12_CR35","unstructured":"Wu, D., et al.: The 1st-place solution for CVPR 2023 OpenLane topology in autonomous driving challenge. arXiv preprint arXiv:2306.09590 (2023)"},{"key":"12_CR36","doi-asserted-by":"crossref","unstructured":"Yang, C., et\u00a0al.: BEVFormer v2: adapting modern image backbones to bird\u2019s-eye-view recognition via perspective supervision. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 17830\u201317839 (2023)","DOI":"10.1109\/CVPR52729.2023.01710"},{"key":"12_CR37","doi-asserted-by":"crossref","unstructured":"Yuan, T., Liu, Y., Wang, Y., Wang, Y., Zhao, H.: StreamMapNet: streaming mapping network for vectorized online HD map construction. arXiv preprint arXiv:2308.12570 (2023)","DOI":"10.1109\/WACV57701.2024.00719"},{"key":"12_CR38","doi-asserted-by":"publisher","first-page":"58443","DOI":"10.1109\/ACCESS.2020.2983149","volume":"8","author":"E Yurtsever","year":"2020","unstructured":"Yurtsever, E., Lambert, J., Carballo, A., Takeda, K.: A survey of autonomous driving: Common practices and emerging technologies. IEEE Access 8, 58443\u201358469 (2020)","journal-title":"IEEE Access"},{"key":"12_CR39","unstructured":"Zhang, H., et al.: DINO: DETR with improved denoising anchor boxes for end-to-end object detection. arXiv preprint arXiv:2203.03605 (2022)"},{"key":"12_CR40","doi-asserted-by":"crossref","unstructured":"Zhang, J., Singh, S.: LOAM: Lidar odometry and mapping in real-time. In: Robotics: Science and systems, Berkeley, CA, vol.\u00a02, pp.\u00a01\u20139 (2014)","DOI":"10.15607\/RSS.2014.X.007"},{"key":"12_CR41","unstructured":"Zhang, Y., et al.: BEVerse: unified perception and prediction in birds-eye-view for vision-centric autonomous driving. arXiv preprint arXiv:2205.09743 (2022)"},{"key":"12_CR42","unstructured":"Zhu, X., Su, W., Lu, L., Li, B., Wang, X., Dai, J.: Deformable DETR: deformable transformers for end-to-end object detection. arXiv preprint arXiv:2010.04159 (2020)"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72655-2_12","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T11:30:31Z","timestamp":1733398231000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72655-2_12"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,6]]},"ISBN":["9783031726545","9783031726552"],"references-count":42,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72655-2_12","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12,6]]},"assertion":[{"value":"6 December 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}