{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T17:47:42Z","timestamp":1777657662304,"version":"3.51.4"},"publisher-location":"Cham","reference-count":70,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031729034","type":"print"},{"value":"9783031729041","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,11,21]],"date-time":"2024-11-21T00:00:00Z","timestamp":1732147200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,21]],"date-time":"2024-11-21T00:00:00Z","timestamp":1732147200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72904-1_19","type":"book-chapter","created":{"date-parts":[[2024,11,20]],"date-time":"2024-11-20T13:28:19Z","timestamp":1732109299000},"page":"321-339","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["MeshVPR: Citywide Visual Place Recognition Using 3D Meshes"],"prefix":"10.1007","author":[{"given":"Gabriele","family":"Berton","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lorenz","family":"Junglas","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Riccardo","family":"Zaccone","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Thomas","family":"Pollok","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Barbara","family":"Caputo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Carlo","family":"Masone","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,11,21]]},"reference":[{"issue":"4","key":"19_CR1","doi-asserted-by":"publisher","first-page":"5526","DOI":"10.1109\/LRA.2020.3009075","volume":"5","author":"E Alberti","year":"2020","unstructured":"Alberti, E., Tavera, A., Masone, C., Caputo, B.: IDDA: a large-scale multi-domain dataset for autonomous driving. IEEE Robot. Autom. Lett. 5(4), 5526\u20135533 (2020)","journal-title":"IEEE Robot. Autom. Lett."},{"key":"19_CR2","doi-asserted-by":"publisher","first-page":"194","DOI":"10.1016\/j.neucom.2022.09.127","volume":"513","author":"A Ali-bey","year":"2022","unstructured":"Ali-bey, A., Chaib-draa, B., Gigu\u00e8re, P.: GSV-cities: toward appropriate supervised visual place recognition. Neurocomputing 513, 194\u2013203 (2022)","journal-title":"Neurocomputing"},{"key":"19_CR3","doi-asserted-by":"crossref","unstructured":"Ali-bey, A., Chaib-draa, B., Gigu\u00e8re, P.: MixVPR: feature mixing for visual place recognition. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 2998\u20133007 (2023)","DOI":"10.1109\/WACV56688.2023.00301"},{"key":"19_CR4","doi-asserted-by":"crossref","unstructured":"Arandjelovi\u0107, R., Zisserman, A.: Three things everyone should know to improve object retrieval. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 2911\u20132918 (2012)","DOI":"10.1109\/CVPR.2012.6248018"},{"issue":"6","key":"19_CR5","doi-asserted-by":"publisher","first-page":"1437","DOI":"10.1109\/TPAMI.2017.2711011","volume":"40","author":"R Arandjelovi\u0107","year":"2018","unstructured":"Arandjelovi\u0107, R., Gronat, P., Torii, A., Pajdla, T., Sivic, J.: NetVLAD: CNN architecture for weakly supervised place recognition. IEEE Trans. Pattern Anal. Mach. Intell. 40(6), 1437\u20131451 (2018). https:\/\/doi.org\/10.1109\/TPAMI.2017.2711011","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"19_CR6","series-title":"Advances in Computer Vision and Pattern Recognition","doi-asserted-by":"publisher","first-page":"255","DOI":"10.1007\/978-3-319-25781-5_14","volume-title":"Large-Scale Visual Geo-Localization","author":"M Aubry","year":"2016","unstructured":"Aubry, M., Russell, B., Sivic, J.: Visual geo-localization of non-photographic depictions via 2D\u20133D alignment. In: Zamir, A.R.R., Hakeem, A., Van Van Gool, L., Shah, M., Szeliski, R. (eds.) Large-Scale Visual Geo-Localization. ACVPR, pp. 255\u2013275. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-25781-5_14"},{"key":"19_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"584","DOI":"10.1007\/978-3-319-10590-1_38","volume-title":"Computer Vision \u2013 ECCV 2014","author":"A Babenko","year":"2014","unstructured":"Babenko, A., Slesarev, A., Chigorin, A., Lempitsky, V.: Neural codes for image retrieval. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8689, pp. 584\u2013599. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10590-1_38"},{"key":"19_CR8","doi-asserted-by":"publisher","unstructured":"Berton, G., Masone, C., Caputo, B.: Rethinking visual geo-localization for large-scale applications. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 4868\u20134878 (2022). https:\/\/doi.org\/10.1109\/CVPR52688.2022.00483","DOI":"10.1109\/CVPR52688.2022.00483"},{"key":"19_CR9","doi-asserted-by":"crossref","unstructured":"Berton, G., Paolicelli, V., Masone, C., Caputo, B.: Adaptive-attentive geolocalization from few queries: a hybrid approach. In: IEEE Winter Conference on Applications of Computer Vision, pp. 2918\u20132927 (2021)","DOI":"10.3389\/fcomp.2022.841817"},{"key":"19_CR10","doi-asserted-by":"crossref","unstructured":"Berton, G., Trivigno, G., Caputo, B., Masone, C.: EigenPlaces: training viewpoint robust models for visual place recognition. In: IEEE International Conference on Computer Vision, pp. 11080\u201311090 (2023)","DOI":"10.1109\/ICCV51070.2023.01017"},{"key":"19_CR11","doi-asserted-by":"publisher","unstructured":"Cakir, F., He, K., Xia, X., Kulis, B., Sclaroff, S.: Deep metric learning to rank. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 1861\u20131870 (2019). https:\/\/doi.org\/10.1109\/CVPR.2019.00196","DOI":"10.1109\/CVPR.2019.00196"},{"key":"19_CR12","doi-asserted-by":"publisher","unstructured":"Chai, X., Yang, J., Yan, X., Di, C., Ye, T.: Efficient underground tunnel place recognition algorithm based on farthest point subsampling and dual-attention transformer. Sensors 23(22) (2023). https:\/\/doi.org\/10.3390\/s23229261","DOI":"10.3390\/s23229261"},{"key":"19_CR13","doi-asserted-by":"publisher","unstructured":"Cheng, R., et al.: Hierarchical visual localization for visually impaired people using multimodal images. Expert Syst. Appl. 165, 113743 (2021). https:\/\/doi.org\/10.1016\/j.eswa.2020.113743, https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0957417420305674","DOI":"10.1016\/j.eswa.2020.113743"},{"key":"19_CR14","doi-asserted-by":"publisher","unstructured":"Deschaud, J.E., Duque, D., Richa, J.P., Velasco-Forero, S., Marcotegui, B., Goulette, F.: Paris-CARLA-3D: a real and synthetic outdoor point cloud dataset for challenging tasks in 3D mapping. Remote Sens. 13(22) (2021). https:\/\/doi.org\/10.3390\/rs13224713, https:\/\/www.mdpi.com\/2072-4292\/13\/22\/4713","DOI":"10.3390\/rs13224713"},{"key":"19_CR15","unstructured":"Dosovitskiy, A., Ros, G., Codevilla, F., Lopez, A., Koltun, V.: CARLA: an open urban driving simulator. In: Proceedings of the 1st Annual Conference on Robot Learning, pp. 1\u201316 (2017)"},{"key":"19_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"369","DOI":"10.1007\/978-3-030-58548-8_22","volume-title":"Computer Vision \u2013 ECCV 2020","author":"Y Ge","year":"2020","unstructured":"Ge, Y., Wang, H., Zhu, F., Zhao, R., Li, H.: Self-supervising fine-grained region similarities for large-scale image localization. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12349, pp. 369\u2013386. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58548-8_22"},{"issue":"2","key":"19_CR17","doi-asserted-by":"publisher","first-page":"1924","DOI":"10.1109\/LRA.2019.2898427","volume":"4","author":"S Hausler","year":"2019","unstructured":"Hausler, S., Jacobson, A., Milford, M.: Multi-process fusion: visual place recognition using multiple image processing methods. IEEE Robot. Autom. Lett. 4(2), 1924\u20131931 (2019)","journal-title":"IEEE Robot. Autom. Lett."},{"key":"19_CR18","doi-asserted-by":"crossref","unstructured":"Irschara, A., Zach, C., Frahm, J.M., Bischof, H.: From structure-from-motion point clouds to fast location recognition. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 2599\u20132606. IEEE (2009)","DOI":"10.1109\/CVPR.2009.5206587"},{"key":"19_CR19","doi-asserted-by":"crossref","unstructured":"Izquierdo, S., Civera, J.: Optimal transport aggregation for visual place recognition. In: IEEE Conference on Computer Vision and Pattern Recognition (2024)","DOI":"10.1109\/CVPR52733.2024.01672"},{"key":"19_CR20","unstructured":"Khosla, P., et al.: Supervised contrastive learning. In: Larochelle, H., Ranzato, M., Hadsell, R., Balcan, M., Lin, H. (eds.) Conference on Neural Information Processing Systems (2020). https:\/\/proceedings.neurips.cc\/paper\/2020\/hash\/d89a66c7c80a29b1bdbab0f2a1a94af8-Abstract.html"},{"key":"19_CR21","doi-asserted-by":"crossref","unstructured":"Kim, H.J., Dunn, E., Frahm, J.M.: Learned contextual feature reweighting for image geo-localization. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 3251\u20133260 (2017)","DOI":"10.1109\/CVPR.2017.346"},{"key":"19_CR22","unstructured":"Kingma, D., Ba, J.: Adam: A method for stochastic optimization. In: International Conference on Learning Representations (2015)"},{"issue":"4","key":"19_CR23","doi-asserted-by":"publisher","first-page":"788","DOI":"10.1080\/13658816.2022.2140808","volume":"37","author":"B Lei","year":"2023","unstructured":"Lei, B., Stouffs, R., Biljecki, F.: Assessing and benchmarking 3D city models. Int. J. Geogr. Inf. Sci. 37(4), 788\u2013809 (2023). https:\/\/doi.org\/10.1080\/13658816.2022.2140808","journal-title":"Int. J. Geogr. Inf. Sci."},{"key":"19_CR24","doi-asserted-by":"crossref","unstructured":"Li, Y., et al.: MatrixCity: a large-scale city dataset for city-scale neural rendering and beyond. In: IEEE International Conference on Computer Vision, pp. 3205\u20133215 (2023)","DOI":"10.1109\/ICCV51070.2023.00297"},{"key":"19_CR25","doi-asserted-by":"crossref","unstructured":"Lin, C.H., et al.: InfiniCity: infinite-scale city synthesis. In: IEEE International Conference on Computer Vision, pp. 22808\u201322818 (2023)","DOI":"10.1109\/ICCV51070.2023.02085"},{"key":"19_CR26","doi-asserted-by":"publisher","unstructured":"Liu, L., Li, H., Dai, Y.: Stochastic attraction-repulsion embedding for large scale image localization. In: IEEE International Conference on Computer Vision, pp. 2570\u20132579 (2019). https:\/\/doi.org\/10.1109\/ICCV.2019.00266","DOI":"10.1109\/ICCV.2019.00266"},{"key":"19_CR27","doi-asserted-by":"crossref","unstructured":"Lowe, D.G.: Distinctive image features from scale-invariant keypoints. Int. J. Comput. Vision 60(2), 91\u2013110 (2004). http:\/\/dx.doi.org\/10.1023\/B:VISI.0000029664.99615.94","DOI":"10.1023\/B:VISI.0000029664.99615.94"},{"issue":"1","key":"19_CR28","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1177\/0278364916679498","volume":"36","author":"W Maddern","year":"2017","unstructured":"Maddern, W., Pascoe, G., Linegar, C., Newman, P.: 1 Year, 1000km: the Oxford RobotCar dataset. Int. J. Robot. Res. 36(1), 3\u201315 (2017). https:\/\/doi.org\/10.1177\/0278364916679498","journal-title":"Int. J. Robot. Res."},{"key":"19_CR29","doi-asserted-by":"publisher","first-page":"19516","DOI":"10.1109\/ACCESS.2021.3054937","volume":"9","author":"C Masone","year":"2021","unstructured":"Masone, C., Caputo, B.: A survey on deep visual place recognition. IEEE Access 9, 19516\u201319547 (2021). https:\/\/doi.org\/10.1109\/ACCESS.2021.3054937","journal-title":"IEEE Access"},{"issue":"4","key":"19_CR30","doi-asserted-by":"publisher","first-page":"10383","DOI":"10.1109\/LRA.2022.3194310","volume":"7","author":"R Mereu","year":"2022","unstructured":"Mereu, R., Trivigno, G., Berton, G., Masone, C., Caputo, B.: Learning sequential descriptors for sequence-based visual place recognition. IEEE Robot. Autom. Lett. 7(4), 10383\u201310390 (2022). https:\/\/doi.org\/10.1109\/LRA.2022.3194310","journal-title":"IEEE Robot. Autom. Lett."},{"key":"19_CR31","doi-asserted-by":"publisher","first-page":"1038","DOI":"10.1109\/TRO.2008.2004520","volume":"24","author":"M Milford","year":"2008","unstructured":"Milford, M., Wyeth, G.: Mapping a suburb with a single camera using a biologically inspired slam system. IEEE Trans. Rob. 24, 1038\u20131053 (2008)","journal-title":"IEEE Trans. Rob."},{"key":"19_CR32","doi-asserted-by":"crossref","unstructured":"Moreau, A., Piasco, N., Bennehar, M., Tsishkou, D.V., Stanciulescu, B., de\u00a0La\u00a0Fortelle, A.: CROSSFIRE: camera relocalization on self-supervised features from an implicit representation. 2023 IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 252\u2013262 (2023). https:\/\/api.semanticscholar.org\/CorpusID:257427144","DOI":"10.1109\/ICCV51070.2023.00030"},{"key":"19_CR33","unstructured":"Moreau, A., Piasco, N., Tsishkou, D.V., Stanciulescu, B., de\u00a0La\u00a0Fortelle, A.: LENS: localization enhanced by nerf synthesis. In: Conference on Robot Learning (2021). https:\/\/api.semanticscholar.org\/CorpusID:238744321"},{"key":"19_CR34","doi-asserted-by":"crossref","unstructured":"Neubert, P., Schubert, S.: Hyperdimensional computing as a framework for systematic aggregation of image descriptors. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 16938\u201316947 (2021)","DOI":"10.1109\/CVPR46437.2021.01666"},{"key":"19_CR35","unstructured":"van\u00a0den Oord, A., Li, Y., Vinyals, O.: Representation learning with contrastive predictive coding. CoRR abs\/1807.03748 (2018). http:\/\/arxiv.org\/abs\/1807.03748"},{"key":"19_CR36","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"589","DOI":"10.1007\/978-3-031-20047-2_34","volume-title":"Computer Vision \u2013 ECCV 2022","author":"V Panek","year":"2022","unstructured":"Panek, V., Kukelova, Z., Sattler, T.: MeshLoc: mesh-based visual localization. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022. LNCS, vol. 13682, pp. 589\u2013609. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-20047-2_34"},{"key":"19_CR37","doi-asserted-by":"crossref","unstructured":"Panek, V., Kukelova, Z., Sattler, T.: Visual localization using imperfect 3D models from the internet. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 13175\u201313186 (2023)","DOI":"10.1109\/CVPR52729.2023.01266"},{"key":"19_CR38","doi-asserted-by":"crossref","unstructured":"Peng, G., Zhang, J., Li, H., Wang, D.: Attentional pyramid pooling of salient visual residuals for place recognition. In: IEEE International Conference on Computer Vision, pp. 885\u2013894 (2021)","DOI":"10.1109\/ICCV48922.2021.00092"},{"key":"19_CR39","doi-asserted-by":"publisher","unstructured":"Philbin, J., Chum, O., Isard, M., Sivic, J., Zisserman, A.: Object retrieval with large vocabularies and fast spatial matching. In: IEEE Conference on Computer Vision and Pattern Recognition, pp.\u00a01\u20138 (2007). https:\/\/doi.org\/10.1109\/CVPR.2007.383172","DOI":"10.1109\/CVPR.2007.383172"},{"key":"19_CR40","doi-asserted-by":"publisher","unstructured":"Philbin, J., Chum, O., Isard, M., Sivic, J., Zisserman, A.: Lost in quantization: improving particular object retrieval in large scale image databases. In: IEEE Conference on Computer Vision and Pattern Recognition, pp.\u00a01\u20138 (2008). https:\/\/doi.org\/10.1109\/CVPR.2008.4587635","DOI":"10.1109\/CVPR.2008.4587635"},{"key":"19_CR41","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"670","DOI":"10.1007\/978-3-030-33720-9_52","volume-title":"Advances in Visual Computing","author":"T Pollok","year":"2019","unstructured":"Pollok, T., Junglas, L., Ruf, B., Schumann, A.: UnrealGT: using unreal engine to generate ground truth datasets. In: Bebis, G., et al. (eds.) ISVC 2019. LNCS, vol. 11844, pp. 670\u2013682. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-33720-9_52"},{"key":"19_CR42","doi-asserted-by":"publisher","unstructured":"Qiu, W., et al.: UnrealCV: virtual worlds for computer vision. In: ACM MM, pp. 1221\u20131224. ACM (2017). https:\/\/doi.org\/10.1145\/3123266.3129396, https:\/\/dl.acm.org\/doi\/10.1145\/3123266.3129396","DOI":"10.1145\/3123266.3129396"},{"issue":"7","key":"19_CR43","doi-asserted-by":"publisher","first-page":"1655","DOI":"10.1109\/TPAMI.2018.2846566","volume":"41","author":"F Radenovi\u0107","year":"2019","unstructured":"Radenovi\u0107, F., Tolias, G., Chum, O.: Fine-tuning CNN image retrieval with no human annotation. IEEE Trans. Pattern Anal. Mach. Intell. 41(7), 1655\u20131668 (2019). https:\/\/doi.org\/10.1109\/TPAMI.2018.2846566","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"3","key":"19_CR44","doi-asserted-by":"publisher","first-page":"251","DOI":"10.3169\/mta.4.251","volume":"4","author":"AS Razavian","year":"2016","unstructured":"Razavian, A.S., Sullivan, J., Carlsson, S., Maki, A.: Visual instance retrieval with deep convolutional networks. ITE Trans. Media Technol. Appl. 4(3), 251\u2013258 (2016). https:\/\/doi.org\/10.3169\/mta.4.251","journal-title":"ITE Trans. Media Technol. Appl."},{"key":"19_CR45","doi-asserted-by":"publisher","unstructured":"Sallam\u00a0Fatouh, W., Farouk\u00a0Ali, H., Abd Elrazek\u00a0Mashali, S., Shouki\u00a0Seliem, A.: Image-based localization for augmented reality application: a review. In: Proceedings of the 2021 5th International Conference on Virtual and Augmented Reality Simulations, ICVARS 2021, pp. 7\u201316. Association for Computing Machinery, New York (2021). https:\/\/doi.org\/10.1145\/3463914.3463916","DOI":"10.1145\/3463914.3463916"},{"key":"19_CR46","doi-asserted-by":"crossref","unstructured":"Sarlin, P.E., Cadena, C., Siegwart, R., Dymczyk, M.: From coarse to fine: robust hierarchical localization at large scale. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 12716\u201312725 (2019)","DOI":"10.1109\/CVPR.2019.01300"},{"key":"19_CR47","unstructured":"Sarlin, P.E., Debraine, F., Dymczyk, M., Siegwart, R., Cadena, C.: Leveraging deep visual descriptors for hierarchical efficient localization. In: Conference on Robot Learning, pp. 456\u2013465. Proceeding of Machine Learning Research (2018)"},{"key":"19_CR48","doi-asserted-by":"crossref","unstructured":"Sarlin, P.E., DeTone, D., Malisiewicz, T., Rabinovich, A.: SuperGlue: learning feature matching with graph neural networks. In: IEEE Conference on Computer Vision and Pattern Recognition (2020). https:\/\/arxiv.org\/abs\/1911.11763","DOI":"10.1109\/CVPR42600.2020.00499"},{"key":"19_CR49","doi-asserted-by":"crossref","unstructured":"Sattler, T., Weyand, T., Leibe, B., Kobbelt, L.: Image retrieval for image-based localization revisited. In: British Machine Vision Conference, vol.\u00a01, p.\u00a04 (2012)","DOI":"10.5244\/C.26.76"},{"key":"19_CR50","doi-asserted-by":"publisher","unstructured":"Schubert, S., Neubert, P., Garg, S., Milford, M., Fischer, T.: Visual place recognition: a tutorial. IEEE Robot. Autom. Mag. 2\u201316 (2023). https:\/\/doi.org\/10.1109\/MRA.2023.3310859","DOI":"10.1109\/MRA.2023.3310859"},{"key":"19_CR51","series-title":"Springer Proceedings in Advanced Robotics","doi-asserted-by":"publisher","first-page":"621","DOI":"10.1007\/978-3-319-67361-5_40","volume-title":"Field and Service Robotics","author":"S Shah","year":"2018","unstructured":"Shah, S., Dey, D., Lovett, C., Kapoor, A.: AirSim: high-fidelity visual and physical simulation for autonomous vehicles. In: Hutter, M., Siegwart, R. (eds.) Field and Service Robotics. SPAR, vol. 5, pp. 621\u2013635. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-319-67361-5_40"},{"key":"19_CR52","doi-asserted-by":"publisher","unstructured":"Shan, Q., Wu, C., Curless, B., Furukawa, Y., Hernandez, C., Seitz, S.M.: Accurate geo-registration by ground-to-aerial image matching. In: International Conference on 3D Vision (3DV), vol.\u00a01, pp. 525\u2013532 (2014). https:\/\/doi.org\/10.1109\/3DV.2014.69","DOI":"10.1109\/3DV.2014.69"},{"key":"19_CR53","doi-asserted-by":"publisher","unstructured":"Sibbing, D., Sattler, T., Leibe, B., Kobbelt, L.: Sift-realistic rendering. In: International Conference on 3D Vision (3DV), pp. 56\u201363 (2013). https:\/\/doi.org\/10.1109\/3DV.2013.16","DOI":"10.1109\/3DV.2013.16"},{"key":"19_CR54","doi-asserted-by":"publisher","unstructured":"Song, H.O., Xiang, Y., Jegelka, S., Savarese, S.: Deep metric learning via lifted structured feature embedding. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 4004\u20134012 (2016). https:\/\/doi.org\/10.1109\/CVPR.2016.434","DOI":"10.1109\/CVPR.2016.434"},{"key":"19_CR55","doi-asserted-by":"crossref","unstructured":"Sun, Y., et al.: Circle loss: a unified perspective of pair similarity optimization. In: IEEE Conference on Computer Vision and Pattern Recognition pp. 6397\u20136406 (2020). https:\/\/api.semanticscholar.org\/CorpusID:211296865","DOI":"10.1109\/CVPR42600.2020.00643"},{"key":"19_CR56","doi-asserted-by":"crossref","unstructured":"Suomela, L., Kalliola, J., Edelman, H., K\u00e4m\u00e4r\u00e4inen, J.K.: Placenav: Topological navigation through place recognition. In: IEEE International Conference on Robotics and Automation (2024)","DOI":"10.1109\/ICRA57147.2024.10610575"},{"key":"19_CR57","doi-asserted-by":"crossref","unstructured":"Taira, H., et al.: InLoc: indoor visual localization with dense matching and view synthesis. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 7199\u20137209 (2018)","DOI":"10.1109\/CVPR.2018.00752"},{"key":"19_CR58","doi-asserted-by":"crossref","unstructured":"Taira, H., et al.: Is this the right place? Geometric-semantic pose verification for indoor visual localization. In: IEEE International Conference on Computer Vision, pp. 4373\u20134383 (2019)","DOI":"10.1109\/ICCV.2019.00447"},{"key":"19_CR59","unstructured":"Tolias, G., Sicre, R., J\u00e9gou, H.: Particular object retrieval with integral max-pooling of CNN activations. In: International Conference on Learning Representations, pp. 1\u201312. International Conference on Learning Representations, San Juan Rico (2016). https:\/\/inria.hal.science\/hal-01842218"},{"issue":"2","key":"19_CR60","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1109\/TPAMI.2017.2667665","volume":"40","author":"A Torii","year":"2018","unstructured":"Torii, A., Arandjelovi\u0107, R., Sivic, J., Okutomi, M., Pajdla, T.: 24\/7 place recognition by view synthesis. IEEE Trans. Pattern Anal. Mach. Intell. 40(2), 257\u2013271 (2018)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"19_CR61","doi-asserted-by":"publisher","first-page":"814","DOI":"10.1109\/TPAMI.2019.2941876","volume":"43","author":"A Torii","year":"2021","unstructured":"Torii, A., et al.: Are large-scale 3D models really necessary for accurate visual localization? IEEE Trans. Pattern Anal. Mach. Intell. 43, 814\u2013829 (2021)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"3","key":"19_CR62","doi-asserted-by":"publisher","first-page":"814","DOI":"10.1109\/TPAMI.2019.2941876","volume":"43","author":"A Torii","year":"2019","unstructured":"Torii, A., et al.: Are large-scale 3D models really necessary for accurate visual localization? IEEE Trans. Pattern Anal. Mach. Intell. 43(3), 814\u2013829 (2019)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"19_CR63","doi-asserted-by":"crossref","unstructured":"Trivigno, G., Berton, G., Aragon, J., Caputo, B., Masone, C.: Divide &classify: fine-grained classification for city-wide visual geo-localization. In: IEEE International Conference on Computer Vision, pp. 11142\u201311152 (2023)","DOI":"10.1109\/ICCV51070.2023.01023"},{"issue":"4","key":"19_CR64","doi-asserted-by":"publisher","first-page":"9207","DOI":"10.1109\/LRA.2022.3187491","volume":"7","author":"A Vallone","year":"2022","unstructured":"Vallone, A., Warburg, F., Hansen, H., Hauberg, S., Civera, J.: Danish airs and grounds: a dataset for aerial-to-street-level place recognition and localization. IEEE Robot. Autom. Lett. 7(4), 9207\u20139214 (2022). https:\/\/doi.org\/10.1109\/LRA.2022.3187491","journal-title":"IEEE Robot. Autom. Lett."},{"key":"19_CR65","doi-asserted-by":"crossref","unstructured":"Wang, X., Han, X., Huang, W., Dong, D., Scott, M.R.: Multi-similarity loss with general pair weighting for deep metric learning. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 5022\u20135030 (2019)","DOI":"10.1109\/CVPR.2019.00516"},{"key":"19_CR66","doi-asserted-by":"publisher","unstructured":"Warburg, F., Hauberg, S., L\u00f3pez-Antequera, M., Gargallo, P., Kuang, Y., Civera, J.: Mapillary street-level sequences: a dataset for lifelong place recognition. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 2623\u20132632 (2020). https:\/\/doi.org\/10.1109\/CVPR42600.2020.00270","DOI":"10.1109\/CVPR42600.2020.00270"},{"key":"19_CR67","unstructured":"Zeng, F., Jacobson, A., Smith, D.W., Boswell, N., Peynot, T., Milford, M.: Enhancing underground visual place recognition with Shannon entropy saliency. In: IEEE International Conference on Robotics and Automation (2017). https:\/\/api.semanticscholar.org\/CorpusID:196111988"},{"key":"19_CR68","doi-asserted-by":"publisher","unstructured":"Zhang, J., Cao, Y., Wu, Q.: Vector of locally and adaptively aggregated descriptors for image feature representation. Pattern Recogn. 116, 107952 (2021). https:\/\/doi.org\/10.1016\/j.patcog.2021.107952, https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0031320321001394","DOI":"10.1016\/j.patcog.2021.107952"},{"key":"19_CR69","doi-asserted-by":"publisher","first-page":"821","DOI":"10.1007\/s11263-020-01399-8","volume":"129","author":"Z Zhang","year":"2021","unstructured":"Zhang, Z., Sattler, T., Scaramuzza, D.: Reference pose generation for long-term visual localization via learned features and view synthesis. Int. J. Comput. Vision 129, 821\u2013844 (2021)","journal-title":"Int. J. Comput. Vision"},{"key":"19_CR70","doi-asserted-by":"crossref","unstructured":"Zhu, S., Yang, L., Chen, C., Shah, M., Shen, X., Wang, H.: R2Former: unified retrieval and reranking transformer for place recognition. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 19370\u201319380 (2023)","DOI":"10.1109\/CVPR52729.2023.01856"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72904-1_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,15]],"date-time":"2025-03-15T19:51:30Z","timestamp":1742068290000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72904-1_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,21]]},"ISBN":["9783031729034","9783031729041"],"references-count":70,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72904-1_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,21]]},"assertion":[{"value":"21 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}