{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,18]],"date-time":"2026-03-18T09:02:39Z","timestamp":1773824559453,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":80,"publisher":"ACM","funder":[{"name":"Chantier Scientifique Notre-Dame de Paris &#x5c;&#x2f; Minist&#xc3a8;re de la Culture &#x5c;&#x2f; CNRS &#x5c;&#x2f; EPRNDP, France","award":[""],"award-info":[{"award-number":[""]}]},{"name":"CNRS MITI and the French Ministry of Culture within the framework of the national scientific action Notre-Dame de Paris","award":[""],"award-info":[{"award-number":[""]}]},{"name":"European Research Council &#x28;ERC&#x29; Advanced Grant nDame&#x5c;&#x5c;_Heritage&#x3a; n-Dimensional analysis and memorization ecosystem for building cathedrals of knowledge in Heritage Science","award":["ID&#x3a;101055423"],"award-info":[{"award-number":["ID&#x3a;101055423"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,10,27]]},"DOI":"10.1145\/3746273.3760200","type":"proceedings-article","created":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T14:53:01Z","timestamp":1761403981000},"page":"31-40","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Composed Image Retrieval For Visual Localization: Evaluation For Architectural Contents"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5015-6068","authenticated-orcid":false,"given":"Emile","family":"Blettery","sequence":"first","affiliation":[{"name":"UPR CNRS 2002 MAP ; LASTIG, Univ. Gustave Eiffel, IGN-ENSG, Marseille &amp; Champs-sur-Marne, France"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3666-5146","authenticated-orcid":false,"given":"Valerie","family":"Gouet-Brunet","sequence":"additional","affiliation":[{"name":"LASTIG, Univ. Gustave Eiffel, IGN-ENSG, Champs-sur-Marne, France"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0656-3165","authenticated-orcid":false,"given":"Livio","family":"de Luca","sequence":"additional","affiliation":[{"name":"MAP, UPR CNRS 2002, Marseille, France"}]}],"member":"320","published-online":{"date-parts":[[2025,10,26]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"iSEARLE: Improving Textual Inversion for Zero-Shot Composed Image Retrieval. arXiv 2405.02951","author":"Agnolucci Lorenzo","year":"2024","unstructured":"Lorenzo Agnolucci, Alberto Baldrati, Marco Bertini, and Alberto Del Bimbo. 2024. iSEARLE: Improving Textual Inversion for Zero-Shot Composed Image Retrieval. arXiv 2405.02951 (2024)."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.150"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00083"},{"key":"e_1_3_2_1_4_1","volume-title":"Sentence-level Prompts Benefit Composed Image Retrieval. In International Conference on Learning Representations (ICLR).","author":"Yang","year":"2024","unstructured":"Yang bai, Xinxing Xu, Yong Liu, Salman Khan, Fahad Khan, Wangmeng Zuo, Rick Siow Mong Goh, and Chun-Mei Feng. 2024. Sentence-level Prompts Benefit Composed Image Retrieval. In International Conference on Learning Representations (ICLR)."},{"key":"e_1_3_2_1_5_1","unstructured":"Alberto Baldrati Marco Bertini Tiberio Uricchio and Alberto Del Bimbo. [n.d.]. Composed Image Retrieval using Contrastive Learning and Task-oriented CLIP-based Features. ACM Transactions on Multimedia Computing Communications and Applications ([n.d.])."},{"key":"e_1_3_2_1_6_1","volume-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 5396-5407","author":"Berton Gabriele","year":"2022","unstructured":"Gabriele Berton, Riccardo Mereu, Gabriele Trivigno, Carlo Masone, Gabriela Csurka, Torsten Sattler, and Barbara Caputo. 2022. Deep visual geo-localization benchmark. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 5396-5407."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/3475720.3484444"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"crossref","unstructured":"Emile Blettery and Val\u00e9rie Gouet-Brunet. 2024. Heritage Iconographic Content Structuring: from Automatic Linking to Visual Validation. In Journal on Computing and Cultural Heritage.","DOI":"10.1145\/3666007"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","unstructured":"Dylan Campbell Liu Liu and Stephen Gould. 2020. Solving the Blind Perspective-n-Point Problem End-To-End with Robust Differentiable Geometric Optimization. In ECCV. * equal contribution.","DOI":"10.1007\/978-3-030-58536-5_15"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58565-5_43"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/3DV53792.2021.00125"},{"key":"e_1_3_2_1_12_1","volume-title":"Deep learning for instance retrieval: A survey","author":"Chen Wei","year":"2022","unstructured":"Wei Chen, Yu Liu, Weiping Wang, Erwin M Bakker, Theodoros Georgiou, Paul Fieguth, Li Liu, and Michael S Lew. 2022. Deep learning for instance retrieval: A survey. IEEE Transactions on Pattern Analysis and Machine Intelligence (2022)."},{"key":"e_1_3_2_1_13_1","volume-title":"European Conference on Computer Vision.","author":"Csurka Gabriella","year":"2002","unstructured":"Gabriella Csurka, C. Dance, Lixin Fan, J. Willamowski, and C\u00e9dric Bray. 2002. Visual categorization with bags of keypoints. In European Conference on Computer Vision."},{"key":"e_1_3_2_1_14_1","volume-title":"International Conference on Computer Vision Theory and Applications","volume":"2","author":"Delvinioti Agni","year":"2014","unstructured":"Agni Delvinioti, Herv\u00e9 J\u00e9gou, Laurent Amsaleg, and Michael E Houle. 2014. Image retrieval with reciprocal and shared nearest neighbors. In International Conference on Computer Vision Theory and Applications, Vol. 2. 321-328. doi:10. 5220\/0004672303210328"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01181"},{"key":"e_1_3_2_1_17_1","volume-title":"Composed Image Retrieval for Training-Free Domain Conversion. arXiv 2412.03297","author":"Efthymiadis Nikos","year":"2024","unstructured":"Nikos Efthymiadis, Bill Psomas, Zakaria Laskar, Konstantinos Karantzalos, Yannis Avrithis, Ond\u0159ej Chum, and Giorgos Tolias. 2024. Composed Image Retrieval for Training-Free Domain Conversion. arXiv 2412.03297 (2024)."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.5194\/isprsarchives-xl-5-w1-81-2013"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58604-1_11"},{"key":"e_1_3_2_1_20_1","first-page":"3041","volume-title":"CVPR","author":"Hartley Richard","year":"2011","unstructured":"Richard Hartley, Khurrum Aftab, and Jochen Trumpf. 2011. L1 rotation averaging using the Weiszfeld algorithm. In CVPR 2011. IEEE, 3041-3048."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511811685"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_1_23_1","volume-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition.","author":"Huang Huaibo","year":"2023","unstructured":"Huaibo Huang, Xiaoqiang Zhou, Jie Cao, Ran He, and Tieniu Tan. 2023. Vision Transformer with Super Token Sampling. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.105"},{"key":"e_1_3_2_1_25_1","volume-title":"HyCIR: Boosting Zero-Shot Composed Image Retrieval with Synthetic Labels. arXiv 2407.05795","author":"Jiang Yingying","year":"2024","unstructured":"Yingying Jiang, Hanchao Jia, Xiaobing Wang, and Peng Hao. 2024. HyCIR: Boosting Zero-Shot Composed Image Retrieval with Synthetic Labels. arXiv 2407.05795 (2024)."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995464"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.113"},{"key":"e_1_3_2_1_28_1","unstructured":"Seongwon Lee Suhyeon Lee Hongje Seong and Euntai Kim. 2023. Revisiting Self-Similarity: Structural Embedding for Image Retrieval. In Computer Vision and Pattern Recognition (CVPR)."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00530"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1007\/S11263-008-0152-6"},{"key":"e_1_3_2_1_31_1","volume-title":"European Conference on Computer Vision. Springer, 71-91","author":"Leroy Vincent","year":"2024","unstructured":"Vincent Leroy, Yohann Cabon, and J\u00e9r\u00f4me Revaud. 2024. Grounding image matching in 3d with mast3r. In European Conference on Computer Vision. Springer, 71-91."},{"key":"e_1_3_2_1_32_1","volume-title":"Sepvit: Separable vision transformer. arXiv preprint arXiv:2203.15380","author":"Li Wei","year":"2022","unstructured":"Wei Li, Xing Wang, Xin Xia, Jie Wu, Jiashi Li, Xuefeng Xiao, Min Zheng, and Shiping Wen. 2022. Sepvit: Separable vision transformer. arXiv preprint arXiv:2203.15380 (2022)."},{"key":"e_1_3_2_1_33_1","volume-title":"Imagine and Seek: Improving Composed Image Retrieval with an Imagined Proxy. arXiv 2411.16752","author":"Li You","year":"2024","unstructured":"You Li, Fan Ma, and Yi Yang. 2024. Imagine and Seek: Improving Composed Image Retrieval with an Imagined Proxy. arXiv 2411.16752 (2024)."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1080\/0952813X.2021.1938695"},{"key":"e_1_3_2_1_35_1","volume-title":"International Conference on Computer Vision. https:\/\/arxiv.org\/pdf\/2306","author":"Lindenberger Philipp","year":"2023","unstructured":"Philipp Lindenberger, Paul-Edouard Sarlin, and Marc Pollefeys. 2023. LightGlue: Local Feature Matching at Light Speed. In International Conference on Computer Vision. https:\/\/arxiv.org\/pdf\/2306.13643.pdf"},{"key":"e_1_3_2_1_36_1","first-page":"1178","article-title":"Camera orientation optimization in stereo vision systems for low measurement error","volume":"26","author":"Liu Xingjian","year":"2020","unstructured":"Xingjian Liu, Wenyuan Chen,Harikrishnan Madhusudanan, Linghao Du, and Yu Sun. 2020. Camera orientation optimization in stereo vision systems for low measurement error. IEEE\/ASME Transactions on Mechatronics 26, 2 (2020), 1178-1182.","journal-title":"IEEE\/ASME Transactions on Mechatronics"},{"key":"e_1_3_2_1_37_1","volume-title":"IEEE Winter Conference on Applications of Computer Vision (WACV).","author":"Liu Zheyuan","year":"2024","unstructured":"Zheyuan Liu, Weixuan Sun, Yicong Hong, Damien Teney, and Stephen Gould. 2024. Bi-Directional Training for Composed Image Retrieval via Text Prompt Learning. In IEEE Winter Conference on Applications of Computer Vision (WACV)."},{"key":"e_1_3_2_1_38_1","unstructured":"Zheyuan Liu Weixuan Sun Damien Teney and Stephen Gould. 2023. Candidate Set Re-ranking for Composed Image Retrieval with Dual Multi-modal Encoder. In arXiv.org."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-020-01359-2"},{"key":"e_1_3_2_1_40_1","volume-title":"Proceedings of the IEEE\/CVF International Conference on Computer Vision. 252-262","author":"Moreau Arthur","year":"2023","unstructured":"Arthur Moreau, Nathan Piasco, Moussab Bennehar, Dzmitry Tsishkou, Bogdan Stanciulescu, and Arnaud de La Fortelle. 2023. Crossfire: Camera relocalization on self-supervised features from an implicit representation. In Proceedings of the IEEE\/CVF International Conference on Computer Vision. 252-262."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109655"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-024-00864-x"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1109\/3DV50981.2020.00058"},{"key":"e_1_3_2_1_46_1","volume-title":"Composed Image Retrieval for Remote Sensing. In IGARSS 2024-2024 IEEE International Geoscience and Remote Sensing Symposium. IEEE, 8526-8534","author":"Psomas Bill","year":"2024","unstructured":"Bill Psomas,Ioannis Kakogeorgiou, Nikos Efthymiadis, Giorgos Tolias, Ond\u0159ej Chum, Yannis Avrithis, and Konstantinos Karantzalos. 2024. Composed Image Retrieval for Remote Sensing. In IGARSS 2024-2024 IEEE International Geoscience and Remote Sensing Symposium. IEEE, 8526-8534."},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2846566"},{"key":"e_1_3_2_1_48_1","volume-title":"Learning Transferable Visual Models From Natural Language Supervision. In International Conference on Machine Learning (ICML).","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, Gretchen Krueger, and Ilya Sutskever. 2021. Learning Transferable Visual Models From Natural Language Supervision. In International Conference on Machine Learning (ICML)."},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1186\/s40965-017-0027-2"},{"key":"e_1_3_2_1_50_1","volume-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","author":"Sariyildiz Mert Bulent","year":"2025","unstructured":"Mert Bulent Sariyildiz, Philippe Weinzaepfel, Thomas Lucas, Pau De Jorge, Diane Larlus, and Yannis Kalantidis. 2025. DUNE: Distilling a Universal Encoder from heterogenous 2D and 3D teachers. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). Nashville, Tennessee, USA."},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00326"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10593-2_54"},{"key":"e_1_3_2_1_53_1","volume-title":"Conference on Computer Vision and Pattern Recognition. 3302-3312","author":"Sattler Torsten","year":"2019","unstructured":"Torsten Sattler, Qunjie Zhou, Marc Pollefeys, and Laura Leal-Taixe. 2019. Un-derstanding the limitations of cnn-based absolute camera pose regression. In Conference on Computer Vision and Pattern Recognition. 3302-3312. doi:10.1109\/ CVPR.2019.00342"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.445"},{"key":"e_1_3_2_1_55_1","first-page":"25932","article-title":"Re-ranking for image retrieval and transductive few-shot classification","author":"Shen Xi","year":"2021","unstructured":"Xi Shen, Yang Xiao, Hu Shell Xu, Othman Sbai, and Mathieu Aubry. 2021. Re-ranking for image retrieval and transductive few-shot classification. In Advances on Neural Information Processing Systems. 25932-25943. https:\/\/proceedings.neurips.cc\/paper\/2021\/hash\/d9fc0cdb67638d50f411432d0d41d0ba-Abstract.html","journal-title":"Advances on Neural Information Processing Systems."},{"key":"e_1_3_2_1_56_1","first-page":"1","volume-title":"International Conference on Learning Representations","author":"Simonyan Karen","year":"2015","unstructured":"Karen Simonyan and Andrew Zisserman. 2015. Very deep convolutional net-works for large-scale image recognition. International Conference on Learning Representations (2015), 1-14. https:\/\/arxiv.org\/pdf\/1409.1556.pdf%E3%80%82"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1109\/iccv.2003.1238663"},{"key":"e_1_3_2_1_58_1","volume-title":"A Comprehensive Survey on Composed Image Retrieval. arXiv 2502.18495","author":"Song Xuemeng","year":"2025","unstructured":"Xuemeng Song, Haoqiang Lin, Haokun Wen, Bohan Hou, Mingzhu Xu, and Liqiang Nie. 2025. A Comprehensive Survey on Composed Image Retrieval. arXiv 2502.18495 (2025)."},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2016.2568743"},{"key":"e_1_3_2_1_60_1","volume-title":"Training-free zero-shot composed image retrieval with local concept reranking. arXiv preprint arXiv:2312.08924","author":"Sun Shitong","year":"2023","unstructured":"Shitong Sun, Fanghua Ye, and Shaogang Gong. 2023. Training-free zero-shot composed image retrieval with local concept reranking. arXiv preprint arXiv:2312.08924 (2023)."},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"publisher","DOI":"10.1007\/S11263-015-0810-4"},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_27"},{"key":"e_1_3_2_1_63_1","volume-title":"SPARO: Selective Attention for Robust and Compositional Transformer Encodings for Vision. In European Conference on Computer Vision (ECCV).","author":"Vani Ankit","year":"2024","unstructured":"Ankit Vani, Bac Nguyen, Samuel Lavoie, Ranjay Krishna,and Aaron Courville. 2024. SPARO: Selective Attention for Robust and Compositional Transformer Encodings for Vision. In European Conference on Computer Vision (ECCV)."},{"key":"e_1_3_2_1_64_1","volume-title":"End-to-end 2d-3d registration between image and lidar point cloud for vehicle localization. arXiv preprint arXiv:2306.11346","author":"Wang Guangming","year":"2023","unstructured":"Guangming Wang, Yu Zheng, Yanfeng Guo, Zhe Liu, Yixiang Zhu, Wolfram Burgard, and Hesheng Wang. 2023. End-to-end 2d-3d registration between image and lidar point cloud for vehicle localization. arXiv preprint arXiv:2306.11346 (2023)."},{"key":"e_1_3_2_1_65_1","doi-asserted-by":"publisher","DOI":"10.1007\/S11432-019-2811-8"},{"key":"e_1_3_2_1_66_1","volume-title":"Pro-ceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 20881-20891","author":"Wang Shuzhe","year":"2024","unstructured":"Shuzhe Wang, Juho Kannala, and Daniel Barath. 2024. DGC-GNN: Leveraging Geometry and Color Cues for Visual Descriptor-Free 2D-3D Matching. In Pro-ceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 20881-20891."},{"key":"e_1_3_2_1_67_1","volume-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). 20697-20709","author":"Wang Shuzhe","year":"2024","unstructured":"Shuzhe Wang, Vincent Leroy, Yohann Cabon, Boris Chidlovskii, and Jerome Revaud. 2024. DUSt3R: Geometric 3D Vision Made Easy. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). 20697-20709."},{"key":"e_1_3_2_1_68_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00061"},{"key":"e_1_3_2_1_69_1","doi-asserted-by":"publisher","DOI":"10.1145\/3607542.3617353"},{"key":"e_1_3_2_1_70_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01139"},{"key":"e_1_3_2_1_71_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01156"},{"key":"e_1_3_2_1_72_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248032"},{"key":"e_1_3_2_1_73_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-021-01469-5"},{"key":"e_1_3_2_1_74_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00309"},{"key":"e_1_3_2_1_75_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33709-3_47"},{"key":"e_1_3_2_1_76_1","unstructured":"Xuanmeng Zhang Minyue Jiang Zhedong Zheng Xiao Tan Errui Ding and Yi Yang. 2020. Understanding Image Retrieval Re-Ranking: A Graph Neural Network Perspective. (2020). https:\/\/arxiv.org\/abs\/2012.07620"},{"key":"e_1_3_2_1_77_1","volume-title":"Indica-tive Image Retrieval: Turning Blackbox Learning into Grey. arXiv preprint","author":"Zhang Xulu","year":"2022","unstructured":"Xulu Zhang, Zhenqun Yang, Hao Tian, Qing Li, and Xiaoyong Wei. 2022. Indica-tive Image Retrieval: Turning Blackbox Learning into Grey. arXiv preprint (2022). https:\/\/arxiv.org\/abs\/2201.11898"},{"key":"e_1_3_2_1_78_1","volume-title":"Learning Spatial-context-aware Global Visual Feature Representation for Instance Image Retrieval. In IEEE International Conference on Computer Vision (ICCV).","author":"Zhang Zhongyan","year":"2023","unstructured":"Zhongyan Zhang, Lei Wang, Luping Zhou, and Piotr Koniusz. 2023. Learning Spatial-context-aware Global Visual Feature Representation for Instance Image Retrieval. In IEEE International Conference on Computer Vision (ICCV)."},{"key":"e_1_3_2_1_79_1","volume-title":"2020 IEEE International Conference on Robotics and Automation (ICRA). IEEE, 3319-3326","author":"Zhou Qunjie","year":"2020","unstructured":"Qunjie Zhou, Torsten Sattler, Marc Pollefeys, and Laura Leal-Taixe. 2020. To learn or not to learn: Visual localization from essential matrices. In 2020 IEEE International Conference on Robotics and Automation (ICRA). IEEE, 3319-3326."},{"key":"e_1_3_2_1_80_1","volume-title":"Proceedings of the Conference on Computer Vision and Pattern Recognition (CVPR).","author":"Zhu Sijie","year":"2023","unstructured":"Sijie Zhu, Linjie Yang, Chen Chen, Mubarak Shah, Xiaohui Shen, and Heng Wang. 2023. Former: Unified etrieval and eranking Transformer for Place Recognition. In Proceedings of the Conference on Computer Vision and Pattern Recognition (CVPR)."}],"event":{"name":"MM '25:The 33rd ACM International Conference on Multimedia","location":"Dublin Ireland","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 7th International Workshop on analySis, Understanding and proMotion of heritAge Contents"],"original-title":[],"deposited":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T14:53:12Z","timestamp":1761403992000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3746273.3760200"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,26]]},"references-count":80,"alternative-id":["10.1145\/3746273.3760200","10.1145\/3746273"],"URL":"https:\/\/doi.org\/10.1145\/3746273.3760200","relation":{},"subject":[],"published":{"date-parts":[[2025,10,26]]},"assertion":[{"value":"2025-10-26","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}