{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:57:41Z","timestamp":1781539061324,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":68,"publisher":"ACM","license":[{"start":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T00:00:00Z","timestamp":1781481600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/legalcode"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,6,16]]},"DOI":"10.1145\/3805622.3810746","type":"proceedings-article","created":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T14:42:57Z","timestamp":1781534577000},"page":"615-624","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Real-Time Retrieval-Free Camera Pose Estimation via Sparse Cross-Modal 2D\u20133D Matching with Projection-Guided Refinement"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-3094-0688","authenticated-orcid":false,"given":"Fan","family":"Wu","sequence":"first","affiliation":[{"name":"IRT b&lt;&gt;com, Cesson-S\u00e9vign\u00e9, France and Lab-STICC UMR 6285, IMT Atlantique, Plouzan\u00e9, France"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8409-6246","authenticated-orcid":false,"given":"Amine","family":"Kacete","sequence":"additional","affiliation":[{"name":"IRT b&lt;&gt;com, Cesson-S\u00e9vign\u00e9, France"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9485-8638","authenticated-orcid":false,"given":"J\u00e9r\u00f4me","family":"Royan","sequence":"additional","affiliation":[{"name":"IRT b&lt;&gt;com, Cesson-S\u00e9vign\u00e9, France"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2215-1865","authenticated-orcid":false,"given":"Guillaume","family":"Moreau","sequence":"additional","affiliation":[{"name":"Lab-STICC UMR 6285, IMT Atlantique, Plouzan\u00e9, France"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,6,15]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"crossref","unstructured":"Thuan\u00a0Bui Bach Tuan\u00a0Tran Dinh and Joo-Ho Lee. 2022. FeatLoc: Absolute pose regressor for indoor 2D sparse features with simplistic view synthesizing. ISPRS Journal of Photogrammetry and Remote Sensing 189 (2022) 50\u201362.","DOI":"10.1016\/j.isprsjprs.2022.04.021"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00639"},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01264-9_46"},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","DOI":"10.1117\/12.57955"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00488"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.267"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00489"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"crossref","unstructured":"Eric Brachmann and Carsten Rother. 2021. Visual camera re-localization from RGB and RGB-D images using DSAC. IEEE transactions on pattern analysis and machine intelligence 44 9 (2021) 5847\u20135865.","DOI":"10.1109\/TPAMI.2021.3070754"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"crossref","unstructured":"Bach-Thuan Bui Huy-Hoang Bui Dinh-Tuan Tran and Joo-Ho Lee. 2024. D2S: Representing sparse descriptors and 3D coordinates for camera relocalization. IEEE Robotics and Automation Letters 9 2 (2024) 1234\u20131241.","DOI":"10.1109\/LRA.2024.3487503"},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"crossref","unstructured":"Yujin Chen Ruizhi Chen Mengyun Liu Aoran Xiao Dewen Wu and Shuheng Zhao. 2018. Indoor visual positioning aided by CNN-based image retrieval: Training-free 3D modeling-free. Sensors 18 8 (2018) 2692.","DOI":"10.3390\/s18082692"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00905"},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"crossref","unstructured":"Haowen Deng Mai Bui Nassir Navab Leonidas Guibas Slobodan Ilic and Tolga Birdal. 2022. Deep bingham networks: Dealing with uncertainty and ambiguity in pose estimation. International Journal of Computer Vision 130 7 (2022) 1627\u20131654.","DOI":"10.1007\/s11263-022-01612-w"},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.01560"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8794280"},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.199"},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00425"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.02520"},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.01077"},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2016.7487679"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.336"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"crossref","unstructured":"Bernhard Kerbl Georgios Kopanas Thomas Leimk\u00fchler and George Drettakis. 2023. 3D Gaussian Splatting for Real-Time Radiance Field Rendering. ACM Trans. Graph. 42 4 (2023) 139\u20131.","DOI":"10.1145\/3592433"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.113"},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01200"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"publisher","DOI":"10.1109\/IROS60139.2025.11247012"},{"key":"e_1_3_3_1_26_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Liu Changkun","year":"2025","unstructured":"Changkun Liu, Shuai Chen, Yash\u00a0Sanjay Bhalgat, Siyan HU, Ming Cheng, Zirui Wang, Victor\u00a0Adrian Prisacariu, and Tristan Braud. 2025. GS-CPR: Efficient Camera Pose Refinement via 3D Gaussian Splatting. In The Thirteenth International Conference on Learning Representations."},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10610903"},{"key":"e_1_3_3_1_28_2","first-page":"256","volume-title":"European Conference on Computer Vision","author":"Lu Xiaoyong","year":"2024","unstructured":"Xiaoyong Lu and Songlin Du. 2024. Raising the ceiling: conflict-free local feature matching with dynamic view switching. In European Conference on Computer Vision. Springer, Milan, Italy, 256\u2013273."},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2017.107"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"crossref","unstructured":"Ben Mildenhall Pratul\u00a0P Srinivasan Matthew Tancik Jonathan\u00a0T Barron Ravi Ramamoorthi and Ren Ng. 2021. Nerf: Representing scenes as neural radiance fields for view synthesis. Commun. ACM 65 1 (2021) 99\u2013106.","DOI":"10.1145\/3503250"},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00030"},{"key":"e_1_3_3_1_32_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA55743.2025.11127431"},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01072"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"publisher","DOI":"10.1109\/3DV62453.2024.00139"},{"key":"e_1_3_3_1_35_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00259"},{"key":"e_1_3_3_1_36_2","first-page":"69","volume-title":"Proceedings of the British Machine Vision Conference (BMVC)","author":"Purkait Pulak","year":"2018","unstructured":"Pulak Purkait, Cheng Zhao, and Christopher Zach. 2018. Synthetic View Generation for Absolute Pose Regression and Image Synthesis. In Proceedings of the British Machine Vision Conference (BMVC). BMVA Press, Newcastle, United Kingdom, 69."},{"key":"e_1_3_3_1_37_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01300"},{"key":"e_1_3_3_1_38_2","first-page":"456","volume-title":"Proceedings of the Conference on Robot Learning (CoRL)","author":"Sarlin Paul-Edouard","year":"2018","unstructured":"Paul-Edouard Sarlin, Fr\u00e9d\u00e9ric Debraine, Marcin Dymczyk, Roland Siegwart, and Cesar Cadena. 2018. Leveraging deep visual descriptors for hierarchical efficient localization. In Proceedings of the Conference on Robot Learning (CoRL). PMLR, Z\u00fcrich, Switzerland, 456\u2013465."},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00326"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126302"},{"key":"e_1_3_3_1_41_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33718-5_54"},{"key":"e_1_3_3_1_42_2","doi-asserted-by":"crossref","unstructured":"Torsten Sattler Bastian Leibe and Leif Kobbelt. 2016. Efficient & effective prioritized matching for large-scale image-based localization. IEEE transactions on pattern analysis and machine intelligence 39 9 (2016) 1744\u20131756.","DOI":"10.1109\/TPAMI.2016.2611662"},{"key":"e_1_3_3_1_43_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00342"},{"key":"e_1_3_3_1_44_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.445"},{"key":"e_1_3_3_1_45_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.377"},{"key":"e_1_3_3_1_46_2","unstructured":"Rashik Shrestha Bishad Koju Abhigyan Bhusal Danda\u00a0Pani Paudel and Fran\u00e7ois Rameau. 2023. CaLDiff: Camera localization in NeRF via pose diffusion. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2312.15242 (2023)."},{"key":"e_1_3_3_1_47_2","doi-asserted-by":"publisher","DOI":"10.1109\/IROS60139.2025.11246406"},{"key":"e_1_3_3_1_48_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00881"},{"key":"e_1_3_3_1_49_2","unstructured":"Yuan Sun Xuan Wang Yunfan Zhang Jie Zhang Caigui Jiang Yu Guo and Fei Wang. 2023. iComma: Inverting 3D Gaussian Splatting for Camera Pose Estimation via Comparing and Matching. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2312.09031 (2023)."},{"key":"e_1_3_3_1_50_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00096"},{"key":"e_1_3_3_1_51_2","volume-title":"International Conference on Learning Representations (ICLR)","author":"Tian Yonglong","year":"2020","unstructured":"Yonglong Tian, Dilip Krishnan, and Phillip Isola. 2020. Contrastive Representation Distillation. In International Conference on Learning Representations (ICLR)."},{"key":"e_1_3_3_1_52_2","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2016.41"},{"key":"e_1_3_3_1_53_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.75"},{"key":"e_1_3_3_1_54_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i06.6608"},{"key":"e_1_3_3_1_55_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.00499"},{"key":"e_1_3_3_1_56_2","doi-asserted-by":"crossref","unstructured":"Junyi Wang and Yue Qi. 2024. Visual camera relocalization using both hand-crafted and learned features. Pattern Recognition 145 (2024) 109914.","DOI":"10.1016\/j.patcog.2023.109914"},{"key":"e_1_3_3_1_57_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01956"},{"key":"e_1_3_3_1_58_2","unstructured":"Zhaohui Wang Rong Wei Jingbo Yu Dong Li Xiangde Liu et\u00a0al. 2025. R3GS: Gaussian Splatting for Robust Reconstruction and Relocalization in Unconstrained Image Collections. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2505.15294 (2025)."},{"key":"e_1_3_3_1_59_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10611622"},{"key":"e_1_3_3_1_60_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00013"},{"key":"e_1_3_3_1_61_2","doi-asserted-by":"crossref","unstructured":"Shun Yao Yongmei Cheng Fei Yang and Mikhail\u00a0G Mozerov. 2025. Implicit Neural Representation Model for Camera Relocalization in Multiple Scenes. Pattern Recognition 158 (2025) 111791.","DOI":"10.1016\/j.patcog.2025.111791"},{"key":"e_1_3_3_1_62_2","doi-asserted-by":"publisher","DOI":"10.1109\/IROS51168.2021.9636708"},{"key":"e_1_3_3_1_63_2","doi-asserted-by":"crossref","unstructured":"Jiahao Yin Xinyu Zhou Huahui Xiao Zhili Liu Wei Li Xue Li and Shengyin Fan. 2022. HAPOR: Hierarchical-features aligned projection optimization for relocalization. IEEE Robotics and Automation Letters 8 3 (2022) 1447\u20131454.","DOI":"10.1109\/LRA.2022.3226069"},{"key":"e_1_3_3_1_64_2","unstructured":"Hailin Yu Youji Feng Weicai Ye Mingxuan Jiang Hujun Bao and Guofeng Zhang. 2022. Improving feature-based visual localization by geometry-aided matching. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2211.08712 (2022)."},{"key":"e_1_3_3_1_65_2","doi-asserted-by":"publisher","DOI":"10.1145\/3206025.3206080"},{"key":"e_1_3_3_1_66_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.29"},{"key":"e_1_3_3_1_67_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i7.28576"},{"key":"e_1_3_3_1_68_2","first-page":"108","volume-title":"European Conference on Computer Vision (ECCV)","author":"Zhou Qunjie","year":"2024","unstructured":"Qunjie Zhou, Maxim Maximov, Or Litany, and Laura Leal-Taix\u00e9. 2024. The NeRFect Match: Exploring NeRF Features for Visual Localization. In European Conference on Computer Vision (ECCV). Springer, Milan, Italy, 108\u2013127."},{"key":"e_1_3_3_1_69_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02048"}],"event":{"name":"ICMR '26: International Conference on Multimedia Retrieval","location":"Amsterdam The Netherlands","acronym":"ICMR '26","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 2026 International Conference on Multimedia Retrieval"],"original-title":[],"deposited":{"date-parts":[[2026,6,15]],"date-time":"2026-06-15T15:41:38Z","timestamp":1781538098000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3805622.3810746"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6,15]]},"references-count":68,"alternative-id":["10.1145\/3805622.3810746","10.1145\/3805622"],"URL":"https:\/\/doi.org\/10.1145\/3805622.3810746","relation":{},"subject":[],"published":{"date-parts":[[2026,6,15]]},"assertion":[{"value":"2026-06-15","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}