{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T16:42:41Z","timestamp":1777653761769,"version":"3.51.4"},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2023,5,24]],"date-time":"2023-05-24T00:00:00Z","timestamp":1684886400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,5,24]],"date-time":"2023-05-24T00:00:00Z","timestamp":1684886400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2024,3]]},"DOI":"10.1007\/s00371-023-02889-9","type":"journal-article","created":{"date-parts":[[2023,5,24]],"date-time":"2023-05-24T18:02:16Z","timestamp":1684951336000},"page":"1839-1851","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["MIVI: multi-stage feature matching for infrared and visible image"],"prefix":"10.1007","volume":"40","author":[{"given":"Yide","family":"Di","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yun","family":"Liao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kaijun","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hao","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yijia","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qing","family":"Duan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Junhui","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8663-9870","authenticated-orcid":false,"given":"Mingyu","family":"Lu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,5,24]]},"reference":[{"key":"2889_CR1","doi-asserted-by":"publisher","first-page":"3334","DOI":"10.1109\/TIP.2022.3169693","volume":"31","author":"D Cheng","year":"2022","unstructured":"Cheng, D., Zhou, J., Wang, N., Gao, X.: Hybrid dynamic contrast and probability distillation for unsupervised person Re-Id. IEEE Trans. Image Process. 31, 3334\u20133346 (2022). https:\/\/doi.org\/10.1109\/TIP.2022.3169693","journal-title":"IEEE Trans. Image Process."},{"key":"2889_CR2","doi-asserted-by":"publisher","unstructured":"Taira, H., Okutomi, M., Sattler, T., Cimpoi, M., Pollefeys, M., Sivic, J., Pajdla, T., Torii, A.: Inloc: indoor visual localization with dense matching and view synthesis. In: 2018 IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2018, Salt Lake City, UT, USA, June 18\u201322, 2018, pp. 7199\u20137209. Computer Vision Foundation \/ IEEE Computer Society (2018). https:\/\/doi.org\/10.1109\/CVPR.2018.00752. http:\/\/openaccess.thecvf.com\/content_cvpr_2018\/html\/Taira_InLoc_Indoor_Visual_CVPR_2018_paper.html","DOI":"10.1109\/CVPR.2018.00752"},{"issue":"4","key":"2889_CR3","doi-asserted-by":"publisher","first-page":"8726","DOI":"10.1109\/LRA.2021.3111760","volume":"6","author":"S Yoon","year":"2021","unstructured":"Yoon, S., Kim, A.: Line as a visual sentence: context-aware line descriptor for visual localization. IEEE Robot. Autom. Lett. 6(4), 8726\u20138733 (2021). https:\/\/doi.org\/10.1109\/LRA.2021.3111760","journal-title":"IEEE Robot. Autom. Lett."},{"key":"2889_CR4","doi-asserted-by":"publisher","unstructured":"Lindenberger, P., Sarlin, P., Larsson, V., Pollefeys, M.: Pixel-perfect structure-from-motion with featuremetric refinement. In: 2021 IEEE\/CVF International Conference on Computer Vision, ICCV 2021, Montreal, QC, Canada, October 10\u201317, 2021, pp. 5967\u20135977. IEEE (2021). https:\/\/doi.org\/10.1109\/ICCV48922.2021.00593","DOI":"10.1109\/ICCV48922.2021.00593"},{"key":"2889_CR5","doi-asserted-by":"publisher","unstructured":"Sch\u00f6nberger, J.L., Frahm, J.: Structure-from-motion revisited. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2016, Las Vegas, NV, USA, June 27\u201330, 2016, pp. 4104\u20134113. IEEE Computer Society (2016). https:\/\/doi.org\/10.1109\/CVPR.2016.445","DOI":"10.1109\/CVPR.2016.445"},{"key":"2889_CR6","doi-asserted-by":"crossref","unstructured":"Chen, H., Hu, W., Yang, K., Bai, J., Wang, K.: Panoramic annular SLAM with loop closure and global optimization. CoRR abs\/2102.13400 (2021) arXiv:2102.13400","DOI":"10.1364\/AO.424280"},{"issue":"22","key":"2889_CR7","doi-asserted-by":"publisher","first-page":"8830","DOI":"10.1016\/j.eswa.2015.07.035","volume":"42","author":"J Son","year":"2015","unstructured":"Son, J., Kim, S., Sohn, K.: A multi-vision sensor-based fast localization system with image matching for challenging outdoor environments. Expert Syst. Appl. 42(22), 8830\u20138839 (2015). https:\/\/doi.org\/10.1016\/j.eswa.2015.07.035","journal-title":"Expert Syst. Appl."},{"issue":"11","key":"2889_CR8","doi-asserted-by":"publisher","first-page":"16491","DOI":"10.1007\/s11042-020-10213-z","volume":"80","author":"X Liu","year":"2021","unstructured":"Liu, X., Li, J., Pan, J., Wang, S.: An advanced gradient texture feature descriptor based on phase information for infrared and visible image matching. Multim. Tools Appl. 80(11), 16491\u201316511 (2021). https:\/\/doi.org\/10.1007\/s11042-020-10213-z","journal-title":"Multim. Tools Appl."},{"key":"2889_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TGRS.2021.3099506","volume":"60","author":"S Cui","year":"2022","unstructured":"Cui, S., Ma, A., Wan, Y., Zhong, Y., Luo, B., Xu, M.: Cross-modality image matching network with modality-invariant feature representation for airborne-ground thermal infrared and visible datasets. IEEE Trans. Geosci. Remote. Sens. 60, 1\u201314 (2022). https:\/\/doi.org\/10.1109\/TGRS.2021.3099506","journal-title":"IEEE Trans. Geosci. Remote. Sens."},{"key":"2889_CR10","doi-asserted-by":"publisher","unstructured":"Sun, J., Shen, Z., Wang, Y., Bao, H., Zhou, X.: Loftr: Detector-free local feature matching with transformers. In: IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2021, Virtual, June 19\u201325, 2021, pp. 8922\u20138931. Computer Vision Foundation\/IEEE (2021). https:\/\/doi.org\/10.1109\/CVPR46437.2021.00881. https:\/\/openaccess.thecvf.com\/content\/CVPR2021\/html\/Sun_LoFTR_Detector-Free_Local_Feature_Matching_With_Transformers_CVPR_2021_paper.html","DOI":"10.1109\/CVPR46437.2021.00881"},{"key":"2889_CR11","doi-asserted-by":"publisher","unstructured":"B\u00f6kman, G., Kahl, F.: A case for using rotation invariant features in state of the art feature matchers. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, CVPR Workshops 2022, New Orleans, LA, USA, June 19\u201320, 2022, pp. 5106\u20135115. IEEE (2022). https:\/\/doi.org\/10.1109\/CVPRW56347.2022.00559","DOI":"10.1109\/CVPRW56347.2022.00559"},{"key":"2889_CR12","unstructured":"Tang, S., Zhang, J., Zhu, S., Tan, P.: Quadtree attention for vision transformers. In: The Tenth International Conference on Learning Representations, ICLR 2022, Virtual Event, April 25\u201329, 2022. OpenReview.net (2022). https:\/\/openreview.net\/forum?id=fR-EnKWL_Zb"},{"key":"2889_CR13","doi-asserted-by":"publisher","unstructured":"Wang, Q., Zhang, J., Yang, K., Peng, K., Stiefelhagen, R.: Matchformer: interleaving attention in transformers for feature matching. In: Wang, L., Gall, J., Chin, T., Sato, I., Chellappa, R. (eds.) Computer Vision\u2014ACCV 2022\u201416th Asian Conference on Computer Vision, Macao, China, December 4\u20138, 2022, Proceedings, Part III. Lecture Notes in Computer Science, vol. 13843, pp. 256\u2013273. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-26313-2_16","DOI":"10.1007\/978-3-031-26313-2_16"},{"issue":"2","key":"2889_CR14","doi-asserted-by":"publisher","first-page":"595","DOI":"10.1109\/TPAMI.2019.2930192","volume":"43","author":"D Bhattacharjee","year":"2021","unstructured":"Bhattacharjee, D., Roy, H.: Pattern of local gravitational force (PLGF): a novel local image descriptor. IEEE Trans. Pattern Anal. Mach. Intell. 43(2), 595\u2013607 (2021). https:\/\/doi.org\/10.1109\/TPAMI.2019.2930192","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"4","key":"2889_CR15","doi-asserted-by":"publisher","first-page":"568","DOI":"10.1109\/LGRS.2018.2876661","volume":"16","author":"MA Ghannadi","year":"2019","unstructured":"Ghannadi, M.A., Saadatseresht, M.: A modified local binary pattern descriptor for SAR image matching. IEEE Geosci. Remote. Sens. Lett. 16(4), 568\u2013572 (2019). https:\/\/doi.org\/10.1109\/LGRS.2018.2876661","journal-title":"IEEE Geosci. Remote. Sens. Lett."},{"issue":"2","key":"2889_CR16","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"DG Lowe","year":"2004","unstructured":"Lowe, D.G.: Distinctive image features from scale-invariant keypoints. Int. J. Comput. Vis. 60(2), 91\u2013110 (2004). https:\/\/doi.org\/10.1023\/B:VISI.0000029664.99615.94","journal-title":"Int. J. Comput. Vis."},{"key":"2889_CR17","doi-asserted-by":"publisher","unstructured":"Rublee, E., Rabaud, V., Konolige, K., Bradski, G.R.: ORB: an efficient alternative to SIFT or SURF. In: Metaxas, D.N., Quan, L., Sanfeliu, A., Gool, L.V. (eds.) IEEE International Conference on Computer Vision, ICCV 2011, Barcelona, Spain, November 6\u201313, 2011, pp. 2564\u20132571. IEEE Computer Society (2011). https:\/\/doi.org\/10.1109\/ICCV.2011.6126544","DOI":"10.1109\/ICCV.2011.6126544"},{"key":"2889_CR18","doi-asserted-by":"publisher","unstructured":"Yi, K.M., Trulls, E., Lepetit, V., Fua, P.: LIFT: learned invariant feature transform. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) Computer Vision\u2014ECCV 2016\u201414th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part VI. Lecture Notes in Computer Science, vol. 9910, pp. 467\u2013483. Springer (2016). https:\/\/doi.org\/10.1007\/978-3-319-46466-4_28","DOI":"10.1007\/978-3-319-46466-4_28"},{"key":"2889_CR19","doi-asserted-by":"publisher","unstructured":"Luo, Z., Zhou, L., Bai, X., Chen, H., Zhang, J., Yao, Y., Li, S., Fang, T., Quan, L.: Aslfeat: learning local features of accurate shape and localization. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2020, Seattle, WA, USA, June 13\u201319, 2020, pp. 6588\u20136597. Computer Vision Foundation\/IEEE (2020). https:\/\/doi.org\/10.1109\/CVPR42600.2020.00662. https:\/\/openaccess.thecvf.com\/content_CVPR_2020\/html\/Luo_ASLFeat_Learning_Local_Features_of_Accurate_Shape_and_Localization_CVPR_2020_paper.html","DOI":"10.1109\/CVPR42600.2020.00662"},{"key":"2889_CR20","doi-asserted-by":"publisher","unstructured":"DeTone, D., Malisiewicz, T., Rabinovich, A.: Superpoint: Self-supervised interest point detection and description. In: 2018 IEEE Conference on Computer Vision and Pattern Recognition Workshops, CVPR Workshops 2018, Salt Lake City, UT, USA, June 18\u201322, 2018, pp. 224\u2013236. Computer Vision Foundation\/IEEE Computer Society (2018). https:\/\/doi.org\/10.1109\/CVPRW.2018.00060. http:\/\/openaccess.thecvf.com\/content_cvpr_2018_workshops\/w9\/html\/DeTone_SuperPoint_Self-Supervised_Interest_CVPR_2018_paper.html","DOI":"10.1109\/CVPRW.2018.00060"},{"key":"2889_CR21","doi-asserted-by":"publisher","unstructured":"Fang, Y., Wang, K., Cheng, R., Yang, K.: CFVL: A coarse-to-fine vehicle localizer with omnidirectional perception across severe appearance variations. In: IEEE Intelligent Vehicles Symposium, IV 2020, Las Vegas, NV, USA, October 19\u2013November 13, 2020, pp. 1885\u20131891. IEEE (2020). https:\/\/doi.org\/10.1109\/IV47402.2020.9304612","DOI":"10.1109\/IV47402.2020.9304612"},{"issue":"28\u201329","key":"2889_CR22","doi-asserted-by":"publisher","first-page":"35629","DOI":"10.1007\/s11042-021-10830-2","volume":"80","author":"Y Di","year":"2021","unstructured":"Di, Y., Zhu, X., Jin, X., Dou, Q., Zhou, W., Duan, Q.: Color-UNet++: a resolution for colorization of grayscale images using improved UNet++. Multimed. Tools Appl. 80(28\u201329), 35629\u201335648 (2021). https:\/\/doi.org\/10.1007\/s11042-021-10830-2","journal-title":"Multimed. Tools Appl."},{"key":"2889_CR23","doi-asserted-by":"publisher","unstructured":"Han, X., Leung, T., Jia, Y., Sukthankar, R., Berg, A.C.: Matchnet: unifying feature and metric learning for patch-based matching. In: IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2015, Boston, MA, USA, June 7\u201312, 2015, pp. 3279\u20133286. IEEE Computer Society (2015). https:\/\/doi.org\/10.1109\/CVPR.2015.7298948","DOI":"10.1109\/CVPR.2015.7298948"},{"key":"2889_CR24","doi-asserted-by":"crossref","unstructured":"Balntas, V., Riba, E., Ponsa, D., Mikolajczyk, K.: Learning local feature descriptors with triplets and shallow convolutional neural networks. In: Wilson, R.C., Hancock, E.R., Smith, W.A.P. (eds.) Proceedings of the British Machine Vision Conference 2016, BMVC 2016, York, UK, September 19\u201322, 2016. BMVA Press (2016). http:\/\/www.bmva.org\/bmvc\/2016\/papers\/paper119\/index.html","DOI":"10.5244\/C.30.119"},{"key":"2889_CR25","unstructured":"Mishchuk, A., Mishkin, D., Radenovic, F., Matas, J.: Working hard to know your neighbor\u2019s margins: local descriptor learning loss. In: Guyon, I., von Luxburg, U., Bengio, S., Wallach, H.M., Fergus, R., Vishwanathan, S.V.N., Garnett, R. (eds.) Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4\u20139, 2017, Long Beach, CA, USA, pp. 4826\u20134837 (2017). https:\/\/proceedings.neurips.cc\/paper\/2017\/hash\/831caa1b600f852b7844499430ecac17-Abstract.html"},{"key":"2889_CR26","doi-asserted-by":"publisher","first-page":"448","DOI":"10.1109\/JSTARS.2021.3134676","volume":"15","author":"Y Liao","year":"2022","unstructured":"Liao, Y., Di, Y., Zhou, H., Li, A., Liu, J., Lu, M., Duan, Q.: Feature matching and position matching between optical and SAR with local deep feature descriptor. IEEE JIEEE J. Sel. Top. Appl. Earth Obs. Remote. Sens. 15, 448\u2013462 (2022). https:\/\/doi.org\/10.1109\/JSTARS.2021.3134676","journal-title":"IEEE JIEEE J. Sel. Top. Appl. Earth Obs. Remote. Sens."},{"key":"2889_CR27","doi-asserted-by":"publisher","unstructured":"Giang, K.T., Song, S., Jo, S.: TopicFM: robust and interpretable feature matching with topic-assisted. CoRR abs\/2207.00328 (2022). arXiv:2207.00328. https:\/\/doi.org\/10.48550\/arXiv.2207.00328","DOI":"10.48550\/arXiv.2207.00328"},{"key":"2889_CR28","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, L., Polosukhin, I.: Attention is all you need. In: Guyon, I., von Luxburg, U., Bengio, S., Wallach, H.M., Fergus, R., Vishwanathan, S.V.N., Garnett, R. (eds.) Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4\u20139, 2017, Long Beach, CA, USA, pp. 5998\u20136008 (2017). https:\/\/proceedings.neurips.cc\/paper\/2017\/hash\/3f5ee243547dee91fbd053c1c4a845aa-Abstract.html"},{"key":"2889_CR29","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X., Unterthiner, T., Dehghani, M., Minderer, M., Heigold, G., Gelly, S., Uszkoreit, J., Houlsby, N.: An image is worth $$16\\times 16$$ words: transformers for image recognition at scale. In: 9th International Conference on Learning Representations, ICLR 2021, Virtual Event, Austria, May 3\u20137, 2021. OpenReview.net (2021). https:\/\/openreview.net\/forum?id=YicbFdNTTy"},{"key":"2889_CR30","doi-asserted-by":"publisher","unstructured":"Liu, Z., Lin, Y., Cao, Y., Hu, H., Wei, Y., Zhang, Z., Lin, S., Guo, B.: Swin transformer: hierarchical vision transformer using shifted windows. In: 2021 IEEE\/CVF International Conference on Computer Vision, ICCV 2021, Montreal, QC, Canada, October 10\u201317, 2021, pp. 9992\u201310002. IEEE (2021). https:\/\/doi.org\/10.1109\/ICCV48922.2021.00986","DOI":"10.1109\/ICCV48922.2021.00986"},{"issue":"19","key":"2889_CR31","doi-asserted-by":"publisher","first-page":"4244","DOI":"10.3390\/s19194244","volume":"19","author":"X Liu","year":"2019","unstructured":"Liu, X., Li, J., Pan, J.: Feature point matching based on distinct wavelength phase congruency and log-gabor filters in infrared and visible images. Sensors 19(19), 4244 (2019). https:\/\/doi.org\/10.3390\/s19194244","journal-title":"Sensors"},{"issue":"5","key":"2889_CR32","doi-asserted-by":"publisher","DOI":"10.1117\/1.JEI.24.5.053017","volume":"24","author":"F Wu","year":"2015","unstructured":"Wu, F., Wang, B., Yi, X., Li, M., Hao, J., Qin, H., Zhou, H.: Visible and infrared image registration based on visual salient features. J. Electron. Imaging 24(5), 053017 (2015). https:\/\/doi.org\/10.1117\/1.JEI.24.5.053017","journal-title":"J. Electron. Imaging"},{"key":"2889_CR33","doi-asserted-by":"publisher","first-page":"42562","DOI":"10.1109\/ACCESS.2020.2976767","volume":"8","author":"C Min","year":"2020","unstructured":"Min, C., Gu, Y., Yang, F., Li, Y., Lian, W.: Non-rigid registration for infrared and visible images via Gaussian weighted shape context and enhanced affine transformation. IEEE Access 8, 42562\u201342575 (2020). https:\/\/doi.org\/10.1109\/ACCESS.2020.2976767","journal-title":"IEEE Access"},{"key":"2889_CR34","doi-asserted-by":"publisher","unstructured":"Wang, L., Gao, C., Zhao, Y., Song, T., Feng, Q.: Infrared and visible image registration using transformer adversarial network. In: 2018 IEEE International Conference on Image Processing, ICIP 2018, Athens, Greece, October 7\u201310, 2018, pp. 1248\u20131252. IEEE (2018). https:\/\/doi.org\/10.1109\/ICIP.2018.8451370","DOI":"10.1109\/ICIP.2018.8451370"},{"key":"2889_CR35","doi-asserted-by":"publisher","unstructured":"Arar, M., Ginger, Y., Danon, D., Bermano, A.H., Cohen-Or, D.: Unsupervised multi-modal image registration via geometry preserving image-to-image translation. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2020, Seattle, WA, USA, June 13\u201319, 2020, pp. 13407\u201313416. Computer Vision Foundation\/IEEE (2020). https:\/\/doi.org\/10.1109\/CVPR42600.2020.01342. https:\/\/openaccess.thecvf.com\/content_CVPR_2020\/html\/Arar_Unsupervised_Multi-Modal_Image_Registration_via_Geometry_Preserving_Image-to-Image_Translation_CVPR_2020_paper.html","DOI":"10.1109\/CVPR42600.2020.01342"},{"key":"2889_CR36","doi-asserted-by":"publisher","unstructured":"Hrkac, T., Kalafatic, Z., Krapac, J.: Infrared-visual image registration based on corners and Hausdorff distance. In: Ersb\u00f8ll, B.K., Pedersen, K.S. (eds.) Image Analysis, 15th Scandinavian Conference, SCIA 2007, Aalborg, Denmark, June 10\u201314, 2007, Proceedings. Lecture Notes in Computer Science, vol. 4522, pp. 383\u2013392. Springer (2007). https:\/\/doi.org\/10.1007\/978-3-540-73040-8_39","DOI":"10.1007\/978-3-540-73040-8_39"},{"issue":"3","key":"2889_CR37","doi-asserted-by":"publisher","first-page":"772","DOI":"10.1016\/j.patcog.2014.09.005","volume":"48","author":"J Ma","year":"2015","unstructured":"Ma, J., Zhao, J., Ma, Y., Tian, J.: Non-rigid visible and infrared face registration via regularized gaussian fields criterion. Pattern Recognit. 48(3), 772\u2013784 (2015). https:\/\/doi.org\/10.1016\/j.patcog.2014.09.005","journal-title":"Pattern Recognit."},{"key":"2889_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107377","volume":"106","author":"C Min","year":"2020","unstructured":"Min, C., Gu, Y., Li, Y., Yang, F.: Non-rigid infrared and visible image registration by enhanced affine transformation. Pattern Recognit. 106, 107377 (2020). https:\/\/doi.org\/10.1016\/j.patcog.2020.107377","journal-title":"Pattern Recognit."},{"key":"2889_CR39","doi-asserted-by":"publisher","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-net: Convolutional networks for biomedical image segmentation. In: Navab, N., Hornegger, J., III, W.M.W., Frangi, A.F. (eds.) Medical Image Computing and Computer-Assisted Intervention\u2014MICCAI 2015\u201418th International Conference Munich, Germany, October 5\u20139, 2015, Proceedings, Part III. Lecture Notes in Computer Science, vol. 9351, pp. 234\u2013241. Springer (2015). https:\/\/doi.org\/10.1007\/978-3-319-24574-4_28","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"2889_CR40","doi-asserted-by":"publisher","unstructured":"Sarlin, P., DeTone, D., Malisiewicz, T., Rabinovich, A.: Superglue: learning feature matching with graph neural networks. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2020, Seattle, WA, USA, June 13\u201319, 2020, pp. 4937\u20134946. Computer Vision Foundation\/IEEE (2020). https:\/\/doi.org\/10.1109\/CVPR42600.2020.00499. https:\/\/openaccess.thecvf.com\/content_CVPR_2020\/html\/Sarlin_SuperGlue_Learning_Feature_Matching_With_Graph_Neural_Networks_CVPR_2020_paper.html","DOI":"10.1109\/CVPR42600.2020.00499"},{"key":"2889_CR41","doi-asserted-by":"publisher","unstructured":"Yu, W., Luo, M., Zhou, P., Si, C., Zhou, Y., Wang, X., Feng, J., Yan, S.: Metaformer is actually what you need for vision. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2022, New Orleans, LA, USA, June 18\u201324, 2022, pp. 10809\u201310819. IEEE (2022). https:\/\/doi.org\/10.1109\/CVPR52688.2022.01055","DOI":"10.1109\/CVPR52688.2022.01055"},{"key":"2889_CR42","unstructured":"Tyszkiewicz, M.J., Fua, P., Trulls, E.: DISK: learning local features with policy gradient. In: Larochelle, H., Ranzato, M., Hadsell, R., Balcan, M., Lin, H. (eds.) Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6\u201312, 2020, Virtual (2020). https:\/\/proceedings.neurips.cc\/paper\/2020\/hash\/a42a596fc71e17828440030074d15e74-Abstract.html"},{"key":"2889_CR43","unstructured":"Rocco, I., Cimpoi, M., Arandjelovic, R., Torii, A., Pajdla, T., Sivic, J.: Neighbourhood consensus networks. In: Bengio, S., Wallach, H.M., Larochelle, H., Grauman, K., Cesa-Bianchi, N., Garnett, R. (eds.) Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3\u20138, 2018, Montr\u00e9al, Canada, pp. 1658\u20131669 (2018). https:\/\/proceedings.neurips.cc\/paper\/2018\/hash\/8f7d807e1f53eff5f9efbe5cb81090fb-Abstract.html"},{"key":"2889_CR44","doi-asserted-by":"publisher","unstructured":"Wang, Q., Zhou, X., Hariharan, B., Snavely, N.: Learning feature descriptors using camera pose supervision. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J. (eds.) Computer Vision\u2014ECCV 2020\u201416th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part I. Lecture Notes in Computer Science, vol. 12346, pp. 757\u2013774. Springer (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_44","DOI":"10.1007\/978-3-030-58452-8_44"},{"key":"2889_CR45","doi-asserted-by":"crossref","unstructured":"Schmitt, M., Hughes, L.H., Zhu, X.X.: The SEN1-2 dataset for deep learning in SAR-optical data fusion. CoRR abs\/1807.01569 (2018). arXiv:1807.01569","DOI":"10.5194\/isprs-annals-IV-1-141-2018"},{"key":"2889_CR46","unstructured":"Schmitt, M., Wu, Y.: Remote sensing image classification with the SEN12MS dataset. CoRR abs\/2104.00704 (2021). arXiv:2104.00704"},{"key":"2889_CR47","doi-asserted-by":"publisher","unstructured":"Brown, M.A., S\u00fcsstrunk, S.: Multi-spectral SIFT for scene category recognition. In: The 24th IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2011, Colorado Springs, CO, USA, 20\u201325 June 2011, pp. 177\u2013184. IEEE Computer Society (2011). https:\/\/doi.org\/10.1109\/CVPR.2011.5995637","DOI":"10.1109\/CVPR.2011.5995637"},{"key":"2889_CR48","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TGRS.2022.3165940","volume":"60","author":"J Li","year":"2022","unstructured":"Li, J., Xu, W., Shi, P., Zhang, Y., Hu, Q.: LNIFT: locally normalized image for rotation invariant multimodal feature matching. IEEE Trans. Geosci. Remote. Sens. 60, 1\u201314 (2022). https:\/\/doi.org\/10.1109\/TGRS.2022.3165940","journal-title":"IEEE Trans. Geosci. Remote. Sens."},{"key":"2889_CR49","doi-asserted-by":"publisher","unstructured":"Dusmanu, M., Rocco, I., Pajdla, T., Pollefeys, M., Sivic, J., Torii, A., Sattler, T.: D2-net: a trainable CNN for joint description and detection of local features. In: IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2019, Long Beach, CA, USA, June 16\u201320, 2019, pp. 8092\u20138101. Computer Vision Foundation\/IEEE (2019). https:\/\/doi.org\/10.1109\/CVPR.2019.00828. http:\/\/openaccess.thecvf.com\/content_CVPR_2019\/html\/Dusmanu_D2-Net_A_Trainable_CNN_for_Joint_Description_and_Detection_of_CVPR_2019_paper.html","DOI":"10.1109\/CVPR.2019.00828"},{"issue":"10","key":"2889_CR50","doi-asserted-by":"publisher","first-page":"1615","DOI":"10.1109\/TPAMI.2005.188","volume":"27","author":"K Mikolajczyk","year":"2005","unstructured":"Mikolajczyk, K., Schmid, C.: A performance evaluation of local descriptors. IEEE Trans. Pattern Anal. Mach. Intell. 27(10), 1615\u20131630 (2005). https:\/\/doi.org\/10.1109\/TPAMI.2005.188","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2889_CR51","doi-asserted-by":"publisher","unstructured":"Zhou, Q., Sattler, T., Leal-Taix\u00e9, L.: Patch2pix: epipolar-guided pixel-level correspondences. In: IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2021, Virtual, June 19\u201325, 2021, pp. 4669\u20134678. Computer Vision Foundation\/IEEE (2021). https:\/\/doi.org\/10.1109\/CVPR46437.2021.00464. https:\/\/openaccess.thecvf.com\/content\/CVPR2021\/html\/Zhou_Patch2Pix_Epipolar-Guided_Pixel-Level_Correspondences_CVPR_2021_paper.html","DOI":"10.1109\/CVPR46437.2021.00464"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-02889-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-023-02889-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-02889-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,19]],"date-time":"2024-02-19T08:11:32Z","timestamp":1708330292000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-023-02889-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,24]]},"references-count":51,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,3]]}},"alternative-id":["2889"],"URL":"https:\/\/doi.org\/10.1007\/s00371-023-02889-9","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,5,24]]},"assertion":[{"value":"28 April 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 May 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflicts of interests or competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}