{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T12:02:02Z","timestamp":1777982522064,"version":"3.51.4"},"reference-count":41,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T00:00:00Z","timestamp":1775001600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Ningxia Natural Science Foundation Project","award":["2025AAC030196"],"award-info":[{"award-number":["2025AAC030196"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1007\/s00371-026-04463-5","type":"journal-article","created":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T16:38:15Z","timestamp":1775666295000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["AdverFuse: robust fusion of multimodal images based on dynamic attention and adversarial learning"],"prefix":"10.1007","volume":"42","author":[{"given":"Fangyan","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fan","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yingbing","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fei","family":"Ma","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chunsheng","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,4,8]]},"reference":[{"key":"4463_CR1","doi-asserted-by":"crossref","unstructured":"Zhang Y, Wang X, Meng F, et al. Knowledge-driven subspace fusion and gradient coordination for multi-modal learning. In: International Conference on Medical Image Computing and Computer-Assisted Intervention. Cham: Springer Nature Switzerland, 2024: 263\u2013273.","DOI":"10.1007\/978-3-031-72083-3_25"},{"issue":"8","key":"4463_CR2","doi-asserted-by":"publisher","first-page":"10535","DOI":"10.1109\/TPAMI.2023.3261282","volume":"45","author":"X Zhang","year":"2023","unstructured":"Zhang, X., Demiris, Y.: Visible and infrared image fusion using deep learning. IEEE Trans. Pattern Anal. Mach. Intell. 45(8), 10535\u201310554 (2023)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"4463_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2023.106959","volume":"160","author":"T Zhou","year":"2023","unstructured":"Zhou, T., Cheng, Q.R., Lu, H.L., et al.: Deep learning methods for medical image fusion: a review. Comput. Biol. Med. 160, 106959 (2023)","journal-title":"Comput. Biol. Med."},{"key":"4463_CR4","doi-asserted-by":"publisher","first-page":"5626","DOI":"10.1109\/TIP.2021.3087348","volume":"30","author":"Z Yu","year":"2021","unstructured":"Yu, Z., Zhou, B., Wan, J., et al.: Searching multi-rate and multi-modal temporal enhanced networks for gesture recognition. IEEE Trans. Image Process. 30, 5626\u20135640 (2021)","journal-title":"IEEE Trans. Image Process."},{"key":"4463_CR5","doi-asserted-by":"crossref","unstructured":"Ye Q, Yu Z, Shao R, et al. Cat: Enhancing multimodal large language model to answer questions in dynamic audio-visual scenarios. In: European Conference on Computer Vision. Cham: Springer Nature Switzerland, 2024: 146\u2013164.","DOI":"10.1007\/978-3-031-72684-2_9"},{"issue":"11","key":"4463_CR6","doi-asserted-by":"publisher","first-page":"5217","DOI":"10.1007\/s11263-024-02055-1","volume":"132","author":"Z Yu","year":"2024","unstructured":"Yu, Z., Cai, R., Cui, Y., et al.: Rethinking vision transformer and masked autoencoder in multimodal face anti-spoofing. Int. J. Comput. Vis. 132(11), 5217\u20135238 (2024)","journal-title":"Int. J. Comput. Vis."},{"key":"4463_CR7","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2025.111991","volume":"169","author":"J Cui","year":"2026","unstructured":"Cui, J., Li, Y., Shen, D., et al.: MGCM: multi-modal graph convolutional mamba for cancer survival prediction. Pattern Recognit. 169, 111991 (2026)","journal-title":"Pattern Recognit."},{"key":"4463_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2024.102381","volume":"108","author":"T Zhang","year":"2024","unstructured":"Zhang, T., Tan, T., Han, L., et al.: IMPORTANT-Net: integrated MRI multiparametric increment fusion generator with attention network for synthesizing absent data. Inf. Fusion 108, 102381 (2024)","journal-title":"Inf. Fusion"},{"issue":"7","key":"4463_CR9","doi-asserted-by":"publisher","first-page":"1200","DOI":"10.1109\/JAS.2022.105686","volume":"9","author":"J Ma","year":"2022","unstructured":"Ma, J., Tang, L., Fan, F., et al.: SwinFusion: cross-domain long-range learning for general image fusion via Swin Transformer. IEEE\/CAA J. Autom. Sin. 9(7), 1200\u20131217 (2022)","journal-title":"IEEE\/CAA J. Autom. Sin."},{"key":"4463_CR10","doi-asserted-by":"publisher","first-page":"477","DOI":"10.1016\/j.inffus.2022.10.034","volume":"91","author":"L Tang","year":"2023","unstructured":"Tang, L., Xiang, X., Zhang, H., et al.: DIVFusion: darkness-free infrared and visible image fusion. Inf. Fusion 91, 477\u2013493 (2023)","journal-title":"Inf. Fusion"},{"issue":"12","key":"4463_CR11","doi-asserted-by":"publisher","first-page":"9645","DOI":"10.1109\/TIM.2020.3005230","volume":"69","author":"H Li","year":"2020","unstructured":"Li, H., Wu, X.J., Durrani, T.: NestFuse: an infrared and visible image fusion architecture based on nest connection and spatial\/channel attention models. IEEE Trans. Instrum. Meas. 69(12), 9645\u20139656 (2020)","journal-title":"IEEE Trans. Instrum. Meas."},{"issue":"7","key":"4463_CR12","doi-asserted-by":"publisher","first-page":"2029","DOI":"10.1007\/s00521-018-3441-1","volume":"30","author":"H Hermessi","year":"2018","unstructured":"Hermessi, H., Mourali, O., Zagrouba, E.: Convolutional neural network-based multimodal image fusion via similarity learning in the shearlet domain. Neural Comput. Appl. 30(7), 2029\u20132045 (2018)","journal-title":"Neural Comput. Appl."},{"key":"4463_CR13","doi-asserted-by":"crossref","unstructured":"Zhao Z, Bai H, Zhang J, et al. Cddfuse: Correlation-driven dual-branch feature decomposition for multi-modality image fusion. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2023: 5906\u20135916.","DOI":"10.1109\/CVPR52729.2023.00572"},{"key":"4463_CR14","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/LGRS.2023.3339214","volume":"21","author":"J Nie","year":"2023","unstructured":"Nie, J., Sun, H., Sun, X., et al.: Cross-modal feature fusion and interaction strategy for CNN-transformer-based object detection in visual and infrared remote sensing imagery. IEEE Geosci. Remote Sens. Lett. 21, 1\u20135 (2023)","journal-title":"IEEE Geosci. Remote Sens. Lett."},{"key":"4463_CR15","unstructured":"Gu A, Dao T. Mamba: Linear-time sequence modeling with selective state spaces. In: First conference on language modeling. 2024."},{"issue":"9","key":"4463_CR16","doi-asserted-by":"publisher","first-page":"9796","DOI":"10.1109\/JSEN.2023.3263336","volume":"23","author":"J Zhang","year":"2023","unstructured":"Zhang, J., Liu, Y., Liu, A., et al.: Multimodal image fusion via self-supervised transformer. IEEE Sens. J. 23(9), 9796\u20139807 (2023)","journal-title":"IEEE Sens. J."},{"key":"4463_CR17","doi-asserted-by":"crossref","unstructured":"Vs V, Valanarasu J M J, Oza P, et al. Image fusion transformer. In: 2022 IEEE International conference on image processing (ICIP). IEEE, 2022: 3566\u20133570.","DOI":"10.1109\/ICIP46576.2022.9897280"},{"key":"4463_CR18","first-page":"1","volume":"72","author":"X Xie","year":"2023","unstructured":"Xie, X., Zhang, X., Ye, S., et al.: Mrscfusion: joint residual Swin transformer and multiscale CNN for unsupervised multimodal medical image fusion. IEEE Trans. Instrum. Meas. 72, 1\u201317 (2023)","journal-title":"IEEE Trans. Instrum. Meas."},{"key":"4463_CR19","doi-asserted-by":"crossref","unstructured":"Pei X, Huang T, Xu C. Efficientvmamba: Atrous selective scan for light weight visual mamba. In: Proceedings of the AAAI Conference on Artificial Intelligence. 2025, 39(6): 6443\u20136451.","DOI":"10.1609\/aaai.v39i6.32690"},{"key":"4463_CR20","doi-asserted-by":"crossref","unstructured":"Woo S, Park J, Lee J Y, et al. Proceedings of the European conference on computer vision (ECCV). In: Proceedings of the European conference on computer vision (ECCV). 2018, 3(5): 8.","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"4463_CR21","unstructured":"Mardani M, Gong E, Cheng J Y, et al. Deep generative adversarial networks for compressed sensing automates MRI. arXiv preprint arXiv:1706.00051, 2017."},{"key":"4463_CR22","doi-asserted-by":"crossref","unstructured":"Ram Prabhakar K, Sai Srikar V, Venkatesh Babu R. Deepfuse: A deep unsupervised approach for exposure fusion with extreme exposure image pairs. In: Proceedings of the IEEE international conference on computer vision. 2017: 4714\u20134722.","DOI":"10.1109\/ICCV.2017.505"},{"key":"4463_CR23","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1016\/j.inffus.2021.06.008","volume":"76","author":"H Zhang","year":"2021","unstructured":"Zhang, H., Xu, H., Tian, X., et al.: Image fusion meets deep learning: a survey and perspective. Inf. Fusion 76, 323\u2013336 (2021)","journal-title":"Inf. Fusion"},{"issue":"5","key":"4463_CR24","first-page":"63","volume":"19","author":"C Wang","year":"2024","unstructured":"Wang, C., Zhu, Y.: Ship crack detection method based on light-weight fast convolution and bidirectional weighted feature fusion network. Chin. J. Ship Res. 19(5), 63 (2024)","journal-title":"Chin. J. Ship Res."},{"issue":"5","key":"4463_CR25","doi-asserted-by":"publisher","first-page":"1748","DOI":"10.1007\/s11263-023-01952-1","volume":"132","author":"J Liu","year":"2024","unstructured":"Liu, J., Lin, R., Wu, G., et al.: Coconet: Coupled contrastive learning network with multi-level feature ensemble for multi-modality image fusion. Int. J. Comput. Vision 132(5), 1748\u20131775 (2024)","journal-title":"Int. J. Comput. Vision"},{"key":"4463_CR26","first-page":"96","volume":"5","author":"Z Wang","year":"2024","unstructured":"Wang, Z., Liao, X., Yuan, J., et al.: Cdc-yolofusion: Leveraging cross-scale dynamic convolution fusion for visible-infrared object detection. IEEE Trans. Intell. Veh. 5, 96 (2024)","journal-title":"IEEE Trans. Intell. Veh."},{"key":"4463_CR27","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1016\/j.inffus.2022.03.007","volume":"83","author":"L Tang","year":"2022","unstructured":"Tang, L., Yuan, J., Zhang, H., et al.: PIAFusion: a progressive infrared and visible image fusion network based on illumination aware. Inf. Fusion 83, 79\u201392 (2022)","journal-title":"Inf. Fusion"},{"key":"4463_CR28","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1016\/j.inffus.2021.12.004","volume":"82","author":"L Tang","year":"2022","unstructured":"Tang, L., Yuan, J., Ma, J.: Image fusion in the loop of high-level vision tasks: a semantic-aware real-time infrared and visible image fusion network. Inf. Fusion 82, 28\u201342 (2022)","journal-title":"Inf. Fusion"},{"key":"4463_CR29","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.inffus.2018.09.004","volume":"48","author":"J Ma","year":"2019","unstructured":"Ma, J., Yu, W., Liang, P., et al.: FusionGAN: a generative adversarial network for infrared and visible image fusion. Inf. Fusion 48, 11\u201326 (2019)","journal-title":"Inf. Fusion"},{"key":"4463_CR30","doi-asserted-by":"crossref","unstructured":"Bai H, Zhang J, Zhao Z, et al. Task-driven Image Fusion with Learnable Fusion Loss. In: Proceedings of the Computer Vision and Pattern Recognition Conference. 2025: 7457\u20137468.","DOI":"10.1109\/CVPR52734.2025.00699"},{"issue":"1","key":"4463_CR31","first-page":"65","volume":"46","author":"Y Lin","year":"2025","unstructured":"Lin, Y., Li, M., Li, Y., et al.: Multimodal medical image fusion based on GAN and multi-scale spatial attention. J. Zhengzhou Univ. Eng. Sci. 46(1), 65 (2025)","journal-title":"J. Zhengzhou Univ. Eng. Sci."},{"key":"4463_CR32","first-page":"790","volume":"13407","author":"A Kumar","year":"2025","unstructured":"Kumar, A., Kanthen, K.R., John, J.: GS-TransUNet: integrated 2D Gaussian splatting and transformer UNet for accurate skin lesion analysis. Medical Imaging 2025: Computer-Aided Diagnosis. SPIE 13407, 790\u2013800 (2025)","journal-title":"SPIE"},{"key":"4463_CR33","doi-asserted-by":"crossref","unstructured":"Qu L, Liu S, Wang M, et al. Transmef: A transformer-based multi-exposure image fusion framework using self-supervised multi-task learning. In: Proceedings of the AAAI conference on artificial intelligence. 2022, 36(2): 2126\u20132134.","DOI":"10.1609\/aaai.v36i2.20109"},{"issue":"1","key":"4463_CR34","doi-asserted-by":"publisher","first-page":"325","DOI":"10.1109\/TAES.2024.3443014","volume":"61","author":"L Kong","year":"2024","unstructured":"Kong, L., Gao, F., He, X., et al.: Few-shot class-incremental SAR target recognition via orthogonal distributed features. IEEE Trans. Aerosp. Electron. Syst. 61(1), 325\u2013341 (2024)","journal-title":"IEEE Trans. Aerosp. Electron. Syst."},{"key":"4463_CR35","doi-asserted-by":"crossref","unstructured":"Zhong F, Gao F, Liu T, et al. Scattering characteristics guided network for isar space target component segmentation[J]. IEEE Geoscience and Remote Sensing Letters, 2025.","DOI":"10.1109\/LGRS.2025.3576662"},{"key":"4463_CR36","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2025.3558801","author":"N Xie","year":"2025","unstructured":"Xie, N., Zhang, T., Zhang, L., et al.: VLF-SAR: a novel vision-language framework for few-shot SAR target recognition. IEEE Trans. Circuits Syst. Video Technol. (2025). https:\/\/doi.org\/10.1109\/TCSVT.2025.3558801","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"4463_CR37","first-page":"1","volume":"21","author":"J Deng","year":"2024","unstructured":"Deng, J., Wang, W., Zhang, H., et al.: PolSAR ship detection based on superpixel-level contrast enhancement. IEEE Geosci. Remote Sens. Lett. 21, 1\u20135 (2024)","journal-title":"IEEE Geosci. Remote Sens. Lett."},{"issue":"1","key":"4463_CR38","doi-asserted-by":"publisher","DOI":"10.1007\/s44267-024-00072-9","volume":"2","author":"X Xie","year":"2024","unstructured":"Xie, X., Cui, Y., Tan, T., et al.: Fusionmamba: dynamic feature enhancement for multimodal image fusion with Mamba. Vis. Intell. 2(1), 37 (2024)","journal-title":"Vis. Intell."},{"key":"4463_CR39","doi-asserted-by":"crossref","unstructured":"Kalman R E. A new approach to linear filtering and prediction problems. 1960.","DOI":"10.1115\/1.3662552"},{"key":"4463_CR40","doi-asserted-by":"crossref","unstructured":"Wang Q, Wu B, Zhu P, et al. ECA-Net: Efficient channel attention for deep convolutional neural networks. In: Proceedings of the IEEE\/CVF conference oncomputer vision and pattern recognition. 2020: 11534\u201311542.","DOI":"10.1109\/CVPR42600.2020.01155"},{"issue":"5","key":"4463_CR41","doi-asserted-by":"publisher","first-page":"1702","DOI":"10.1109\/TMI.2023.3347511","volume":"43","author":"Y Zhong","year":"2023","unstructured":"Zhong, Y., Zhang, S., Liu, Z., et al.: Unsupervised fusion of misaligned PAT and MRI images via mutually reinforcing cross-modality image generation and registration. IEEE Trans. Med. Imaging 43(5), 1702\u20131714 (2023)","journal-title":"IEEE Trans. Med. Imaging"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-026-04463-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-026-04463-5","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-026-04463-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T13:16:00Z","timestamp":1777468560000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-026-04463-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4]]},"references-count":41,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2026,4]]}},"alternative-id":["4463"],"URL":"https:\/\/doi.org\/10.1007\/s00371-026-04463-5","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-8381183\/v1","asserted-by":"object"}]},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,4]]},"assertion":[{"value":"17 December 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 March 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 April 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interest"}},{"value":"Agreement to publish.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}}],"article-number":"244"}}