{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T00:24:55Z","timestamp":1777940695113,"version":"3.51.4"},"reference-count":70,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Journal of Visual Communication and Image Representation"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1016\/j.jvcir.2026.104821","type":"journal-article","created":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T06:54:33Z","timestamp":1776927273000},"page":"104821","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["A Mamba-based multi-modal and multi-view ophthalmologic image analysis framework for correspondence relationships and complementary information modeling"],"prefix":"10.1016","volume":"118","author":[{"given":"Yonghao","family":"Huang","sequence":"first","affiliation":[]},{"given":"Leiting","family":"Chen","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7700-7188","authenticated-orcid":false,"given":"Chuan","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"Sen","family":"Yang","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"issue":"4","key":"10.1016\/j.jvcir.2026.104821_b1","doi-asserted-by":"crossref","first-page":"e489","DOI":"10.1016\/S2214-109X(20)30488-5","article-title":"The lancet global health commission on global eye health: vision beyond 2020","volume":"9","author":"Burton","year":"2021","journal-title":"Lancet Glob. Health"},{"key":"10.1016\/j.jvcir.2026.104821_b2","doi-asserted-by":"crossref","DOI":"10.1016\/j.patcog.2021.108104","article-title":"Mvdrnet: Multi-view diabetic retinopathy detection by combining dcnns and attention mechanisms","volume":"120","author":"Luo","year":"2021","journal-title":"Pattern Recognit."},{"issue":"5","key":"10.1016\/j.jvcir.2026.104821_b3","doi-asserted-by":"crossref","first-page":"1945","DOI":"10.1109\/TMI.2024.3352602","article-title":"Geometric correspondence-based multimodal learning for ophthalmic image analysis","volume":"43","author":"Wang","year":"2024","journal-title":"IEEE Trans. Med. Imaging"},{"key":"10.1016\/j.jvcir.2026.104821_b4","series-title":"Medical Image Computing and Computer Assisted Intervention\u2013MICCAI 2019: 22nd International Conference, Shenzhen, China, October 13\u201317, 2019, Proceedings, Part I 22","first-page":"156","article-title":"Two-stream CNN with loose pair training for multi-modal amd categorization","author":"Wang","year":"2019"},{"key":"10.1016\/j.jvcir.2026.104821_b5","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2024.102594","article-title":"A multi-modal and multi-stage fusion enhancement network for segmentation based on OCT and OCTA images","volume":"113","author":"Quan","year":"2025","journal-title":"Inf. Fusion"},{"key":"10.1016\/j.jvcir.2026.104821_b6","series-title":"2021 IEEE International Conference on Bioinformatics and Biomedicine","first-page":"945","article-title":"Automatic report generation based on multi-modal and multi-view model for fundus images","author":"Lan","year":"2021"},{"key":"10.1016\/j.jvcir.2026.104821_b7","doi-asserted-by":"crossref","DOI":"10.1016\/j.knosys.2023.110544","article-title":"Model long-range dependencies for multi-modality and multi-view retinopathy diagnosis through transformers","volume":"271","author":"Huang","year":"2023","journal-title":"Knowl.-Based Syst."},{"key":"10.1016\/j.jvcir.2026.104821_b8","series-title":"Cross-fundus transformer for multi-modal diabetic retinopathy grading with cataract","author":"Xiao","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b9","article-title":"Attention is all you need","volume":"30","author":"Vaswani","year":"2017","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.jvcir.2026.104821_b10","series-title":"An image is worth 16x16 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2020"},{"key":"10.1016\/j.jvcir.2026.104821_b11","series-title":"Mamba: Linear-time sequence modeling with selective state spaces","author":"Gu","year":"2023"},{"key":"10.1016\/j.jvcir.2026.104821_b12","series-title":"A comprehensive survey of mamba architectures for medical image analysis: Classification, segmentation, restoration and beyond","author":"Bansal","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b13","series-title":"Long range language modeling via gated state spaces","author":"Mehta","year":"2022"},{"key":"10.1016\/j.jvcir.2026.104821_b14","doi-asserted-by":"crossref","unstructured":"J. Wang, W. Zhu, P. Wang, X. Yu, L. Liu, M. Omar, R. Hamid, Selective structured state-spaces for long-form video understanding, in: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2023, pp. 6387\u20136397.","DOI":"10.1109\/CVPR52729.2023.00618"},{"key":"10.1016\/j.jvcir.2026.104821_b15","first-page":"103031","article-title":"Vmamba: Visual state space model","volume":"37","author":"Liu","year":"2024","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.jvcir.2026.104821_b16","series-title":"Plainmamba: Improving non-hierarchical mamba in visual recognition","author":"Yang","year":"2024"},{"issue":"1","key":"10.1016\/j.jvcir.2026.104821_b17","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1007\/s44267-024-00072-9","article-title":"Fusionmamba: Dynamic feature enhancement for multimodal image fusion with mamba","volume":"2","author":"Xie","year":"2024","journal-title":"Vis. Intell."},{"key":"10.1016\/j.jvcir.2026.104821_b18","series-title":"MGI: Multimodal contrastive pre-training of genomic and medical imaging","author":"Zhou","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b19","series-title":"Medmamba: Vision mamba for medical image classification","author":"Yue","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b20","series-title":"Nnmamba: 3d biomedical image segmentation, classification and landmark detection with state space model","author":"Gong","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b21","series-title":"International Conference on Medical Image Computing and Computer-Assisted Intervention","first-page":"578","article-title":"Segmamba: Long-range sequential modeling mamba for 3d medical image segmentation","author":"Xing","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b22","article-title":"H-vmunet: High-order vision mamba unet for medical image segmentation","author":"Wu","year":"2025","journal-title":"Neurocomputing"},{"key":"10.1016\/j.jvcir.2026.104821_b23","series-title":"Mambamir: An arbitrary-masked mamba for joint medical image reconstruction and uncertainty estimation","author":"Huang","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b24","series-title":"Fd-vision mamba for endoscopic exposure correction","author":"Zheng","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b25","series-title":"Vision mamba: Efficient visual representation learning with bidirectional state space model","author":"Liang","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b26","article-title":"A review of deep learning-based information fusion techniques for multimodal medical image classification","author":"Li","year":"2024","journal-title":"Comput. Biol. Med."},{"key":"10.1016\/j.jvcir.2026.104821_b27","article-title":"A review: Deep learning for medical image segmentation using multi-modality fusion","volume":"3","author":"Zhou","year":"2019","journal-title":"Array"},{"key":"10.1016\/j.jvcir.2026.104821_b28","doi-asserted-by":"crossref","DOI":"10.1109\/TMI.2024.3398728","article-title":"Unetr++: delving into efficient and accurate 3D medical image segmentation","author":"Shaker","year":"2024","journal-title":"IEEE Trans. Med. Imaging"},{"key":"10.1016\/j.jvcir.2026.104821_b29","doi-asserted-by":"crossref","first-page":"4036","DOI":"10.1109\/TIP.2023.3293771","article-title":"Nnformer: volumetric medical image segmentation via a 3D transformer","volume":"32","author":"Zhou","year":"2023","journal-title":"IEEE Trans. Image Process."},{"key":"10.1016\/j.jvcir.2026.104821_b30","article-title":"Deep learning-based classification of healthy aging controls, mild cognitive impairment and alzheimer\u2019s disease using fusion of MRI-pet imaging","volume":"80","author":"Rallabandi","year":"2023","journal-title":"Biomed. Signal Process. Control."},{"key":"10.1016\/j.jvcir.2026.104821_b31","article-title":"Computer-aided diagnosis of breast ultrasound images using ensemble learning from convolutional neural networks","volume":"190","author":"Moon","year":"2020","journal-title":"Comput. Methods Programs Biomed."},{"issue":"1","key":"10.1016\/j.jvcir.2026.104821_b32","doi-asserted-by":"crossref","first-page":"3404","DOI":"10.1038\/s41467-022-31037-5","article-title":"Multimodal deep learning for alzheimer\u2019s disease dementia assessment","volume":"13","author":"Qiu","year":"2022","journal-title":"Nat. Commun."},{"key":"10.1016\/j.jvcir.2026.104821_b33","article-title":"Diagnosis of early glottic cancer using laryngeal image and voice based on ensemble learning of convolutional neural network classifiers","author":"Kwon","year":"2022","journal-title":"J. Voice"},{"issue":"1","key":"10.1016\/j.jvcir.2026.104821_b34","doi-asserted-by":"crossref","first-page":"2","DOI":"10.1186\/s40708-023-00217-4","article-title":"Deep learning based joint fusion approach to exploit anatomical and functional brain information in autism spectrum disorders","volume":"11","author":"Saponaro","year":"2024","journal-title":"Brain Informatics"},{"key":"10.1016\/j.jvcir.2026.104821_b35","doi-asserted-by":"crossref","DOI":"10.1016\/j.dsp.2023.104229","article-title":"Efficient multimodel method based on transformers and CoAtNet for alzheimer\u2019s diagnosis","volume":"143","author":"Kadri","year":"2023","journal-title":"Digit. Signal Process."},{"issue":"2","key":"10.1016\/j.jvcir.2026.104821_b36","doi-asserted-by":"crossref","first-page":"171","DOI":"10.1016\/j.ophtha.2021.07.032","article-title":"Multimodal machine learning using visual fields and peripapillary circular OCT scans in detection of glaucomatous optic neuropathy","volume":"129","author":"Xiong","year":"2022","journal-title":"Ophthalmology"},{"issue":"1","key":"10.1016\/j.jvcir.2026.104821_b37","doi-asserted-by":"crossref","DOI":"10.1002\/ima.22970","article-title":"MMTFN: Multi-modal multi-scale transformer fusion network for alzheimer\u2019s disease diagnosis","volume":"34","author":"Miao","year":"2024","journal-title":"Int. J. Imaging Syst. Technol."},{"key":"10.1016\/j.jvcir.2026.104821_b38","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2023.121574","article-title":"TranSiam: Aggregating multi-modal visual features with locality for medical image segmentation","volume":"237","author":"Li","year":"2024","journal-title":"Expert Syst. Appl."},{"issue":"17","key":"10.1016\/j.jvcir.2026.104821_b39","doi-asserted-by":"crossref","DOI":"10.1002\/hbm.26783","article-title":"A multimodal vision transformer for interpretable fusion of functional and structural neuroimaging data","volume":"45","author":"Bi","year":"2024","journal-title":"Hum. Brain Mapp."},{"issue":"1","key":"10.1016\/j.jvcir.2026.104821_b40","doi-asserted-by":"crossref","first-page":"112","DOI":"10.1186\/s12880-024-01296-3","article-title":"A multi-view fusion lightweight network for crswnps prediction on ct images","volume":"24","author":"Zou","year":"2024","journal-title":"BMC Med. Imaging"},{"key":"10.1016\/j.jvcir.2026.104821_b41","article-title":"A lesion-fusion neural network for multi-view diabetic retinopathy grading","author":"Luo","year":"2024","journal-title":"IEEE J. Biomed. Health Inform."},{"issue":"14","key":"10.1016\/j.jvcir.2026.104821_b42","doi-asserted-by":"crossref","first-page":"1566","DOI":"10.3390\/diagnostics14141566","article-title":"MV-MFF: Multi-view multi-feature fusion model for pneumonia classification","volume":"14","author":"Alsulami","year":"2024","journal-title":"Diagnostics"},{"key":"10.1016\/j.jvcir.2026.104821_b43","doi-asserted-by":"crossref","unstructured":"D. Kim, Chexfusion: Effective fusion of multi-view features using transformers for long-tailed chest x-ray classification, in: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 2023, pp. 2702\u20132710.","DOI":"10.1109\/ICCVW60793.2023.00285"},{"key":"10.1016\/j.jvcir.2026.104821_b44","first-page":"572","article-title":"Combining recurrent, convolutional, and continuous-time models with linear state space layers","volume":"34","author":"Gu","year":"2021","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.jvcir.2026.104821_b45","series-title":"Efficiently modeling long sequences with structured state spaces","author":"Gu","year":"2021"},{"key":"10.1016\/j.jvcir.2026.104821_b46","series-title":"Simplified state space layers for sequence modeling","author":"Smith","year":"2022"},{"issue":"4","key":"10.1016\/j.jvcir.2026.104821_b47","doi-asserted-by":"crossref","first-page":"1445","DOI":"10.1109\/TPAMI.2020.2975798","article-title":"Deep multi-view enhancement hashing for image retrieval","volume":"43","author":"Yan","year":"2020","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"4","key":"10.1016\/j.jvcir.2026.104821_b48","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3404374","article-title":"Depth image denoising using nuclear norm and learning graph model","volume":"16","author":"Yan","year":"2020","journal-title":"ACM Trans. Multimed. Comput. Commun. Appl. (TOMM)"},{"issue":"1","key":"10.1016\/j.jvcir.2026.104821_b49","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1109\/TCSVT.2021.3067449","article-title":"Task-adaptive attention for image captioning","volume":"32","author":"Yan","year":"2021","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"issue":"3s","key":"10.1016\/j.jvcir.2026.104821_b50","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3468872","article-title":"Precise no-reference image quality evaluation based on distortion identification","volume":"17","author":"Yan","year":"2021","journal-title":"ACM Trans. Multimed. Comput. Commun. Appl. (TOMM)"},{"issue":"1s","key":"10.1016\/j.jvcir.2026.104821_b51","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3472810","article-title":"Age-invariant face recognition by multi-feature fusionand decomposition with self-attention","volume":"18","author":"Yan","year":"2022","journal-title":"ACM Trans. Multimed. Comput. Commun. Appl. (TOMM)"},{"issue":"6","key":"10.1016\/j.jvcir.2026.104821_b52","first-page":"1111","article-title":"Review of omnimedia content quality evaluation","volume":"38","author":"Yan","year":"2022","journal-title":"J. Signal Process."},{"key":"10.1016\/j.jvcir.2026.104821_b53","doi-asserted-by":"crossref","unstructured":"Z. Zhang, L. Li, G. Cong, H. Yin, Y. Gao, C. Yan, A.v.d. Hengel, Y. Qi, From speaker to dubber: movie dubbing with prosody and duration consistency learning, in: Proceedings of the 32nd ACM International Conference on Multimedia, 2024, pp. 7523\u20137532.","DOI":"10.1145\/3664647.3680777"},{"key":"10.1016\/j.jvcir.2026.104821_b54","series-title":"International Conference on Medical Image Computing and Computer-Assisted Intervention","first-page":"134","article-title":"Cardiovascular disease detection from multi-view chest X-rays with BI-mamba","author":"Yang","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b55","doi-asserted-by":"crossref","unstructured":"S. Woo, J. Park, J.-Y. Lee, I.S. Kweon, Cbam: Convolutional block attention module, in: Proceedings of the European Conference on Computer Vision, ECCV, 2018, pp. 3\u201319.","DOI":"10.1007\/978-3-030-01234-2_1"},{"issue":"8","key":"10.1016\/j.jvcir.2026.104821_b56","doi-asserted-by":"crossref","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","article-title":"Long short-term memory","volume":"9","author":"Hochreiter","year":"1997","journal-title":"Neural Comput."},{"key":"10.1016\/j.jvcir.2026.104821_b57","series-title":"On the automatic generation of medical imaging reports","author":"Jing","year":"2017"},{"key":"10.1016\/j.jvcir.2026.104821_b58","series-title":"Adam: a method for stochastic optimization","author":"Kingma","year":"2014"},{"issue":"8","key":"10.1016\/j.jvcir.2026.104821_b59","doi-asserted-by":"crossref","first-page":"1384","DOI":"10.3390\/diagnostics11081384","article-title":"Transmed: Transformers advance multi-modal medical image classification","volume":"11","author":"Dai","year":"2021","journal-title":"Diagnostics"},{"key":"10.1016\/j.jvcir.2026.104821_b60","doi-asserted-by":"crossref","unstructured":"K. Papineni, S. Roukos, T. Ward, W.-J. Zhu, Bleu: a method for automatic evaluation of machine translation, in: Proceedings of the 40th Annual Meeting of the Association for Computational Linguistics, 2002, pp. 311\u2013318.","DOI":"10.3115\/1073083.1073135"},{"key":"10.1016\/j.jvcir.2026.104821_b61","unstructured":"C.-Y. Lin, Rouge: A package for automatic evaluation of summaries, in: Text Summarization Branches Out, 2004, pp. 74\u201381."},{"key":"10.1016\/j.jvcir.2026.104821_b62","doi-asserted-by":"crossref","unstructured":"M. Denkowski, A. Lavie, Meteor universal: Language specific translation evaluation for any target language, in: Proceedings of the Ninth Workshop on Statistical Machine Translation, 2014, pp. 376\u2013380.","DOI":"10.3115\/v1\/W14-3348"},{"key":"10.1016\/j.jvcir.2026.104821_b63","doi-asserted-by":"crossref","unstructured":"R. Vedantam, C. Lawrence Zitnick, D. Parikh, Cider: Consensus-based image description evaluation, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2015, pp. 4566\u20134575.","DOI":"10.1109\/CVPR.2015.7299087"},{"key":"10.1016\/j.jvcir.2026.104821_b64","series-title":"2009 IEEE Conference on Computer Vision and Pattern Recognition","first-page":"248","article-title":"Imagenet: A large-scale hierarchical image database","author":"Deng","year":"2009"},{"key":"10.1016\/j.jvcir.2026.104821_b65","doi-asserted-by":"crossref","unstructured":"K. He, X. Zhang, S. Ren, J. Sun, Deep residual learning for image recognition, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2016, pp. 770\u2013778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"10.1016\/j.jvcir.2026.104821_b66","series-title":"2024 IEEE International Symposium on Biomedical Imaging","first-page":"1","article-title":"Mv-swin-t: mammogram classification with multi-view swin transformer","author":"Sarker","year":"2024"},{"key":"10.1016\/j.jvcir.2026.104821_b67","doi-asserted-by":"crossref","unstructured":"S. Black, R. Souvenir, Multi-view classification using hybrid fusion and mutual distillation, in: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, 2024, pp. 270\u2013280.","DOI":"10.1109\/WACV57701.2024.00034"},{"key":"10.1016\/j.jvcir.2026.104821_b68","series-title":"Xfmamba: Cross-fusion mamba for multi-view medical image classification","author":"Zheng","year":"2025"},{"key":"10.1016\/j.jvcir.2026.104821_b69","doi-asserted-by":"crossref","unstructured":"X. Wang, Y. Peng, L. Lu, Z. Lu, R.M. Summers, Tienet: Text-image embedding network for common thorax disease classification and reporting in chest x-rays, in: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2018, pp. 9049\u20139058.","DOI":"10.1109\/CVPR.2018.00943"},{"key":"10.1016\/j.jvcir.2026.104821_b70","doi-asserted-by":"crossref","unstructured":"R.R. Selvaraju, M. Cogswell, A. Das, R. Vedantam, D. Parikh, D. Batra, Grad-cam: Visual explanations from deep networks via gradient-based localization, in: Proceedings of the IEEE International Conference on Computer Vision, 2017, pp. 618\u2013626.","DOI":"10.1109\/ICCV.2017.74"}],"container-title":["Journal of Visual Communication and Image Representation"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1047320326001161?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1047320326001161?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T05:57:51Z","timestamp":1777701471000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1047320326001161"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6]]},"references-count":70,"alternative-id":["S1047320326001161"],"URL":"https:\/\/doi.org\/10.1016\/j.jvcir.2026.104821","relation":{},"ISSN":["1047-3203"],"issn-type":[{"value":"1047-3203","type":"print"}],"subject":[],"published":{"date-parts":[[2026,6]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"A Mamba-based multi-modal and multi-view ophthalmologic image analysis framework for correspondence relationships and complementary information modeling","name":"articletitle","label":"Article Title"},{"value":"Journal of Visual Communication and Image Representation","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.jvcir.2026.104821","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Inc. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"104821"}}