{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,4]],"date-time":"2025-12-04T07:02:16Z","timestamp":1764831736281,"version":"3.46.0"},"reference-count":36,"publisher":"Tech Science Press","issue":"2","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["CMC"],"published-print":{"date-parts":[[2025]]},"DOI":"10.32604\/cmc.2025.066937","type":"journal-article","created":{"date-parts":[[2025,7,22]],"date-time":"2025-07-22T07:24:21Z","timestamp":1753169061000},"page":"2999-3022","source":"Crossref","is-referenced-by-count":0,"title":["An Overlapped Multihead Self-Attention-Based Feature Enhancement Approach for Ocular Disease Image Recognition"],"prefix":"10.32604","volume":"85","author":[{"given":"Peng","family":"Xiao","sequence":"first","affiliation":[]},{"given":"Haiyu","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Peng","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Zhiwei","family":"Guo","sequence":"additional","affiliation":[]},{"given":"Amr","family":"Tolba","sequence":"additional","affiliation":[]},{"given":"Osama","family":"Alfarraj","sequence":"additional","affiliation":[]}],"member":"17807","published-online":{"date-parts":[[2025]]},"reference":[{"key":"ref1","doi-asserted-by":"crossref","first-page":"221","DOI":"10.1146\/annurev-bioeng-071516-044442","article-title":"Deep learning in medical image analysis","volume":"19","author":"Shen","year":"2017","journal-title":"Annu Rev Biomed Eng"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"315","DOI":"10.1146\/annurev.bioeng.2.1.315","article-title":"Current methods in medical image segmentation","volume":"2","author":"Pham","year":"2000","journal-title":"Annu Rev Biomed Eng"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"137","DOI":"10.1007\/s10462-020-09854-1","article-title":"Deep semantic segmentation of natural and medical images: a review","volume":"54","author":"Asgari Taghanaki","year":"2021","journal-title":"Artif Intell Rev"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"185","DOI":"10.1007\/s10462-024-10806-2","article-title":"Deep learning model using classification for diabetic retinopathy detection: an overview","volume":"57","author":"Muthusamy","year":"2024","journal-title":"Artif Intell Rev"},{"key":"ref5","doi-asserted-by":"crossref","first-page":"154","DOI":"10.1016\/j.ajo.2021.04.021","article-title":"Automated detection of glaucoma with interpretable machine learning using clinical data and multimodal retinal images","volume":"231","author":"Mehta","year":"2021","journal-title":"Am J Ophthalmol"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"1049","DOI":"10.1007\/s00371-024-03383-6","article-title":"Deep learning-driven automated quality assessment of ultra-widefield optical coherence tomography angiography images for diabetic retinopathy","volume":"41","author":"Jin","year":"2025","journal-title":"Vis Comput"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"1045","DOI":"10.1001\/jamaophthalmol.2023.4650","article-title":"Deep learning performance of ultra-widefield fundus imaging for screening retinal lesions in rural locales","volume":"141","author":"Cui","year":"2023","journal-title":"JAMA Ophthalmol"},{"key":"ref8","first-page":"3523","article-title":"Image segmentation using deep learning: a survey","volume":"44","author":"Minaee","year":"2022","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"2263","DOI":"10.1007\/s10462-023-10577-2","article-title":"Attention-based graph neural networks: a survey","volume":"56","author":"Sun","year":"2023","journal-title":"Artif Intell Rev"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"106478","DOI":"10.1016\/j.bspc.2024.106478","article-title":"Adaptive spatial and frequency experts fusion network for medical image fusion","volume":"96","author":"Gu","year":"2024","journal-title":"Biomed Signal Process Control"},{"key":"ref11","doi-asserted-by":"crossref","first-page":"3699","DOI":"10.1364\/BOE.516764","article-title":"Cross-modal attention network for retinal disease classification based on multi-modal images","volume":"15","author":"Liu","year":"2024","journal-title":"Biomed Opt Express"},{"key":"ref12","doi-asserted-by":"crossref","first-page":"108057","DOI":"10.1016\/j.compbiomed.2024.108057","article-title":"MS-TCNet: an effective Transformer-CNN combined network using multi-scale feature learning for 3D medical image segmentation","volume":"170","author":"Ao","year":"2024","journal-title":"Comput Biol Med"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"60","DOI":"10.1016\/j.media.2017.07.005","article-title":"A survey on deep learning in medical image analysis","volume":"42","author":"Litjens","year":"2017","journal-title":"Med Image Anal"},{"article-title":"TransFusion: multi-view divergent fusion for medical image segmentation with transformers","series-title":"Proceedings of the Medical Image Computing and Computer Assisted Intervention\u2014MICCAI 2022; 2022 Sep 18\u201322","author":"Liu","key":"ref14"},{"article-title":"U-Net transformer: self and cross attention for medical image segmentation","series-title":"Proceedings of the Machine Learning in Medical Imaging; 2021 Sep 27","author":"Petit","key":"ref15"},{"key":"ref16","doi-asserted-by":"crossref","first-page":"2598","DOI":"10.1109\/TMI.2022.3167808","article-title":"ResViT: residual vision transformers for multimodal medical image synthesis","volume":"41","author":"Dalmaz","year":"2022","journal-title":"IEEE Trans Med Imag"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"106890","DOI":"10.1016\/j.knosys.2021.106890","article-title":"An effective multi-model fusion method for EEG-based sleep stage classification","volume":"219","author":"An","year":"2021","journal-title":"Knowl Based Syst"},{"key":"ref18","doi-asserted-by":"crossref","first-page":"210","DOI":"10.1016\/j.isatra.2019.11.023","article-title":"A feature selection and multi-model fusion-based approach of predicting air quality","volume":"100","author":"Zhang","year":"2020","journal-title":"ISA Trans"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"598","DOI":"10.1109\/TPDS.2022.3222765","article-title":"TFormer: a transmission-friendly ViT model for IoT devices","volume":"34","author":"Lu","year":"2023","journal-title":"IEEE Trans Parallel Distrib Syst"},{"key":"ref20","doi-asserted-by":"crossref","first-page":"7853","DOI":"10.1109\/TPAMI.2022.3223955","article-title":"TransVOD: end-to-end video object detection with spatial-temporal transformers","volume":"45","author":"Zhou","year":"2022","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref21","doi-asserted-by":"crossref","first-page":"109552","DOI":"10.1016\/j.knosys.2022.109552","article-title":"Vision transformers for dense prediction: a survey","volume":"253","author":"Zuo","year":"2022","journal-title":"Knowl Based Syst"},{"article-title":"BossNAS: exploring hybrid CNN-transformers with block-wisely self-supervised neural architecture search","series-title":"Proceedings of the 2021 IEEE\/CVF International Conference on Computer Vision (ICCV); 2021 Oct 10\u201317","author":"Li","key":"ref22"},{"article-title":"Incorporating convolution designs into visual transformers","series-title":"Proceedings of the 2021 IEEE\/CVF International Conference on Computer Vision (ICCV); 2021 Oct 10\u201317","author":"Yuan","key":"ref23"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"9454","DOI":"10.1109\/TPAMI.2023.3243048","article-title":"Conformer: local features coupling global representations for recognition and detection","volume":"45","author":"Peng","year":"2023","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"article-title":"Mobile-former: bridging MobileNet and transformer","series-title":"Proceedings of the 2022 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR); 2022 Jun 18\u201324","author":"Chen","key":"ref25"},{"article-title":"Medical transformer: gated axial-attention for medical image segmentation","series-title":"Proceedings of the Medical Image Computing and Computer Assisted Intervention\u2014MICCAI 2021; 2021 Sep 27\u2013Oct 1","author":"Valanarasu","key":"ref26"},{"key":"ref27","doi-asserted-by":"crossref","first-page":"2123","DOI":"10.1007\/s00371-024-03524-x","article-title":"Vision transformers (ViT) and deep convolutional neural network (D-CNN)-based models for MRI brain primary tumors images multi-classification supported by explainable artificial intelligence (XAI)","volume":"41","author":"Mzoughi","year":"2025","journal-title":"Vis Comput"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"203","DOI":"10.1038\/s41592-020-01008-z","article-title":"nnU-Net: a self-configuring method for deep learning-based biomedical image segmentation","volume":"18","author":"Isensee","year":"2021","journal-title":"Nat Methods"},{"article-title":"ParC-net: position aware circular convolution with merits from ConvNets and transformer","series-title":"Proceedings of the Computer Vision\u2014ECCV 2022; 2022 Oct 23\u201327","author":"Zhang","key":"ref29"},{"article-title":"CMT: convolutional neural networks meet vision transformers","series-title":"Proceedings of the 2022 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR); 2022 Jun 18\u201324","author":"Guo","key":"ref30"},{"key":"ref31","doi-asserted-by":"crossref","first-page":"896","DOI":"10.1109\/TPAMI.2023.3329173","article-title":"MetaFormer baselines for vision","volume":"46","author":"Yu","year":"2024","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref32","doi-asserted-by":"crossref","first-page":"8176","DOI":"10.1109\/TPAMI.2023.3236725","article-title":"Convolution-enhanced evolving attention networks","volume":"45","author":"Wang","year":"2023","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref33","doi-asserted-by":"crossref","first-page":"144","DOI":"10.1109\/TBC.2022.3204235","article-title":"Attentional feature fusion for end-to-end blind image quality assessment","volume":"69","author":"Zhou","year":"2023","journal-title":"IEEE Trans Broadcast"},{"key":"ref34","doi-asserted-by":"crossref","first-page":"1326","DOI":"10.1109\/TIP.2022.3197972","article-title":"Decoupled cross-modal phrase-attention network for image-sentence matching","volume":"33","author":"Shi","year":"2022","journal-title":"IEEE Trans Image Process"},{"key":"ref35","doi-asserted-by":"crossref","first-page":"2917","DOI":"10.1007\/s10462-023-10595-0","article-title":"A survey of the vision transformers and their CNN-transformer based variants","volume":"56","author":"Khan","year":"2023","journal-title":"Artif Intell Rev"},{"article-title":"Evaluating Adan vs. Adam: an analysis of optimizer performance in deep learning","series-title":"Proceedings of the 5th International Symposium on Intelligent Computing Systems, ISICS 2024; 2024 Nov 6\u20137","author":"Ismail","key":"ref36"}],"container-title":["Computers, Materials &amp; Continua"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/cdn.techscience.cn\/files\/cmc\/2025\/TSP_CMC-85-2\/TSP_CMC_66937\/TSP_CMC_66937.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,4]],"date-time":"2025-12-04T05:35:40Z","timestamp":1764826540000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.techscience.com\/cmc\/v85n2\/63805"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"references-count":36,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2025]]},"published-print":{"date-parts":[[2025]]}},"URL":"https:\/\/doi.org\/10.32604\/cmc.2025.066937","relation":{},"ISSN":["1546-2226"],"issn-type":[{"type":"electronic","value":"1546-2226"}],"subject":[],"published":{"date-parts":[[2025]]}}}