{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T19:07:06Z","timestamp":1775156826705,"version":"3.50.1"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2025,9,24]],"date-time":"2025-09-24T00:00:00Z","timestamp":1758672000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,9,24]],"date-time":"2025-09-24T00:00:00Z","timestamp":1758672000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100001809","name":"The National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["62266025"],"award-info":[{"award-number":["62266025"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J. King Saud Univ. Comput. Inf. Sci."],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1007\/s44443-025-00159-3","type":"journal-article","created":{"date-parts":[[2025,9,24]],"date-time":"2025-09-24T10:37:24Z","timestamp":1758710244000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["DR-MAE: Self-supervised learning for diabetic retinopathy grading based on masked autoencoder"],"prefix":"10.1007","volume":"37","author":[{"given":"Yanyou","family":"Ren","sequence":"first","affiliation":[]},{"given":"Dangguo","family":"Shao","sequence":"additional","affiliation":[]},{"given":"Sanli","family":"Yi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,9,24]]},"reference":[{"issue":"3","key":"159_CR1","doi-asserted-by":"publisher","first-page":"467","DOI":"10.1109\/TBCAS.2022.3182907","volume":"16","author":"AB Aujih","year":"2022","unstructured":"Aujih AB, Shapiai MI, Meriaudeau F, Tang TB (2022) EDR-Net: Lightweight deep neural network architecture for detecting referable diabetic retinopathy. IEEE Trans Biomed Circuits Syst 16(3):467\u2013478. https:\/\/doi.org\/10.1109\/TBCAS.2022.3182907","journal-title":"IEEE Trans Biomed Circuits Syst"},{"key":"159_CR2","unstructured":"Bao H, Dong L, Piao S, et al. Beit: Bert pre-training of image transformers[J]. arXiv preprint arXiv:2106.08254, 2021."},{"key":"159_CR3","doi-asserted-by":"publisher","first-page":"105341","DOI":"10.1016\/j.compbiomed.2022.105341","volume":"144","author":"P Cao","year":"2022","unstructured":"Cao P, Hou Q, Song R, Wang H, Zaiane O (2022) Collaborative learning of weaklysupervised domain adaptation for diabetic retinopathy grading on retinal images. Comput Biol Med 144:105341","journal-title":"Comput Biol Med"},{"key":"159_CR4","unstructured":"Chen X, Fan H, Girshick R, et al. Improved baselines with momentum contrastive learning[J]. arXiv preprint arXiv:2003.04297, 2020."},{"key":"159_CR5","unstructured":"Chen T, Kornblith S, Norouzi M, et al. A simple framework for contrastive learning of visual representations[C]\/\/International conference on machine learning. PMLR, 2020: 1597\u20131607."},{"key":"159_CR6","doi-asserted-by":"publisher","first-page":"107037","DOI":"10.1016\/j.compbiomed.2023.107037","volume":"161","author":"Y Dai","year":"2023","unstructured":"Dai Y, Liu F, Chen W et al (2023) Swin MAE: masked autoencoders for small datasets[J]. Comput Biol Med 161:107037","journal-title":"Comput Biol Med"},{"key":"159_CR7","unstructured":"Diabetic retinopathy screening. EyePACS; 8 May 2019. www.eyepacs.com\/"},{"key":"159_CR8","doi-asserted-by":"crossref","unstructured":"Ding X, Zhang X, Ma N, et al. Repvgg: Making vgg-style convnets great again[C]\/\/Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2021: 13733\u201313742.","DOI":"10.1109\/CVPR46437.2021.01352"},{"key":"159_CR9","unstructured":"Dosovitskiy A. An image is worth 16x16 words: Transformers for image recognition at scale[J]. arXiv preprint arXiv:2010.11929, 2020."},{"key":"159_CR10","unstructured":"Gao P, Ma T, Li H, et al. Convmae: Masked convolution meets masked autoencoders[J]. arXiv preprint arXiv:2205.03892, 2022."},{"key":"159_CR11","unstructured":"Geng X, Liu H, Lee L, et al. Multimodal masked autoencoders learn transferable representations[J]. arXiv preprint arXiv:2205.14204, 2022."},{"issue":"1","key":"159_CR12","doi-asserted-by":"publisher","first-page":"1305583","DOI":"10.1155\/2023\/1305583","volume":"2023","author":"Z Gu","year":"2023","unstructured":"Gu Z, Li Y, Wang Z et al (2023) Classification of diabetic retinopathy severity in fundus images using the vision transformer and residual attention[J]. Comput Intell Neurosci 2023(1):1305583","journal-title":"Comput Intell Neurosci"},{"issue":"13","key":"159_CR13","doi-asserted-by":"publisher","first-page":"16797","DOI":"10.1007\/s10489-022-04295-5","volume":"53","author":"X Guo","year":"2023","unstructured":"Guo X, Li X, Lin Q et al (2023) Joint grading of diabetic retinopathy and diabetic macular edema using an adaptive attention block and semisupervised learning[J]. Appl Intell 53(13):16797\u201316812","journal-title":"Appl Intell"},{"key":"159_CR14","unstructured":"Hatamizadeh A, Heinrich G, Yin H, et al. Fastervit: Fast vision transformers with hierarchical attention[J]. arXiv preprint arXiv:2306.06189, 2023."},{"issue":"1","key":"159_CR15","doi-asserted-by":"publisher","first-page":"143","DOI":"10.1109\/TMI.2020.3023463","volume":"40","author":"A He","year":"2020","unstructured":"He A, Li T, Li N, Wang K, Fu H (2020b) CABNet: category attention block for imbalanced diabetic retinopathy grading. IEEE Trans Med Imaging 40(1):143\u2013153","journal-title":"IEEE Trans Med Imaging"},{"key":"159_CR16","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, et al. Deep residual learning for image recognition[C]\/\/Proceedings of the IEEE conference on computer vision and pattern recognition. 2016: 770\u2013778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"159_CR17","doi-asserted-by":"crossref","unstructured":"He K, Fan H, Wu Y, et al. Momentum contrast for unsupervised visual representation learning[C]\/\/Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2020: 9729\u20139738.","DOI":"10.1109\/CVPR42600.2020.00975"},{"key":"159_CR18","doi-asserted-by":"crossref","unstructured":"He K, Chen X, Xie S, et al. Masked autoencoders are scalable vision learners[C]\/\/Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2022: 16000\u201316009.","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"159_CR19","doi-asserted-by":"publisher","first-page":"105602","DOI":"10.1016\/j.compbiomed.2022.105602","volume":"146","author":"MR Islam","year":"2022","unstructured":"Islam MR, Abdulrazak LF, Nahiduzzaman M et al (2022) Applying supervised contrastive learning for the detection of diabetic retinopathy and its severity levels from fundus images[J]. Comput Biol Med 146:105602","journal-title":"Comput Biol Med"},{"key":"159_CR20","doi-asserted-by":"publisher","first-page":"103256","DOI":"10.1016\/j.media.2024.103256","volume":"97","author":"Q Kang","year":"2024","unstructured":"Kang Q, Lao Q, Gao J et al (2024) Deblurring masked image modeling for ultrasound image analysis[J]. Med Image Anal 97:103256","journal-title":"Med Image Anal"},{"key":"159_CR21","unstructured":"M. Karthick, D. Sohier, APTOS 2019 blindness detection, 2019, Kagglehttps:\/\/kaggle.com\/competitions\/aptos2019-blindness-detection."},{"key":"159_CR22","doi-asserted-by":"publisher","first-page":"61408","DOI":"10.1109\/ACCESS.2021.3074422","volume":"9","author":"Z Khan","year":"2021","unstructured":"Khan Z, Khan FG, Khan A, Rehman ZU, Shah S, Qummar S et al (2021) Diabetic retinopathy detection using VGG-NIN a deep learning architecture. IEEE Access 9:61408\u201361416. https:\/\/doi.org\/10.1109\/ACCESS.2021.3074422","journal-title":"IEEE Access"},{"key":"159_CR23","unstructured":"Kim T, Chun S, Heo B, et al. Longer-range Contextualized Masked Autoencoder[J]. arXiv preprint arXiv:2310.13593, 2023."},{"key":"159_CR24","doi-asserted-by":"publisher","first-page":"107994","DOI":"10.1016\/j.engappai.2024.107994","volume":"133","author":"Y Lei","year":"2024","unstructured":"Lei Y, Lin S, Li Z et al (2024) GNN-fused CapsNet with multi-head prediction for diabetic retinopathy grading[J]. Eng Appl Artif Intell 133:107994","journal-title":"Eng Appl Artif Intell"},{"key":"159_CR25","doi-asserted-by":"publisher","first-page":"511","DOI":"10.1016\/j.ins.2019.06.011","volume":"501","author":"T Li","year":"2019","unstructured":"Li T, Gao Y, Wang K, Guo S, Liu H, Kang H (2019) Diagnostic assessment of deep learning algorithms for diabetic retinopathy screening. Inform Sci 501:511\u2013522","journal-title":"Inform Sci"},{"key":"159_CR26","doi-asserted-by":"publisher","first-page":"105607","DOI":"10.1016\/j.bspc.2023.105607","volume":"88","author":"J Lian","year":"2024","unstructured":"Lian J, Liu T (2024) Lesion identification in fundus images via convolutional neural network-vision transformer[J]. Biomed Signal Process Control 88:105607","journal-title":"Biomed Signal Process Control"},{"issue":"1","key":"159_CR27","first-page":"857","volume":"35","author":"X Liu","year":"2021","unstructured":"Liu X, Zhang F, Hou Z et al (2021a) Self-supervised learning: Generative or contrastive[J]. IEEE Trans Knowl Data Eng 35(1):857\u2013876","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"159_CR28","doi-asserted-by":"crossref","unstructured":"Liu X, Chi W. A cross-lesion attention network for accurate diabetic retinopathy grading with fundus images[J]. IEEE Transactions on Instrumentation and Measurement, 2023.","DOI":"10.1109\/TIM.2023.3322497"},{"key":"159_CR29","doi-asserted-by":"crossref","unstructured":"Liu Z, Lin Y, Cao Y, et al. Swin transformer: Hierarchical vision transformer using shifted windows[C]\/\/Proceedings of the IEEE\/CVF international conference on computer vision. 2021: 10012\u201310022.","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"159_CR30","doi-asserted-by":"crossref","unstructured":"Liu Z, Mao H, Wu C Y, et al. A convnet for the 2020s[C]\/\/Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2022: 11976\u201311986.","DOI":"10.1109\/CVPR52688.2022.01167"},{"key":"159_CR31","doi-asserted-by":"crossref","unstructured":"Ma X, Dai X, Bai Y, et al. Rewrite the Stars[C]\/\/Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2024: 5694\u20135703.","DOI":"10.1109\/CVPR52733.2024.00544"},{"key":"159_CR32","doi-asserted-by":"publisher","first-page":"117546","DOI":"10.1109\/ACCESS.2023.3326528","volume":"11","author":"W Nazih","year":"2023","unstructured":"Nazih W, Aseeri AO, Atallah OY et al (2023) Vision transformer model for predicting the severity of diabetic retinopathy in fundus photography-based retina images[J]. IEEE Access 11:117546\u2013117561","journal-title":"IEEE Access"},{"key":"159_CR33","unstructured":"Nguyen D K, Aggarwal V, Li Y, et al. R-mae: Regions meet masked autoencoders[J]. arXiv preprint arXiv:2306.05411, 2023."},{"key":"159_CR34","doi-asserted-by":"publisher","first-page":"108523","DOI":"10.1016\/j.compbiomed.2024.108523","volume":"175","author":"M Oulhadj","year":"2024","unstructured":"Oulhadj M, Riffi J, Khodriss C et al (2024) Diabetic retinopathy prediction based on vision transformer and modified capsule network[J]. Comput Biol Med 175:108523","journal-title":"Comput Biol Med"},{"key":"159_CR35","doi-asserted-by":"publisher","first-page":"108460","DOI":"10.1016\/j.compbiomed.2024.108460","volume":"174","author":"W Park","year":"2024","unstructured":"Park W, Ryu J (2024) Fine-Grained Self-Supervised Learning with Jigsaw puzzles for medical image classification[J]. Comput Biol Med 174:108460","journal-title":"Comput Biol Med"},{"key":"159_CR36","doi-asserted-by":"publisher","first-page":"105928","DOI":"10.1016\/j.bspc.2023.105928","volume":"91","author":"I Park","year":"2024","unstructured":"Park I, Kim WH, Ryu J (2024) Style-KD: Class-imbalanced medical image classification via style knowledge distillation[J]. Biomed Signal Process Control 91:105928","journal-title":"Biomed Signal Process Control"},{"key":"159_CR37","doi-asserted-by":"crossref","unstructured":"P. Qian, Z. Zhao, C. Chen, Z. Zeng, X. Li, Two eyes are better than one: Exploiting binocular correlation for diabetic retinopathy severity grading, in: Proc. IEEE EMBC 2021, IEEE, 2021, pp. 2115\u20132118.","DOI":"10.1109\/EMBC46164.2021.9630812"},{"key":"159_CR38","doi-asserted-by":"crossref","unstructured":"Shi D. TransNeXt: Robust Foveal Visual Perception for Vision Transformers[C]\/\/Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2024: 17773\u201317783.","DOI":"10.1109\/CVPR52733.2024.01683"},{"key":"159_CR39","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.preteyeres.2017.11.003","volume":"64","author":"RF Spaide","year":"2018","unstructured":"Spaide RF, Fujimoto JG, Waheed NK et al (2018) Optical coherence tomography angiography[J]. Prog Retin Eye Res 64:1\u201355","journal-title":"Prog Retin Eye Res"},{"key":"159_CR40","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1016\/j.cmpb.2016.10.017","volume":"138","author":"R Srivastava","year":"2017","unstructured":"Srivastava R, Duan L, Wong DWK et al (2017) Detecting retinal microaneurysms and hemorrhages with robustness to the presence of blood vessels[J]. Comput Methods Programs Biomed 138:83\u201391","journal-title":"Comput Methods Programs Biomed"},{"key":"159_CR41","doi-asserted-by":"publisher","first-page":"107876","DOI":"10.1016\/j.cmpb.2023.107876","volume":"243","author":"Z Tan","year":"2024","unstructured":"Tan Z, Yu Y, Meng J et al (2024) Self-supervised learning with self-distillation on COVID-19 medical image classification[J]. Comput Methods Programs Biomed 243:107876","journal-title":"Comput Methods Programs Biomed"},{"issue":"11","key":"159_CR42","doi-asserted-by":"publisher","first-page":"1580","DOI":"10.1016\/j.ophtha.2021.04.027","volume":"128","author":"ZL Teo","year":"2021","unstructured":"Teo ZL, Tham YC, Yu M et al (2021) Global prevalence of diabetic retinopathy and projection of burden through 2045: systematic review and meta-analysis[J]. Ophthalmology 128(11):1580\u20131591","journal-title":"Ophthalmology"},{"key":"159_CR43","doi-asserted-by":"crossref","unstructured":"Vij, R., Arora, S., 2023. A novel deep transfer learning based computerized diagnostic systems for multi-class imbalanced diabetic retinopathy severity classification.Multimedia Tools Appl. 1\u201338.","DOI":"10.1007\/s11042-023-14963-4"},{"issue":"9","key":"159_CR44","doi-asserted-by":"publisher","first-page":"1677","DOI":"10.1016\/S0161-6420(03)00475-5","volume":"110","author":"CP Wilkinson","year":"2003","unstructured":"Wilkinson CP et al (2003) Proposed international clinical diabetic retinopathy and diabetic macular edema disease severity scales. Ophthalmology 110(9):1677\u20131682","journal-title":"Ophthalmology"},{"key":"159_CR45","doi-asserted-by":"publisher","first-page":"103304","DOI":"10.1016\/j.media.2024.103304","volume":"98","author":"Y Xie","year":"2024","unstructured":"Xie Y, Gu L, Harada T et al (2024) Rethinking masked image modelling for medical image representation[J]. Med Image Anal 98:103304","journal-title":"Med Image Anal"},{"key":"159_CR46","doi-asserted-by":"crossref","unstructured":"Xie Z, Zhang Z, Cao Y, et al. Simmim: A simple framework for masked image modeling[C]\/\/Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 2022: 9653\u20139663.","DOI":"10.1109\/CVPR52688.2022.00943"},{"issue":"11","key":"159_CR47","doi-asserted-by":"publisher","first-page":"9562","DOI":"10.1109\/TNNLS.2022.3158966","volume":"34","author":"J Xu","year":"2022","unstructured":"Xu J, Pan Y, Pan X et al (2022) RegNet: Self-regulated network for image classification[J]. IEEE Transactions on Neural Networks and Learning Systems 34(11):9562\u20139567","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"issue":"11","key":"159_CR48","doi-asserted-by":"publisher","first-page":"11407","DOI":"10.1109\/TCYB.2021.3062638","volume":"52","author":"Y Yang","year":"2021","unstructured":"Yang Y, Shang F, Wu B, Yang D, Wang L, Xu Y, Zhang W, Zhang T (2021) Robust collaborative learning of patch-level and image-level annotations for diabetic retinopathy grading from fundus image. IEEE Trans Cybern 52(11):11407\u201311417","journal-title":"IEEE Trans Cybern"},{"key":"159_CR49","doi-asserted-by":"publisher","first-page":"107993","DOI":"10.1016\/j.compbiomed.2024.107993","volume":"170","author":"F Zang","year":"2024","unstructured":"Zang F, Ma H (2024) CRA-Net: Transformer guided category-relation attention network for diabetic retinopathy grading[J]. Comput Biol Med 170:107993","journal-title":"Comput Biol Med"},{"key":"159_CR50","doi-asserted-by":"crossref","unstructured":"Zhang C, Zhang C, Song J, et al. A survey on masked autoencoder for self-supervised learning in vision and beyond[J]. arXiv preprint arXiv:2208.00173, 2022.","DOI":"10.24963\/ijcai.2023\/762"}],"container-title":["Journal of King Saud University Computer and Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s44443-025-00159-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s44443-025-00159-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s44443-025-00159-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,29]],"date-time":"2025-10-29T15:36:49Z","timestamp":1761752209000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s44443-025-00159-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,24]]},"references-count":50,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2025,10]]}},"alternative-id":["159"],"URL":"https:\/\/doi.org\/10.1007\/s44443-025-00159-3","relation":{},"ISSN":["1319-1578","2213-1248"],"issn-type":[{"value":"1319-1578","type":"print"},{"value":"2213-1248","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,24]]},"assertion":[{"value":"26 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 July 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 September 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"217"}}