{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T21:16:36Z","timestamp":1774905396857,"version":"3.50.1"},"reference-count":93,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T00:00:00Z","timestamp":1774828800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T00:00:00Z","timestamp":1774828800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Cluster Comput"],"published-print":{"date-parts":[[2026,8]]},"DOI":"10.1007\/s10586-026-06045-5","type":"journal-article","created":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T20:30:25Z","timestamp":1774902625000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Deep learning approaches in computer vision: a comprehensive survey"],"prefix":"10.1007","volume":"29","author":[{"given":"Shilan","family":"Reshadi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shiva","family":"TaghipourEivazi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ali","family":"Ghaffari","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Amir","family":"Seyyedabbasi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,3,30]]},"reference":[{"key":"6045_CR1","doi-asserted-by":"publisher","unstructured":"Alzubaidi, L., et al.: Review of deep learning: concepts, CNN architectures, challenges, applications, future directions. J. Big Data. 8(1) (2021). https:\/\/doi.org\/10.1186\/s40537-021-00444-8","DOI":"10.1186\/s40537-021-00444-8"},{"issue":"8","key":"6045_CR2","doi-asserted-by":"publisher","first-page":"5455","DOI":"10.1007\/s10462-020-09825-6","volume":"53","author":"A Khan","year":"2020","unstructured":"Khan, A., Sohail, A., Zahoora, U., Qureshi, A.S.: A survey of the recent architectures of deep convolutional neural networks. Artif. Intell. Rev. 53(8), 5455\u20135516 (2020). https:\/\/doi.org\/10.1007\/s10462-020-09825-6","journal-title":"Artif. Intell. Rev."},{"key":"6045_CR3","doi-asserted-by":"publisher","unstructured":"LeCun, Y., Bottou, L., Bengio, Y., Haffner, P.: Gradient-based learning applied to document recognition, Proceed IEEE. 86(11), 2278\u20132323 (1998). https:\/\/doi.org\/10.1109\/5.726791","DOI":"10.1109\/5.726791"},{"key":"6045_CR4","doi-asserted-by":"crossref","unstructured":"Krizhevsky, B.A., Sutskever, I., Hinton, G.E.: ImageNet Classification with Deep Convolutional Neural Networks Commun ACM 60(6), 84\u201390 (2012)","DOI":"10.1145\/3065386"},{"key":"6045_CR5","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition, in 3rd International Conference on Learning Representations, ICLR 2015 - Conference Track Proceedings, (2015)"},{"key":"6045_CR6","doi-asserted-by":"publisher","first-page":"82031","DOI":"10.1109\/ACCESS.2021.3086020","volume":"9","author":"N Siddique","year":"2021","unstructured":"Siddique, N., Paheding, S., Elkin, C.P., Devabhaktuni, V.: U-Net and Its Variants for Medical Image Segmentation: A Review of Theory and Applications. IEEE Access. 9, 82031\u201382057 (2021). https:\/\/doi.org\/10.1109\/ACCESS.2021.3086020","journal-title":"IEEE Access."},{"key":"6045_CR7","doi-asserted-by":"publisher","unstructured":"Archana, R., Jeevaraj, P.S.E.: Deep learning models for digital image processing: a review. Artif. Intell. Rev. 57(1) (2024). https:\/\/doi.org\/10.1007\/s10462-023-10631-z","DOI":"10.1007\/s10462-023-10631-z"},{"key":"6045_CR8","doi-asserted-by":"publisher","unstructured":"Voulodimos, A., Doulamis, N., Doulamis, A., Protopapadakis, E.: Deep learning for computer vision: A brief review. Comput. Intell. Neurosci. (2018). https:\/\/doi.org\/10.1155\/2018\/7068349","DOI":"10.1155\/2018\/7068349"},{"issue":"1","key":"6045_CR9","doi-asserted-by":"publisher","first-page":"22","DOI":"10.29099\/ijair.v2i1.42","volume":"2","author":"V Wiley","year":"2018","unstructured":"Wiley, V., Lucas, T.: Computer Vision and Image Processing: A Paper Review. Int. J. Artif. Intell. Res. 2(1), 22 (2018). https:\/\/doi.org\/10.29099\/ijair.v2i1.42","journal-title":"Int. J. Artif. Intell. Res."},{"key":"6045_CR10","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.neucom.2016.12.038","volume":"234","author":"W Liu","year":"2017","unstructured":"Liu, W., Wang, Z., Liu, X., Zeng, N., Liu, Y., Alsaadi, F.E.: A survey of deep neural network architectures and their applications. Neurocomputing. 234, 11\u201326 (2017)","journal-title":"Neurocomputing"},{"key":"6045_CR11","unstructured":"Noor, M.H.M., Ige, A.O.: A Survey on State-of-the-art Deep Learning Applications and Challenges, (2024). http:\/\/arxiv.org\/abs\/2403.17561"},{"key":"6045_CR12","doi-asserted-by":"publisher","unstructured":"Mienye, I.D., Swart, T.G., A Comprehensive Review of Deep Learning: Architectures, Advances, R., Applications, D.: (2024). https:\/\/doi.org\/10.3390\/info15120755","DOI":"10.3390\/info15120755"},{"key":"6045_CR13","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1016\/j.neucom.2015.09.116","volume":"187","author":"Y Guo","year":"2016","unstructured":"Guo, Y., Liu, Y., Oerlemans, A., Lao, S., Wu, S., Lew, M.S.: Deep learning for visual understanding: A review. Neurocomputing. 187, 27\u201348 (2016). https:\/\/doi.org\/10.1016\/j.neucom.2015.09.116","journal-title":"Neurocomputing"},{"key":"6045_CR14","unstructured":"Wang, H., Raj, B.: On the Origin of Deep Learning, 1\u201372, (2017). http:\/\/arxiv.org\/abs\/1702.07800"},{"key":"6045_CR15","doi-asserted-by":"publisher","DOI":"10.1155\/2023\/7091301","author":"B Sistaninejhad","year":"2023","unstructured":"Sistaninejhad, B., Rasi, H., Nayeri, P.: A Review Paper about Deep Learning for Medical Image Analysis. Hindawi Ltd. (2023). https:\/\/doi.org\/10.1155\/2023\/7091301","journal-title":"Hindawi Ltd."},{"key":"6045_CR16","doi-asserted-by":"publisher","unstructured":"F\u0131rat, H., Asker, M.E., Bayindir, M., Hanbay, D.: Spatial-spectral classification of hyperspectral remote sensing images using 3D CNN based LeNet-5 architecture. Infrared Phys. Technol. 127 (2022). https:\/\/doi.org\/10.1016\/j.infrared.2022.104470","DOI":"10.1016\/j.infrared.2022.104470"},{"key":"6045_CR17","doi-asserted-by":"publisher","unstructured":"Balasubramaniam, S., Velmurugan, Y., Jaganathan, D., Dhanasekaran, S.: A Modified LeNet CNN for Breast Cancer Diagnosis in Ultrasound Images. Diagnostics. 13(17) (2023). https:\/\/doi.org\/10.3390\/diagnostics13172746","DOI":"10.3390\/diagnostics13172746"},{"key":"6045_CR18","doi-asserted-by":"publisher","unstructured":"Eldem, H., \u00dclker, E., I\u015f\u0131kl\u0131, O.Y.: Alexnet architecture variations with transfer learning for classification of wound images. Eng. Sci. Technol. Int. J. 45 (2023). https:\/\/doi.org\/10.1016\/j.jestch.2023.101490","DOI":"10.1016\/j.jestch.2023.101490"},{"key":"6045_CR19","doi-asserted-by":"publisher","unstructured":"Kollem, S., et al.: Jul., AlexNet-NDTL: Classification of MRI brain tumor images using modified AlexNet with deep transfer learning and Lipschitz-based data augmentation, Int J Imaging Syst Technol. 33(4), 1306\u20131322 (2023). https:\/\/doi.org\/10.1002\/ima.22870","DOI":"10.1002\/ima.22870"},{"key":"6045_CR20","doi-asserted-by":"publisher","unstructured":"Zhang, C., Zhang, H., Tian, F., Zhou, Y., Zhao, S., Du, X.: Research on sheep face recognition algorithm based on improved AlexNet model, Neural Comput Appl. 35(36), 24971\u201324979 (2023). https:\/\/doi.org\/10.1007\/s00521-023-08413-3","DOI":"10.1007\/s00521-023-08413-3"},{"key":"6045_CR21","doi-asserted-by":"publisher","unstructured":"Shibu George, G., Raj Mishra, P., Sinha, P., Ranjan Prusty, M.: COVID-19 detection on chest X-ray images using Homomorphic Transformation and VGG inspired deep convolutional neural network. Biocybern Biomed. Eng. 43(1), 1\u201316 (2023). https:\/\/doi.org\/10.1016\/j.bbe.2022.11.003","DOI":"10.1016\/j.bbe.2022.11.003"},{"key":"6045_CR22","doi-asserted-by":"publisher","first-page":"72518","DOI":"10.1109\/ACCESS.2023.3289224","volume":"11","author":"A Jabbar","year":"2023","unstructured":"Jabbar, A., Naseem, S., Mahmood, T., Saba, T., Alamri, F.S., Rehman, A.: Brain Tumor Detection and Multi-Grade Segmentation Through Hybrid Caps-VGGNet Model. IEEE Access. 11, 72518\u201372536 (2023). https:\/\/doi.org\/10.1109\/ACCESS.2023.3289224","journal-title":"IEEE Access."},{"key":"6045_CR23","doi-asserted-by":"publisher","unstructured":"Vignesh, S., Savithadevi, M., Sridevi, M., Sridhar, R.: A novel facial emotion recognition model using segmentation VGG-19 architecture. Int. J. Inform. Technol. (Singapore). 15(4), 1777\u20131787 (2023). https:\/\/doi.org\/10.1007\/s41870-023-01184-z","DOI":"10.1007\/s41870-023-01184-z"},{"key":"6045_CR24","doi-asserted-by":"publisher","unstructured":"Zou, J., Guo, W., Wang, F.: A Study on Pavement Classification and Recognition Based on VGGNet-16 Transfer Learning. Electron. (Switzerland). 12(15) (2023). https:\/\/doi.org\/10.3390\/electronics12153370","DOI":"10.3390\/electronics12153370"},{"issue":"3","key":"6045_CR25","doi-asserted-by":"publisher","first-page":"395","DOI":"10.1080\/24751839.2021.1893495","volume":"5","author":"E Yilmaz","year":"2021","unstructured":"Yilmaz, E., Trocan, M.: A modified version of GoogLeNet for melanoma diagnosis. J. Inform. Telecommunication. 5(3), 395\u2013405 (2021). https:\/\/doi.org\/10.1080\/24751839.2021.1893495","journal-title":"J. Inform. Telecommunication"},{"issue":"1","key":"6045_CR26","doi-asserted-by":"publisher","first-page":"565","DOI":"10.32604\/cmc.2023.036317","volume":"75","author":"W Zhang","year":"2023","unstructured":"Zhang, W., Li, J., Bhatti, U.A., Liu, J., Zheng, J., Chen, Y.W.: Robust Multi-Watermarking Algorithm for Medical Images Based on GoogLeNet and Henon Map. Computers Mater. Continua. 75(1), 565\u2013586 (2023). https:\/\/doi.org\/10.32604\/cmc.2023.036317","journal-title":"Computers Mater. Continua"},{"key":"6045_CR27","doi-asserted-by":"publisher","unstructured":"Chen, S.-H., Wu, Y.-L., Pan, C.-Y., Lian, L.-Y., Su, Q.-C.: Breast ultrasound image classification and physiological assessment based on GoogLeNet. J. Radiat. Res. Appl. Sci. 16(3), 100628 (2023). https:\/\/doi.org\/10.1016\/j.jrras.2023.100628","DOI":"10.1016\/j.jrras.2023.100628"},{"key":"6045_CR28","doi-asserted-by":"publisher","unstructured":"Hasanah, S.A., Pravitasari, A.A., Abdullah, A.S., Yulita, I.N., Asnawi, M.H.: A Deep Learning Review of ResNet Architecture for Lung Disease Identification in CXR Image. Dec 01, 2023, Multidisciplinary Digital Publishing Institute (MDPI). https:\/\/doi.org\/10.3390\/app132413111","DOI":"10.3390\/app132413111"},{"key":"6045_CR29","doi-asserted-by":"publisher","unstructured":"Liu, K., et al.: Prediction of Primary Tumor Sites in Spinal Metastases Using a ResNet-50 Convolutional Neural Network Based on MRI. Cancers (Basel). 15(11) (2023). https:\/\/doi.org\/10.3390\/cancers15112974","DOI":"10.3390\/cancers15112974"},{"key":"6045_CR30","doi-asserted-by":"publisher","unstructured":"Kanavos, A., Mylonas, P.: Deep Learning Analysis of Histopathology Images for Breast Cancer Detection: A Comparative Study of ResNet and VGG Architectures, in 2023 18th International Workshop on Semantic and Social Media Adaptation and Personalization, SMAP 2023, Institute of Electrical and Electronics Engineers Inc., (2023). https:\/\/doi.org\/10.1109\/SMAP59435.2023.10255168","DOI":"10.1109\/SMAP59435.2023.10255168"},{"key":"6045_CR31","doi-asserted-by":"publisher","unstructured":"Chhabra, M., Kumar, R.: An Efficient ResNet-50 based Intelligent Deep Learning Model to Predict Pneumonia from Medical Images, in International Conference on Sustainable Computing and Data Communication Systems, ICSCDS 2022 - Proceedings, Institute of Electrical and Electronics Engineers Inc., pp. 1714\u20131721. (2022). https:\/\/doi.org\/10.1109\/ICSCDS53736.2022.9760995","DOI":"10.1109\/ICSCDS53736.2022.9760995"},{"key":"6045_CR32","doi-asserted-by":"publisher","unstructured":"Liao, T., et al.: Classification of asymmetry in mammography via the DenseNet convolutional neural network, Dec. 01, Elsevier Ltd. (2023). https:\/\/doi.org\/10.1016\/j.ejro.2023.100502","DOI":"10.1016\/j.ejro.2023.100502"},{"key":"6045_CR33","doi-asserted-by":"publisher","unstructured":"Zhu, H., et al.: MEEDNets: Medical Image Classification via Ensemble Bio-inspired Evolutionary DenseNets. Knowl. Based Syst. 280 (2023). https:\/\/doi.org\/10.1016\/j.knosys.2023.111035","DOI":"10.1016\/j.knosys.2023.111035"},{"key":"6045_CR34","doi-asserted-by":"publisher","unstructured":"Chauhan, T., Palivela, H., Tiwari, S.: Optimization and fine-tuning of DenseNet model for classification of COVID-19 cases in medical imaging. Int. J. Inform. Manage. Data Insights. 1(2) (2021). https:\/\/doi.org\/10.1016\/j.jjimei.2021.100020","DOI":"10.1016\/j.jjimei.2021.100020"},{"key":"6045_CR35","doi-asserted-by":"publisher","unstructured":"Prakash, N.N., Rajesh, V., Namakhwa, D.L., Dwarkanath Pande, S., Ahammad, S.H.: A DenseNet CNN-based liver lesion prediction and classification for future medical diagnosis. Sci. Afr. 20 (2023). https:\/\/doi.org\/10.1016\/j.sciaf.2023.e01629","DOI":"10.1016\/j.sciaf.2023.e01629"},{"key":"6045_CR36","doi-asserted-by":"publisher","unstructured":"Sajid, M.Z., et al.: Mobile-HR: An Ophthalmologic-Based Classification System for Diagnosis of Hypertensive Retinopathy Using Optimized MobileNet Architecture. Diagnostics. 13(8) (2023). https:\/\/doi.org\/10.3390\/diagnostics13081439","DOI":"10.3390\/diagnostics13081439"},{"key":"6045_CR37","doi-asserted-by":"publisher","unstructured":"Kumar Lilhore, U., et al.: A precise model for skin cancer diagnosis using hybrid U-Net and improved MobileNet-V3 with hyperparameters optimization. Sci. Rep. 14(1) (2024). https:\/\/doi.org\/10.1038\/s41598-024-54212-8","DOI":"10.1038\/s41598-024-54212-8"},{"key":"6045_CR38","doi-asserted-by":"publisher","unstructured":"Gang, L., Haixuan, Z., Linning, E., Ling, Z., Yu, L., Juming, Z.: Recognition of honeycomb lung in CT images based on improved MobileNet model, Med Phys. 48(8), 4304\u20134315 (2021). https:\/\/doi.org\/10.1002\/mp.14873","DOI":"10.1002\/mp.14873"},{"key":"6045_CR39","doi-asserted-by":"publisher","unstructured":"Al, M.S., Reshan, et al.: Detection of Pneumonia from Chest X-ray Images Utilizing MobileNet Model. Healthc. (Switzerland). 11(11) (2023). https:\/\/doi.org\/10.3390\/healthcare11111561","DOI":"10.3390\/healthcare11111561"},{"key":"6045_CR40","doi-asserted-by":"publisher","unstructured":"Agarwal, D., Berb\u00eds, M., Luna, A., Lipari, V., Ballester, J.B., de la Torre-D\u00edez, I.: Automated Medical Diagnosis of Alzheimer\u00b4s Disease Using an Efficient Net Convolutional Neural Network. J. Med. Syst. 47(1) (2023). https:\/\/doi.org\/10.1007\/s10916-023-01941-4","DOI":"10.1007\/s10916-023-01941-4"},{"key":"6045_CR41","doi-asserted-by":"publisher","unstructured":"Raza, R., et al.: Lung-EffNet: Lung cancer classification using EfficientNet from CT-scan images. Eng. Appl. Artif. Intell. 126 (2023). https:\/\/doi.org\/10.1016\/j.engappai.2023.106902","DOI":"10.1016\/j.engappai.2023.106902"},{"key":"6045_CR42","doi-asserted-by":"publisher","unstructured":"Tripathy, S., Singh, R., Ray, M.: Automation of Brain Tumor Identification using EfficientNet on Magnetic Resonance Images, in Procedia Computer Science, Elsevier B.V., pp. 1551\u20131560. (2022). https:\/\/doi.org\/10.1016\/j.procs.2023.01.133","DOI":"10.1016\/j.procs.2023.01.133"},{"key":"6045_CR43","doi-asserted-by":"publisher","unstructured":"Talukder, M.A., Layek, M.A., Kazi, M., Uddin, M.A., Aryal, S.: Empowering COVID-19 detection: Optimizing performance through fine-tuned EfficientNet deep learning architecture. Comput. Biol. Med. 168 (2024). https:\/\/doi.org\/10.1016\/j.compbiomed.2023.107789","DOI":"10.1016\/j.compbiomed.2023.107789"},{"issue":"1","key":"6045_CR44","doi-asserted-by":"publisher","first-page":"439","DOI":"10.37385\/jaets.v5i1.3226","volume":"5","author":"S Magesh","year":"2023","unstructured":"Magesh, S., RajaKumar, P.S.: Fetal Heart Disease Detection Via Deep Reg Network Based on Ultrasound Images. J. Appl. Eng. Technological Sci. (JAETS). 5(1), 439\u2013450 (2023). https:\/\/doi.org\/10.37385\/jaets.v5i1.3226","journal-title":"J. Appl. Eng. Technological Sci. (JAETS)"},{"key":"6045_CR45","doi-asserted-by":"publisher","unstructured":"Chetoui, M., Akhloufi, M.A., Bouattane, E.M., Abdulnour, J., Roux, S., Bernard, C.D.: Explainable COVID-19 Detection Based on Chest X-rays Using an End-to-End RegNet Architecture. Viruses. 15(6) (2023). https:\/\/doi.org\/10.3390\/v15061327","DOI":"10.3390\/v15061327"},{"issue":"3","key":"6045_CR46","doi-asserted-by":"publisher","first-page":"5451","DOI":"10.32604\/cmc.2023.033787","volume":"75","author":"Y Chen","year":"2023","unstructured":"Chen, Y., et al.: Deep Learning Based Underground Sewer Defect Classification Using a Modified RegNet. Computers Mater. Continua. 75(3), 5451\u20135469 (2023). https:\/\/doi.org\/10.32604\/cmc.2023.033787","journal-title":"Computers Mater. Continua"},{"key":"6045_CR47","unstructured":"Santana, A., Colombini, E.: Neural Attention Models in Deep Learning: Survey and Taxonomy. (2021). http:\/\/arxiv.org\/abs\/2112.05909"},{"key":"6045_CR48","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2021.3126456","author":"G Brauwers","year":"2022","unstructured":"Brauwers, G., Frasincar, F.: A General Survey on Attention Mechanisms in Deep Learning. (2022). https:\/\/doi.org\/10.1109\/TKDE.2021.3126456","journal-title":"Mar"},{"key":"6045_CR49","doi-asserted-by":"publisher","unstructured":"Dosovitskiy, A., et al.: An image is worth 16\u00d716 words: Transformers for image recognition at scale. (2021). https:\/\/doi.org\/10.48550\/arXiv.2010.11929","DOI":"10.48550\/arXiv.2010.11929"},{"key":"6045_CR50","unstructured":"Radford, A., et al.: Feb., Learning Transferable Visual Models From Natural Language Supervision. (2021). http:\/\/arxiv.org\/abs\/2103.00020"},{"key":"6045_CR51","doi-asserted-by":"publisher","unstructured":"Zhou, J., et al.: Graph neural networks: A review of methods and applications. Jan 01 2020 KeAi Commun. Co. https:\/\/doi.org\/10.1016\/j.aiopen.2021.01.001","DOI":"10.1016\/j.aiopen.2021.01.001"},{"key":"6045_CR52","doi-asserted-by":"publisher","first-page":"4544","DOI":"10.1109\/JSTARS.2022.3176612","volume":"15","author":"S Sun","year":"2022","unstructured":"Sun, S., Dustdar, S., Ranjan, R., Morgan, G., Dong, Y., Wang, L.: Remote Sensing Image Interpretation With Semantic Graph-Based Methods: A Survey. IEEE J. Sel. Top. Appl. Earth Obs Remote Sens. 15, 4544\u20134558 (2022). https:\/\/doi.org\/10.1109\/JSTARS.2022.3176612","journal-title":"IEEE J. Sel. Top. Appl. Earth Obs Remote Sens."},{"key":"6045_CR53","unstructured":"Jaiswal, A., Sodhi, S., Muzamil, M., Chandhok, R.S., Oore, S., Sastry, C.S.: Controlling BigGAN Image Generation with a Segmentation Network."},{"key":"6045_CR54","doi-asserted-by":"publisher","unstructured":"Tian, Y., Tian, C., Fan, Z., Fu, M., Ma, H.: Quantum generative adversarial network with automated noise suppression mechanism based on WGAN-GP, EPJ Quantum Technology. 12(80), (2025). https:\/\/doi.org\/10.1140\/epjqt\/s40507-025-00372-z","DOI":"10.1140\/epjqt\/s40507-025-00372-z"},{"key":"6045_CR55","doi-asserted-by":"publisher","unstructured":"Sun, A., et al.: Scalable QCNN for image classification, November 2024 Physica A Statistical Mechanics and its Applications 657(1):130226. (2025). https:\/\/doi.org\/10.1016\/j.physa.2024.130226","DOI":"10.1016\/j.physa.2024.130226"},{"key":"6045_CR56","doi-asserted-by":"crossref","unstructured":"Caron, M., Touvron, H., Misra, I., et al.: Emerging Properties in Self-Supervised Vision Transformers, in Proc. ICCV, (2021)","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"6045_CR57","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., Girshick, R.: Masked Autoencoders Are Scalable Vision Learners, in Proc. CVPR, (2022)","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"6045_CR58","doi-asserted-by":"crossref","unstructured":"Kirillov, A., Mintun, E., Ravi, N., et al.: Segment Anything, in Proc. ICCV, (2023)","DOI":"10.1109\/ICCV51070.2023.00371"},{"issue":"5","key":"6045_CR59","doi-asserted-by":"publisher","first-page":"323","DOI":"10.3390\/axioms13050323","volume":"13","author":"M Comajoan Cara","year":"2024","unstructured":"Comajoan Cara, M., et al.: Quantum vision transformers for quark\u2013gluon classification. Axioms. 13(5), 323 (2024). https:\/\/doi.org\/10.3390\/axioms13050323","journal-title":"Axioms"},{"key":"6045_CR60","doi-asserted-by":"publisher","first-page":"1265","DOI":"10.22331\/q-2024-02-22-1265","volume":"8","author":"Q Kerenidis","year":"2024","unstructured":"Kerenidis, Q., et al.: Quantum Vision Transformers. Quantum. 8, 1265 (2024). https:\/\/doi.org\/10.22331\/q-2024-02-22-1265","journal-title":"Quantum"},{"key":"6045_CR61","doi-asserted-by":"publisher","unstructured":"Peng, S., Luo, L., Peng, H.: A new framework for graph neural network with local information diffusion. Appl. Intell. 52(9) (2022). https:\/\/doi.org\/10.1007\/s10489-021-03132-5","DOI":"10.1007\/s10489-021-03132-5"},{"key":"6045_CR62","unstructured":"Wang, Z., Zheng, H., He, P., Chen, W., Zhou, M.: Diffusion-GAN: Training GANs with Diffusion. (2022). http:\/\/arxiv.org\/abs\/2206.02262"},{"key":"6045_CR63","unstructured":"Goodfellow, I.J., Courville, A., Bengio, Y.: Joint Training Deep Boltzmann Machines for Classification. (2013). http:\/\/arxiv.org\/abs\/1301.3568"},{"key":"6045_CR64","doi-asserted-by":"publisher","unstructured":"Kuremoto, T., Kimura, S., Kobayashi, K., Obayashi, M.: Time series forecasting using a deep belief network with restricted Boltzmann machines. Neurocomputing. 137, 47\u201356 (2014). https:\/\/doi.org\/10.1016\/J.NEUCOM.2013.03.047","DOI":"10.1016\/J.NEUCOM.2013.03.047"},{"issue":"6","key":"6045_CR65","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1109\/MSP.2012.2205597","volume":"29","author":"G Hinton","year":"2012","unstructured":"Hinton, G., et al.: Deep neural networks for acoustic modeling in speech recognition: The shared views of four research groups. IEEE Signal. Process. Mag. 29(6), 82\u201397 (2012). https:\/\/doi.org\/10.1109\/MSP.2012.2205597","journal-title":"IEEE Signal. Process. Mag"},{"key":"6045_CR66","doi-asserted-by":"publisher","unstructured":"Thies, J., Alimohammad, A.: Compact and Low-Power Neural Spike Compression Using Undercomplete Autoencoders. IEEE Trans. Neural Syst. Rehabil Eng. 27(8) (2019). https:\/\/doi.org\/10.1109\/TNSRE.2019.2929081","DOI":"10.1109\/TNSRE.2019.2929081"},{"key":"6045_CR67","doi-asserted-by":"publisher","unstructured":"Ibebuchi, C.C., Richman, M.B.: Deep learning with autoencoders and LSTM for ENSO forecasting. Clim. Dyn. 62(6), 5683\u20135697 (2024). https:\/\/doi.org\/10.1007\/s00382-024-07180-8","DOI":"10.1007\/s00382-024-07180-8"},{"key":"6045_CR68","doi-asserted-by":"publisher","unstructured":"Berahmand, K., Daneshfar, F., Salehi, E.S., Li, Y., Xu, Y.: Autoencoders and their applications in machine learning: a survey. no 2 Springer Neth. 57 (2024). https:\/\/doi.org\/10.1007\/s10462-023-10662-6","DOI":"10.1007\/s10462-023-10662-6"},{"key":"6045_CR69","doi-asserted-by":"publisher","unstructured":"Bourlard, H., Kabil, S.H.: Autoencoders reloaded, Biol Cybern. 116(4), 389\u2013406, (2022). https:\/\/doi.org\/10.1007\/s00422-022-00937-6","DOI":"10.1007\/s00422-022-00937-6"},{"key":"6045_CR70","doi-asserted-by":"publisher","unstructured":"Hussain, M.A., Saif-Ur-Rehman, M., Klaes, C., Iossifidis, I.: Comparison of Anomaly Detection between Statistical Method and Undercomplete Autoencoder, in ACM International Conference Proceeding Series, (2020). https:\/\/doi.org\/10.1145\/3404687.3404689","DOI":"10.1145\/3404687.3404689"},{"key":"6045_CR71","doi-asserted-by":"publisher","unstructured":"Delong, \u0141., Kozak, A.: The use of autoencoders for training neural networks with mixed categorical and numerical features. ASTIN Bulletin. 53(2), 213\u2013232 (2023). https:\/\/doi.org\/10.1017\/asb.2023.15","DOI":"10.1017\/asb.2023.15"},{"key":"6045_CR72","doi-asserted-by":"publisher","first-page":"361","DOI":"10.1146\/annurev-statistics-010814-020120","volume":"2","author":"R Salakhutdinov","year":"2015","unstructured":"Salakhutdinov, R., Models, L.D.G.: Annu. Rev. Stat. Appl. 2, 361\u2013385 (2015). https:\/\/doi.org\/10.1146\/annurev-statistics-010814-020120","journal-title":"Annu. Rev. Stat. Appl."},{"key":"6045_CR73","doi-asserted-by":"publisher","unstructured":"Iglesias, G., Talavera, E., D\u00edaz-\u00c1lvarez, A.: A survey on GANs for computer vision: Recent research, analysis and taxonomy, May 01, 2023, Elsevier Ireland Ltd. https:\/\/doi.org\/10.1016\/j.cosrev.2023.100553","DOI":"10.1016\/j.cosrev.2023.100553"},{"key":"6045_CR74","unstructured":"Gui, J., Sun, Z., Wen, Y., Tao, D., Ye, J.: A Review on Generative Adversarial Networks: Algorithms, Theory, and Applications. (2020). http:\/\/arxiv.org\/abs\/2001.06937"},{"key":"6045_CR75","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-024-18767-y","author":"P Sharma","year":"2024","unstructured":"Sharma, P., Kumar, M., Sharma, H.K., Biju, S.M.: Generative adversarial networks (GANs): Introduction, Taxonomy, Variants, Limitations, and Applications. Multimed Tools Appl. (2024). https:\/\/doi.org\/10.1007\/s11042-024-18767-y","journal-title":"Multimed Tools Appl."},{"key":"6045_CR76","doi-asserted-by":"publisher","unstructured":"Hooftman, D., Ziabari, S.S.M., Snijder, J.: Exploring CycleGAN for Bias Reduction in Gender Classification: Generative Modelling for Diversifying Data Augmentation. In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), pp. 26\u201340. Springer Science and Business Media Deutschland GmbH (2023). https:\/\/doi.org\/10.1007\/978-3-031-47665-5_3","DOI":"10.1007\/978-3-031-47665-5_3"},{"key":"6045_CR77","unstructured":"Brock, A., Donahue, J., Simonyan, K.: Large Scale GAN Training for High Fidelity Natural Image Synthesis. (2018). http:\/\/arxiv.org\/abs\/1809.11096"},{"key":"6045_CR78","unstructured":"Melnik, A., et al.: Face Generation and Editing with StyleGAN: A Survey"},{"key":"6045_CR79","unstructured":"Huang, L., Chen, L., Zhang, B., Chai, S.: A Transformer-based Generative Adversarial Network for Brain Tumor Segmentation."},{"key":"6045_CR80","unstructured":"Jiang, Y., Chang, S., Wang, Z.: TransGAN: Two Pure Transformers Can Make One Strong GAN, and That Can Scale Up. (2021). http:\/\/arxiv.org\/abs\/2102.07074"},{"key":"6045_CR81","unstructured":"Ho, J., Jain, A., Abbeel, P.: Denoising Diffusion Probabilistic Models, in Proc. NeurIPS, (2020)"},{"key":"6045_CR82","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-Resolution Image Synthesis with Latent Diffusion Models, in Proc. CVPR, (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"6045_CR83","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You Only Look Once: Unified, Real-Time Object Detection. (2015). http:\/\/arxiv.org\/abs\/1506.02640","DOI":"10.1109\/CVPR.2016.91"},{"key":"6045_CR84","doi-asserted-by":"crossref","unstructured":"Redmon, J., Farhadi, A.: YOLO9000: Better, Faster, Stronger. (2016). http:\/\/arxiv.org\/abs\/1612.08242","DOI":"10.1109\/CVPR.2017.690"},{"key":"6045_CR85","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_2","author":"W Liu","year":"2015","unstructured":"Liu, W., et al.: SSD: Single Shot MultiBox Detector. (2015). https:\/\/doi.org\/10.1007\/978-3-319-46448-0_2","journal-title":"Dec"},{"key":"6045_CR86","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-15-4288-6_1","author":"F Sultana","year":"2019","unstructured":"Sultana, F., Sufian, A., Dutta, P.: A Review of Object Detection Models based on Convolutional Neural Network. (2019). https:\/\/doi.org\/10.1007\/978-981-15-4288-6_1","journal-title":"May"},{"key":"6045_CR87","doi-asserted-by":"publisher","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation, Proceedings of the IEEE Computer Society Conference on Computer Vision and Pattern Recognition. 580\u2013587 (2014). https:\/\/doi.org\/10.1109\/CVPR.2014.81","DOI":"10.1109\/CVPR.2014.81"},{"key":"6045_CR88","doi-asserted-by":"publisher","first-page":"1440","DOI":"10.1109\/ICCV.2015.169","volume":"2015 Inter","author":"R Girshick","year":"2015","unstructured":"Girshick, R.: Fast, R.-C.N.N. Proc. IEEE Int. Conf. Comput. Vis. 2015 Inter, 1440\u20131448 (2015). https:\/\/doi.org\/10.1109\/ICCV.2015.169","journal-title":"Proc. IEEE Int. Conf. Comput. Vis."},{"key":"6045_CR89","unstructured":"Ren, S., He, K., Girshick, R., Sun, J., Faster, R.-C.N.N.: Towards Real-Time Object Detection with Region Proposal Networks. (2015). http:\/\/arxiv.org\/abs\/1506.01497"},{"key":"6045_CR90","doi-asserted-by":"publisher","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-net: Convolutional networks for biomedical image segmentation. In: Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics), pp. 234\u2013241. Springer (2015). https:\/\/doi.org\/10.1007\/978-3-319-24574-4_28","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"6045_CR91","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep Residual Learning for Image Recognition. Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR). 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"6045_CR92","first-page":"6105","volume":"97","author":"M Tan","year":"2019","unstructured":"Tan, M., Le, Q.V.: EfficientNet: Rethinking Model Scaling for Convolutional Neural Networks. ICML 2019. PMLR. 97, 6105\u20136114 (2019)","journal-title":"PMLR"},{"key":"6045_CR93","doi-asserted-by":"publisher","unstructured":"Lin, T.-Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature Pyramid Networks for Object Detection, in Proc. IEEE Conf. Computer Vision and Pattern Recognition (CVPR). 2117\u20132125, (2017). https:\/\/doi.org\/10.1109\/CVPR.2017.106","DOI":"10.1109\/CVPR.2017.106"}],"container-title":["Cluster Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10586-026-06045-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10586-026-06045-5","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10586-026-06045-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T20:30:43Z","timestamp":1774902643000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10586-026-06045-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,30]]},"references-count":93,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2026,8]]}},"alternative-id":["6045"],"URL":"https:\/\/doi.org\/10.1007\/s10586-026-06045-5","relation":{},"ISSN":["1386-7857","1573-7543"],"issn-type":[{"value":"1386-7857","type":"print"},{"value":"1573-7543","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,3,30]]},"assertion":[{"value":"9 June 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 October 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 February 2026","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 March 2026","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable. This survey relies exclusively on publicly available research publications and de-identified benchmark datasets and involves no human participants, animals, or personally identifiable information.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval"}},{"value":"The authors declare no competing interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"210"}}