{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T16:33:49Z","timestamp":1774974829565,"version":"3.50.1"},"reference-count":85,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T00:00:00Z","timestamp":1771632000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T00:00:00Z","timestamp":1771632000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100002858","name":"China Postdoctoral Science Foundation","doi-asserted-by":"crossref","award":["2025M771665"],"award-info":[{"award-number":["2025M771665"]}],"id":[{"id":"10.13039\/501100002858","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Research Project on the Communist Youth League in Hangzhou Schools","award":["hzxx25052"],"award-info":[{"award-number":["hzxx25052"]}]},{"DOI":"10.13039\/100022955","name":"Fundamental Research Funds for the Provincial Universities of Zhejiang","doi-asserted-by":"publisher","award":["230056"],"award-info":[{"award-number":["230056"]}],"id":[{"id":"10.13039\/100022955","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Scientific Research Fund of Zhejiang Provincial Education Department","award":["Y202557513"],"award-info":[{"award-number":["Y202557513"]}]},{"name":"Zhejiang Provincial Natural Science Foundation of China","award":["QN26F020075"],"award-info":[{"award-number":["QN26F020075"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Pattern Anal 
Applic"],"published-print":{"date-parts":[[2026,3]]},"DOI":"10.1007\/s10044-026-01637-8","type":"journal-article","created":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T09:43:28Z","timestamp":1771667008000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["TEN: A transformer-based efficient network for pneumonia diagnosis with chest x-rays"],"prefix":"10.1007","volume":"29","author":[{"given":"Yunxue","family":"Bao","sequence":"first","affiliation":[]},{"given":"Wenjun","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Lu","family":"Zhao","sequence":"additional","affiliation":[]},{"given":"Heng","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Zijun","family":"Zheng","sequence":"additional","affiliation":[]},{"given":"Laishui","family":"Lv","sequence":"additional","affiliation":[]},{"given":"Dalal","family":"Bardou","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,2,21]]},"reference":[{"key":"1637_CR1","unstructured":"Organization WH (2019) Pneumonia in children. Retrieved from https:\/\/www.who.int\/news-room\/fact-sheets\/detail\/pneumonia"},{"issue":"9","key":"1637_CR2","doi-asserted-by":"publisher","first-page":"835","DOI":"10.1056\/NEJMoa1405870","volume":"372","author":"S Jain","year":"2015","unstructured":"Jain S, Williams DJ, Arnold SR, Ampofo K, Bramley AM, Reed C, Stockmann C, Anderson EJ, Grijalva CG, Self WH et al (2015) Community-acquired pneumonia requiring hospitalization among us children. N Engl J Med 372(9):835\u2013845","journal-title":"N Engl J Med"},{"key":"1637_CR3","unstructured":"Simonyan K, Zisserman A (2015) Very deep convolutional networks for large-scale image recognition. 
In: International Conference on Learning Representations (ICLR)"},{"key":"1637_CR4","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"1637_CR5","doi-asserted-by":"crossref","unstructured":"Szegedy C, Liu W, Jia Y, Sermanet P, Reed S, Anguelov D, Erhan D, Vanhoucke V, Rabinovich A (2015) Going deeper with convolutions. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1\u20139","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"1637_CR6","doi-asserted-by":"crossref","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2014) Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 580\u2013587","DOI":"10.1109\/CVPR.2014.81"},{"key":"1637_CR7","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster r-cnn: towards real-time object detection with region proposal networks. In: Advances in Neural Information Processing Systems (NIPS), pp 91\u201399"},{"key":"1637_CR8","doi-asserted-by":"crossref","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 779\u2013788","DOI":"10.1109\/CVPR.2016.91"},{"key":"1637_CR9","first-page":"159","volume":"2","author":"R Wang","year":"2019","unstructured":"Wang R, Sun HD, Zhang JL, Zhao ZJ (2019) A transfer learning method for ct image classification of pulmonary nodules. WISATS 2:159\u2013166","journal-title":"WISATS"},{"key":"1637_CR10","unstructured":"Wang H, Zhang Y, Shen Y, Zhou J (2018) Chestx-ray14: a large-scale benchmark dataset for pneumonia recognition in chest x-rays. 
2018 IEEE 31st International Symposium on Computer-Based Medical Systems (CBMS), pp 244\u2013249"},{"key":"1637_CR11","doi-asserted-by":"crossref","unstructured":"Sori\u0107 M, Pongrac D, Inza I (2020) Using convolutional neural network for chest x-ray image classification. In: 2020 43rd International Convention on Information, Communication and Electronic Technology (MIPRO). IEEE, pp 1771\u20131776","DOI":"10.23919\/MIPRO48935.2020.9245376"},{"issue":"2","key":"1637_CR12","doi-asserted-by":"publisher","first-page":"2123","DOI":"10.1007\/s13369-021-06127-z","volume":"47","author":"E Ayan","year":"2022","unstructured":"Ayan E, Karabulut B, \u00dcnver HM (2022) Diagnosis of pediatric pneumonia with ensemble of deep convolutional neural networks in chest x-ray images. Arab J Sci Eng 47(2):2123\u20132139","journal-title":"Arab J Sci Eng"},{"key":"1637_CR13","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I (2017) Attention is all you need. Adv Neural Inform Process Syst 30 :1-11"},{"key":"1637_CR14","unstructured":"Dosovitskiy A, Beyer L, Kolesnikov A, Weissenborn D, Zhai X, Unterthiner T, Dehghani M, Minderer M, Heigold G, Gelly S et\u00a0al (2020) An image is worth 16x16 words: transformers for image recognition at scale. In: International Conference on Learning Representations"},{"key":"1637_CR15","doi-asserted-by":"crossref","unstructured":"Touvron H, Cord M, Douze M, Massa F, Sablayrolles A, Jegou H (2021) Training data-efficient image transformers and distillation through attention. In: ICML","DOI":"10.1109\/ICCV48922.2021.00010"},{"key":"1637_CR16","doi-asserted-by":"crossref","unstructured":"Touvron H, Cord M, Sablayrolles A, Synnaeve G and Jegou H (2021) Going deeper with image transformers. 
In: ICCV","DOI":"10.1109\/ICCV48922.2021.00010"},{"key":"1637_CR17","doi-asserted-by":"crossref","unstructured":"Liu Z, Lin Y, Cao Y, Hu H, Wei Y, Zhang Z, Lin S, Guo B (2021) Swin transformer: hierarchical vision transformer using shifted windows. IEEE","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"1637_CR18","unstructured":"Tay Y, Dehghani M, Bahri D, Metzler D (2020) Efficient transformers: a survey. arXiv preprint arXiv:2009.06732"},{"key":"1637_CR19","doi-asserted-by":"crossref","unstructured":"Cheng Y, Yu W (2024) Research on resnet34 improved model. In: 2024 9th International Conference on Intelligent Informatics and Biomedical Sciences (ICIIBMS), vol.\u00a09. IEEE, pp 11\u201314","DOI":"10.1109\/ICIIBMS62405.2024.10792749"},{"issue":"5","key":"1637_CR20","doi-asserted-by":"publisher","first-page":"1122","DOI":"10.1016\/j.cell.2018.02.010","volume":"172","author":"DS Kermany","year":"2018","unstructured":"Kermany DS, Goldbaum M, Cai W, Valentim CC, Liang H, Baxter SL, McKeown A, Yang G, Wu X, Yan F, Dong J, Prasadha MK, Pei J, Ting MY, Zhu J, Li C, Hewett S, Dong J, Ziyar I, Shi A, Zhang R, Zheng L, Hou R, Shi W, Fu X, Duan Y, Huu VA, Wen C, Zhang ED, Zhang CL, Li O, Wang X, Singer MA, Sun X, Xu J, Tafreshi A, Lewis MA, Xia H, Zhang K (2018) Identifying medical diagnoses and treatable diseases by image-based deep learning. Cell 172(5):1122-1131.e9","journal-title":"Cell"},{"key":"1637_CR21","doi-asserted-by":"crossref","unstructured":"Shinoda, R, Shiohara K (2024) Openanimaltracks: a dataset for animal track recognition. arXiv preprint arXiv:2406.09647","DOI":"10.1109\/ICIP51287.2024.10648043"},{"issue":"9","key":"1637_CR22","doi-asserted-by":"publisher","first-page":"5102","DOI":"10.1109\/TCSVT.2023.3249468","volume":"33","author":"C Tang","year":"2023","unstructured":"Tang C, Wang X, Bai Y, Wu Z, Zhang J, Huang Y (2023) Learning spatial-frequency transformer for visual object tracking. 
IEEE Trans Circ Syst Video Technol 33(9):5102\u20135116","journal-title":"IEEE Trans Circ Syst Video Technol"},{"key":"1637_CR23","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3633516","volume":"20","author":"J Bian","year":"2022","unstructured":"Bian J, Li X, Wang T, Wang Q, Huang J, Liu C, Zhao J, Lu F, Dou D, Xiong H (2022) P2anet: a large-scale benchmark for dense action detection from table tennis match broadcasting videos. ACM Trans Multimed Comput Commun Appl 20:1\u201323","journal-title":"ACM Trans Multimed Comput Commun Appl"},{"issue":"3","key":"1637_CR24","first-page":"2585","volume":"36","author":"Y Wang","year":"2022","unstructured":"Wang Y, Xu J, Sun Y (2022) End-to-end transformer based model for image captioning. Proc AAAI Conf Artif Intell 36(3):2585\u20132594","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"1637_CR25","doi-asserted-by":"crossref","unstructured":"Chen T, Jiang D, Li R (2022) Swin transformers make strong contextual encoders for vhr image road extraction. In: IGARSS 2022-2022 IEEE International Geoscience and Remote Sensing Symposium. IEEE, pp 3019\u20133022","DOI":"10.1109\/IGARSS46834.2022.9883628"},{"key":"1637_CR26","unstructured":"Yang Y-Q, Guo Y-X, Xiong J, Liu Y, Pan H, Wang P-S, Tong X, Guo B (2023) Swin3d: a pretrained transformer backbone for 3d indoor scene understanding ArXiv, arXiv:2304.06906"},{"key":"1637_CR27","unstructured":"Wei Y, Hu H, Xie Z, Zhang Z, Cao Y, Bao J, Chen D, Guo B (2022) Contrastive learning rivals masked image modeling in fine-tuning via feature distillation. arXiv preprint arXiv:2205.14141"},{"key":"1637_CR28","doi-asserted-by":"crossref","unstructured":"Hong S, Cho S, Nam J, Lin S, Kim S (2022) Cost aggregation with 4d convolutional swin transformer for few-shot segmentation. In: European Conference on Computer Vision. 
Springer, pp 108\u2013126","DOI":"10.1007\/978-3-031-19818-2_7"},{"key":"1637_CR29","doi-asserted-by":"publisher","first-page":"34 174","DOI":"10.1109\/ACCESS.2024.3371511","volume":"12","author":"MH Bijoy","year":"2024","unstructured":"Bijoy MH, Hasan N, Biswas M, Mazumdar S, Jimenez A, Ahmed F, Rasheduzzaman M, Momen S (2024) Towards sustainable agriculture: a novel approach for rice leaf disease detection using dcnn and enhanced dataset. IEEE Access 12:34 174-34 191","journal-title":"IEEE Access"},{"key":"1637_CR30","doi-asserted-by":"crossref","unstructured":"Wei Y, Hu H, Xie Z, Liu Z, Zhang Z, Cao Y, Bao J, Chen D, Guo B (2023) Improving clip fine-tuning performance. In: IEEE\/CVF International Conference on Computer Vision (ICCV) 2023:5416\u20135426","DOI":"10.1109\/ICCV51070.2023.00501"},{"issue":"12","key":"1637_CR31","doi-asserted-by":"publisher","first-page":"19 517","DOI":"10.1109\/JSEN.2024.3394956","volume":"24","author":"X Luo","year":"2024","unstructured":"Luo X, Luo S, Chen M, Zhao G, He C, Wu H (2024) Mbformer-yolo: multibranch adaptive spatial feature detection network for small infrared object detection. IEEE Sens J 24(12):19 517-19 530","journal-title":"IEEE Sens J"},{"key":"1637_CR32","unstructured":"Lee C-Y, Chien H-C, Wang C-P, Yen H, Zhen K-W, Lin H-K (2022) Using multi-scale swintransformer-htc with data augmentation in conic challenge. arXiv preprint arXiv:2202.13588"},{"key":"1637_CR33","doi-asserted-by":"crossref","unstructured":"Stegm\u00fcller T, Bozorgtabar B, Spahr A, Thiran J-P (2023) Scorenet: Learning non-uniform attention and augmentation for transformer-based histopathological image classification. 
In: Proceedings of the IEEE\/CVF winter Conference on applications of computer vision, pp 6170\u20136179","DOI":"10.1109\/WACV56688.2023.00611"},{"issue":"4","key":"1637_CR34","doi-asserted-by":"publisher","first-page":"2115","DOI":"10.1109\/JBHI.2024.3360239","volume":"28","author":"Z Xing","year":"2024","unstructured":"Xing Z, Zhu L, Yu L, Xing Z, Wan L (2024) Hybrid masked image modeling for 3d medical image segmentation. IEEE J Biomed Health Inform 28(4):2115\u20132125","journal-title":"IEEE J Biomed Health Inform"},{"key":"1637_CR35","doi-asserted-by":"crossref","unstructured":"Zou S, Liao F (2022) Automated segmentation of glands to facilitate quantitative analysis in cd138 whole slide images using a knet deep learning framework. In: International Conference on Frontiers of Artificial Intelligence and Machine Learning (FAIML) 2022:191\u2013195","DOI":"10.1109\/FAIML57028.2022.00044"},{"key":"1637_CR36","doi-asserted-by":"publisher","first-page":"129\u00a0240","DOI":"10.1109\/ACCESS.2023.3330379","volume":"11","author":"H Wang","year":"2023","unstructured":"Wang H, Yu K, Gao S, Li Q, Guan Q (2023) Skin disease segmentation method based on network feature aggregation module and edge enhanced attention mechanism. IEEE Access 11:129\u00a0240-129\u00a0246","journal-title":"IEEE Access"},{"key":"1637_CR37","doi-asserted-by":"crossref","unstructured":"Rasoulian A, Salari S, Xiao Y (2023) Weakly supervised intracranial hemorrhage segmentation using head-wise gradient-infused self-attention maps from a swin transformer in categorical learning. ArXiv, arXiv:2304.04902","DOI":"10.59275\/j.melba.2023-553a"},{"key":"1637_CR38","doi-asserted-by":"crossref","unstructured":"Heidari M, Kazerouni A, Kadarvish MS, Azad R, Aghdam EK, Cohen-Adad J, Merhof D (2022) Hiformer: hierarchical multi-scale representations using transformers for medical image segmentation. 
2023 IEEE\/CVF Winter Conference on Applications of Computer Vision (WACV), pp 6191\u20136201","DOI":"10.1109\/WACV56688.2023.00614"},{"key":"1637_CR39","unstructured":"Jafari H, Faez K, Amindavar H (2023) Swin-tempo: temporal-aware lung nodule detection in ct scans as video sequences using swin transformer-enhanced unet. ArXiv, arXiv:2310.03365"},{"key":"1637_CR40","doi-asserted-by":"crossref","unstructured":"Tragakis A, Kaul C, Murray-Smith R, Husmeier D (2023) The fully convolutional transformer for medical image segmentation. In: Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp 3660\u20133669","DOI":"10.1109\/WACV56688.2023.00365"},{"key":"1637_CR41","doi-asserted-by":"crossref","unstructured":"Roy S, Koehler G, Ulrich C, Baumgartner M, Petersen J, Isensee F, Jaeger PF, Maier-Hein KH (2023) Mednext: transformer-driven scaling of convnets for medical image segmentation. In: International Conference on Medical Image Computing and Computer-Assisted Intervention. Springer, pp 405\u2013415","DOI":"10.1007\/978-3-031-43901-8_39"},{"key":"1637_CR42","doi-asserted-by":"crossref","unstructured":"Chowdary GJ, Yin Z (2024) Med-former: a transformer based architecture for medical image classification. In: International conference on medical image computing and computer-assisted intervention. Springer, pp 448\u2013457","DOI":"10.1007\/978-3-031-72120-5_42"},{"issue":"6","key":"1637_CR43","first-page":"6030","volume":"38","author":"J Wu","year":"2024","unstructured":"Wu J, Ji W, Fu H, Xu M, Jin Y, Xu Y (2024) Medsegdiff-v2: diffusion-based medical image segmentation with transformer. Proc AAAI Conf Artif Intell 38(6):6030\u20136038","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"1637_CR44","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2025.110099","volume":"123","author":"S Kumar","year":"2025","unstructured":"Kumar S (2025) Advancements in medical image segmentation: a review of transformer models. 
Comput Electr Eng 123:110099","journal-title":"Comput Electr Eng"},{"key":"1637_CR45","unstructured":"Hinton G, Vinyals O, Dean J (2015) Distilling the knowledge in a neural network. arXiv preprint arXiv:1503.02531"},{"key":"1637_CR46","first-page":"3830","volume":"35","author":"X-C Li","year":"2022","unstructured":"Li X-C, Fan W-S, Song S, Li Y, Yunfeng S, Zhan D-C et al (2022) Asymmetric temperature scaling makes larger networks teach well again. Adv Neural Inf Process Syst 35:3830\u20133842","journal-title":"Adv Neural Inf Process Syst"},{"key":"1637_CR47","doi-asserted-by":"crossref","unstructured":"Fan S, Cheng X, Wang X, Yang C, Deng P, Liu M, Deng J, Liu M (2022) Channel self-supervision for online knowledge distillation. arXiv preprint arXiv:2203.11660","DOI":"10.1109\/ICCC56324.2022.10065706"},{"key":"1637_CR48","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2022.102693","volume":"84","author":"Y Wang","year":"2023","unstructured":"Wang Y, Wang Y, Cai J, Lee TK, Miao C, Wang ZJ (2023) Ssd-kd: a self-supervised diverse knowledge distillation method for lightweight skin lesion classification using dermoscopic images. Med Image Anal 84:102693","journal-title":"Med Image Anal"},{"key":"1637_CR49","unstructured":"Loussaief EB, Rashwan H, Ayad M, Hassan MZ, Puig D (2023) Knowledge distillation for adaptive mri prostate segmentation based on limit-trained multi-teacher models. arXiv preprint arXiv:2303.09494"},{"key":"1637_CR50","unstructured":"Lichtarge J, Amid E, Kumar S, Yang T-J, Anil R, Mathews R (2023) Heterogeneous federated learning using knowledge codistillation. arXiv preprint arXiv:2310.02549"},{"key":"1637_CR51","unstructured":"Vuong TTL, Kwak JT (2023) Moma: Momentum contrastive learning with multi-head attention-based knowledge distillation for histopathology image analysis. 
arXiv preprint arXiv:2308.16561"},{"key":"1637_CR52","unstructured":"Gammulle H, Chen Y, Sridharan S, Klein T, Fookes C (2023) Learning through guidance: Knowledge distillation for endoscopic image classification. arXiv preprint arXiv:2308.08731"},{"key":"1637_CR53","unstructured":"Nabavi S, Anvari K, Moghaddam ME, Abin AA, Frangi AF (2024) Multiple teachers-meticulous student: a domain adaptive meta-knowledge distillation model for medical image classification. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR). IEEE, pp 12\u00a0345\u201312\u00a0356"},{"key":"1637_CR54","unstructured":"Kusiak A (2000) Data mining: medical and engineering case studies. In Industrial Engineering Research Conference. pp. 1-7 ."},{"key":"1637_CR55","doi-asserted-by":"publisher","first-page":"80","DOI":"10.1016\/j.procs.2016.07.027","volume":"90","author":"H Alahmer","year":"2016","unstructured":"Alahmer H, Ahmed A (2016) Computer-aided classification of liver lesions from ct images based on multiple roi. Procedia Comput Sci 90:80\u201386","journal-title":"Procedia Comput Sci"},{"key":"1637_CR56","doi-asserted-by":"publisher","first-page":"4135","DOI":"10.1007\/s12652-019-01173-w","volume":"10","author":"F Shaukat","year":"2019","unstructured":"Shaukat F, Raja G, Ashraf R, Khalid S, Ahmad M, Ali A (2019) Artificial neural network based classification of lung nodules in ct images using intensity, shape and texture features. J Ambient Intell Humaniz Comput 10:4135\u20134149","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"1637_CR57","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Doll\u00e1r P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature pyramid networks for object detection. 
2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp 936\u2013944","DOI":"10.1109\/CVPR.2017.106"},{"key":"1637_CR58","doi-asserted-by":"publisher","first-page":"318","DOI":"10.1109\/TPAMI.2018.2858826","volume":"42","author":"T-Y Lin","year":"2017","unstructured":"Lin T-Y, Goyal P, Girshick R, He K, Doll\u00e1r P (2017) Focal loss for dense object detection. IEEE Trans Pattern Anal Mach Intell 42:318\u2013327","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1637_CR59","doi-asserted-by":"publisher","DOI":"10.1016\/j.cmpb.2019.06.023","volume":"187","author":"G Liang","year":"2020","unstructured":"Liang G, Zheng L (2020) A transfer learning method with deep residual network for pediatric pneumonia diagnosis. Comput Methods Programs Biomed 187:104964","journal-title":"Comput Methods Programs Biomed"},{"key":"1637_CR60","doi-asserted-by":"crossref","unstructured":"Liu Z, Lin Y, Cao Y, Hu H, Wei Y, Zhang Z, Lin S, Guo B (2021) Swin transformer: hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 10\u00a0012\u201310\u00a0022","DOI":"10.1109\/ICCV48922.2021.00986"},{"issue":"2","key":"1637_CR61","doi-asserted-by":"publisher","first-page":"114","DOI":"10.5391\/IJFIS.2024.24.2.114","volume":"24","author":"S-H Choi","year":"2024","unstructured":"Choi S-H (2024) Scale correction cascade smooth loss in gans to improve model performance. Int J Fuzzy Logic Intell Syst 24(2):114\u2013124","journal-title":"Int J Fuzzy Logic Intell Syst"},{"issue":"1","key":"1637_CR62","doi-asserted-by":"publisher","first-page":"769","DOI":"10.1007\/s10489-022-03479-3","volume":"53","author":"Z Zheng","year":"2023","unstructured":"Zheng Z, Feng X, Yu H, Li X, Gao M (2023) Bdla: Bi-directional local alignment for few-shot learning. 
Appl Intell 53(1):769\u2013785","journal-title":"Appl Intell"},{"issue":"2","key":"1637_CR63","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11227-024-06886-0","volume":"81","author":"H Wu","year":"2025","unstructured":"Wu H, Zheng Z, Lv L, Zhang C, Bardou D, Niu S, Yu G (2025) Dara: distribution-aware representation alignment for semi-supervised domain adaptation in image classification. J Supercomput 81(2):1\u201337","journal-title":"J Supercomput"},{"key":"1637_CR64","doi-asserted-by":"publisher","first-page":"208","DOI":"10.1016\/j.neucom.2021.10.075","volume":"471","author":"Z Zheng","year":"2022","unstructured":"Zheng Z, Feng X, Yu H, Gao M (2022) Cooperative density-aware representation learning for few-shot visual recognition. Neurocomputing 471:208\u2013218","journal-title":"Neurocomputing"},{"key":"1637_CR65","doi-asserted-by":"crossref","unstructured":"Wu H, Zheng Z, Wang H, Wang W, Yang Z (2025) Few-shot incremental learning with context-aware spatial enhancement for image recognition. IEEE Access 13: 110569-110583","DOI":"10.1109\/ACCESS.2025.3579766"},{"key":"1637_CR66","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2023.110412","volume":"266","author":"Z Zheng","year":"2023","unstructured":"Zheng Z, Wu H, Lv L, Ye H, Zhang C, Yu G (2023) Iccl: Independent and correlative correspondence learning for few-shot image classification. Knowl-Based Syst 266:110412","journal-title":"Knowl-Based Syst"},{"issue":"742","key":"1637_CR67","first-page":"1573","volume":"55","author":"H Wu","year":"2025","unstructured":"Wu H, Zheng Z, Lv L, Zhang C, Xu Y, Bardou D, Niu S, Yu G (2025) Clcfe: complementary loss coupling for feature-enhanced few-shot fine-grained visual recognition. 
Appl Intell 55(742):1573\u20137497","journal-title":"Appl Intell"},{"issue":"7","key":"1637_CR68","doi-asserted-by":"publisher","first-page":"7833","DOI":"10.1007\/s10489-022-03750-7","volume":"53","author":"Z Zheng","year":"2023","unstructured":"Zheng Z, Feng X, Yu H, Li X, Gao M (2023) Unsupervised few-shot image classification via one-vs-all contrastive learning. Appl Intell 53(7):7833\u20137847","journal-title":"Appl Intell"},{"issue":"1","key":"1637_CR69","doi-asserted-by":"publisher","first-page":"21903","DOI":"10.1038\/s41598-025-08323-5","volume":"15","author":"H Wu","year":"2025","unstructured":"Wu H, Zheng Z, Lv L, Xu Y, Bardou D, Niu S, Yu G, Wang Y (2025) A spatially aware global and local perspective approach for few-shot incremental learning. Sci Rep 15(1):21903","journal-title":"Sci Rep"},{"key":"1637_CR70","doi-asserted-by":"crossref","unstructured":"Zheng Z, Wu H, Lv L, Zhang C, Guo H, Niu S, Yu G (2025) Multi-branch semantic alignment for few-shot image classification. Inf Sci 723:122676","DOI":"10.1016\/j.ins.2025.122676"},{"key":"1637_CR71","doi-asserted-by":"crossref","unstructured":"Zheng Z, Wu H, Wang J, Lv L, Bardou D, Yu G (2025) Vlca: Vision-language feature enhancement with cross-attention learning for facial expression recognition. Expert Syst Appl 130292","DOI":"10.1016\/j.eswa.2025.130292"},{"key":"1637_CR72","doi-asserted-by":"crossref","unstructured":"Wu H, Zheng Z, Lv L, Yan Z, Niu S, Yu G (2024) Vlce: unified vision-language collaborative enhancement for facial expression recognition. In: 2024 5th International Conference on Computers and Artificial Intelligence Technology (CAIT). IEEE, pp 94\u201399","DOI":"10.1109\/CAIT64506.2024.10963325"},{"key":"1637_CR73","doi-asserted-by":"crossref","unstructured":"Zheng Z, Zhu Y, Wu H, Lv L, Yu G, Niu S (2024) Cross-domain few-shot chest x-ray recognition. In: 2024 5th International Conference on Computers and Artificial Intelligence Technology (CAIT). 
IEEE, pp 224\u2013229","DOI":"10.1109\/CAIT64506.2024.10963262"},{"key":"1637_CR74","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.neucom.2022.11.073","volume":"520","author":"H Wu","year":"2023","unstructured":"Wu H, Zhao Y, Li J (2023) Invariant and consistent: unsupervised representation learning for few-shot visual recognition. Neurocomputing 520:1\u201314","journal-title":"Neurocomputing"},{"issue":"8","key":"1637_CR75","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11227-025-07409-1","volume":"81","author":"Z Zheng","year":"2025","unstructured":"Zheng Z, Wu H, Lv L, Bardou D, Niu S, Yu G (2025) Merge: multimodal-enhanced representation and guided ensemble for pneumonia recognition in chest x-ray images. J Supercomput 81(8):1\u201325","journal-title":"J Supercomput"},{"key":"1637_CR76","doi-asserted-by":"crossref","unstructured":"Zheng Z, Zhu Y, Wu H, Lv L, Niu S, Yu G (2025) Sge: semantic-guided generalization enhancement for few-shot learning. Knowl-Based Syst 323: 113761","DOI":"10.1016\/j.knosys.2025.113761"},{"key":"1637_CR77","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2025.105662","volume":"162","author":"Y Cui","year":"2025","unstructured":"Cui Y, Liu J, Teng Z, Yang S, Li H, Li P, Lu J, Gao Y, Peng Y, Han H, Fu W (2025) Multi-scale feature fusion with task-specific data synthesis for pneumonia pathogen classification. Image Vis Comput 162:105662","journal-title":"Image Vis Comput"},{"key":"1637_CR78","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2020.101794","volume":"65","author":"S Minaee","year":"2020","unstructured":"Minaee S, Kafieh R, Sonka M, Yazdani S, Jamalipour Soufi G (2020) Deep-covid: Predicting covid-19 from chest x-ray images using deep transfer learning. Med Image Anal 65:101794","journal-title":"Med Image Anal"},{"key":"1637_CR79","unstructured":"Mehta S, Rastegari M (2021) Mobilevit: light-weight, general-purpose, and mobile-friendly vision transformer. 
ArXiv, arXiv:2110.02178"},{"key":"1637_CR80","doi-asserted-by":"crossref","unstructured":"Bao Y, Wang W, Zhao L, Zheng Z, Wu H, Yu G, Lv L (2024) E2cl: an efficient and effective classification learning for pneumonia detection in chest x-rays. In: 2024 5th International Conference on Computers and Artificial Intelligence Technology (CAIT). IEEE, pp 35\u201340","DOI":"10.1109\/CAIT64506.2024.10962855"},{"key":"1637_CR81","doi-asserted-by":"publisher","first-page":"559","DOI":"10.3390\/app10020559","volume":"10","author":"V Chouhan","year":"2020","unstructured":"Chouhan V (2020) A novel transfer learning based approach for pneumonia detection in chest x-ray images. Appl Sci 10:559","journal-title":"Appl Sci"},{"key":"1637_CR82","unstructured":"Xu Y, Xie L, Zhang X, Chen X, Qi G-J, Tian Q, Xiong H (2019) Pc-darts: partial channel connections for memory-efficient architecture search. arXiv preprint arXiv:1907.05737"},{"key":"1637_CR83","unstructured":"Liu H, Simonyan K, Yang Y (2019) Darts: differentiable architecture search. arXiv preprint arXiv:1806.09055"},{"key":"1637_CR84","doi-asserted-by":"crossref","unstructured":"Padigela J, Akula P, Balla SS, K S (2023) Comparison of data augmentation techniques for training cnns to detect pneumonia from chest x-ray images. In: 2023 International Conference on Computational Intelligence for Information, Security and Communication Applications (CIISCA)","DOI":"10.1109\/CIISCA59740.2023.00017"},{"key":"1637_CR85","doi-asserted-by":"crossref","unstructured":"Fang J, Xie L, Wang X, Zhang X, Liu W, Tian Q (2022) Msg-transformer: exchanging local spatial information by manipulating messenger tokens. 
In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition pp 12\u00a0063\u201312\u00a0072D","DOI":"10.1109\/CVPR52688.2022.01175"}],"container-title":["Pattern Analysis and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-026-01637-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10044-026-01637-8","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-026-01637-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T10:38:54Z","timestamp":1773484734000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10044-026-01637-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,21]]},"references-count":85,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,3]]}},"alternative-id":["1637"],"URL":"https:\/\/doi.org\/10.1007\/s10044-026-01637-8","relation":{},"ISSN":["1433-7541","1433-755X"],"issn-type":[{"value":"1433-7541","type":"print"},{"value":"1433-755X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,21]]},"assertion":[{"value":"6 October 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 February 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no conflict of 
interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"53"}}