{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,27]],"date-time":"2025-12-27T03:23:51Z","timestamp":1766805831785},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"18","license":[{"start":{"date-parts":[[2023,6,17]],"date-time":"2023-06-17T00:00:00Z","timestamp":1686960000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,6,17]],"date-time":"2023-06-17T00:00:00Z","timestamp":1686960000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Supercomput"],"published-print":{"date-parts":[[2023,12]]},"DOI":"10.1007\/s11227-023-05448-0","type":"journal-article","created":{"date-parts":[[2023,6,17]],"date-time":"2023-06-17T04:02:13Z","timestamp":1686974533000},"page":"20899-20922","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Improving generalization in deep neural network using knowledge transformation based on fisher criterion"],"prefix":"10.1007","volume":"79","author":[{"given":"Sajedeh","family":"Morabbi","sequence":"first","affiliation":[]},{"given":"Hadi","family":"Soltanizadeh","sequence":"additional","affiliation":[]},{"given":"Saeed","family":"Mozaffari","sequence":"additional","affiliation":[]},{"given":"Mohammad Javad","family":"Fadaeieslam","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,6,17]]},"reference":[{"key":"5448_CR1","doi-asserted-by":"publisher","DOI":"10.1016\/j.displa.2022.102277","author":"AS Hashemi","year":"2022","unstructured":"Hashemi AS, Mozaffari S, Alirezaee S (2022) Improving adversarial robustness of traffic sign image recognition networks. Displays. https:\/\/doi.org\/10.1016\/j.displa.2022.102277","journal-title":"Displays"},{"key":"5448_CR2","doi-asserted-by":"publisher","first-page":"2850","DOI":"10.1007\/s10489-020-02055-x","volume":"51","author":"C Sitaula","year":"2021","unstructured":"Sitaula C, Hossain MB (2021) Attention-based VGG-16 model for COVID-19 chest X-ray image classification. Appl Intell 51:2850\u20132863. https:\/\/doi.org\/10.1007\/s10489-020-02055-x","journal-title":"Appl Intell"},{"key":"5448_CR3","doi-asserted-by":"publisher","first-page":"1869","DOI":"10.1007\/s00371-019-01775-7","volume":"36","author":"P Xi","year":"2020","unstructured":"Xi P, Guan H, Shu C et al (2020) An integrated approach for medical abnormality detection using deep patch convolutional neural networks. Vis Comput 36:1869\u20131882. https:\/\/doi.org\/10.1007\/s00371-019-01775-7","journal-title":"Vis Comput"},{"key":"5448_CR4","doi-asserted-by":"publisher","first-page":"123649","DOI":"10.1109\/ACCESS.2020.3005687","volume":"8","author":"B Jin","year":"2020","unstructured":"Jin B, Cruz L, Gon\u00e7alves N (2020) Deep facial diagnosis: deep transfer learning from face recognition to facial diagnosis. IEEE Access 8:123649\u2013123661","journal-title":"IEEE Access"},{"key":"5448_CR5","doi-asserted-by":"publisher","first-page":"21719","DOI":"10.1007\/s11042-022-12445-7","volume":"81","author":"A Khosravanian","year":"2022","unstructured":"Khosravanian A, Rahmanimanesh M, Keshavarzi P et al (2022) Level set method for automated 3D brain tumor segmentation using symmetry analysis and kernel induced fuzzy clustering. Multimed Tools Appl 81:21719\u201321740. https:\/\/doi.org\/10.1007\/s11042-022-12445-7","journal-title":"Multimed Tools Appl"},{"key":"5448_CR6","doi-asserted-by":"publisher","first-page":"16353","DOI":"10.1007\/s10489-022-03384-9","volume":"52","author":"JL Wu","year":"2022","unstructured":"Wu JL, Chung WY (2022) Sentiment-based masked language modeling for improving sentence-level valence\u2013arousal prediction. Appl Intell 52:16353\u201316369. https:\/\/doi.org\/10.1007\/s10489-022-03384-9","journal-title":"Appl Intell"},{"key":"5448_CR7","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1148\/radiol.2020192224","volume":"295","author":"MJ Willemink","year":"2020","unstructured":"Willemink MJ, Koszek WA, Hardell C et al (2020) Preparing medical imaging data for machine learning. Radiology 295:4\u201315. https:\/\/doi.org\/10.1148\/radiol.2020192224","journal-title":"Radiology"},{"key":"5448_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.infsof.2021.106566","author":"L Ghadhab","year":"2021","unstructured":"Ghadhab L, Jenhani I, Mkaouer MW, Ben Messaoud M (2021) Augmenting commit classification by using fine-grained source code changes and a pre-trained deep neural language model. Inf Softw Technol. https:\/\/doi.org\/10.1016\/j.infsof.2021.106566","journal-title":"Inf Softw Technol"},{"key":"5448_CR9","doi-asserted-by":"publisher","first-page":"7723","DOI":"10.1007\/s00521-020-05514-1","volume":"33","author":"Q Zheng","year":"2021","unstructured":"Zheng Q, Zhao P, Li Y et al (2021) Spectrum interference-based two-level data augmentation method in deep learning for automatic modulation classification. Neural Comput Appl 33:7723\u20137745. https:\/\/doi.org\/10.1007\/s00521-020-05514-1","journal-title":"Neural Comput Appl"},{"key":"5448_CR10","unstructured":"Pang T, Xu K, Dong Y, et al (2019) Rethinking softmax cross-entropy loss for adversarial robustness"},{"key":"5448_CR11","volume-title":"Deep learning","author":"I Goodfellow","year":"2016","unstructured":"Goodfellow I, Bengio Y, Courville A (2016) Deep learning. MIT press"},{"key":"5448_CR12","doi-asserted-by":"publisher","DOI":"10.1017\/9781009025096.003","author":"K Kawaguchi","year":"2022","unstructured":"Kawaguchi K, Bengio Y, Kaelbling L (2022) Generalization in deep learning. Math Asp Deep Learn. https:\/\/doi.org\/10.1017\/9781009025096.003","journal-title":"Math Asp Deep Learn"},{"key":"5448_CR13","doi-asserted-by":"publisher","unstructured":"Gong C, Ren T, Ye M, Liu Q (2021) MaxUp: lightweight adversarial training with data augmentation improves neural network training. In: Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit 2474\u20132483https:\/\/doi.org\/10.1109\/CVPR46437.2021.00250","DOI":"10.1109\/CVPR46437.2021.00250"},{"key":"5448_CR14","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1007\/978-981-16-3357-7_9","volume":"3","author":"MG Sarwar Murshed","year":"2022","unstructured":"Sarwar Murshed MG, Carroll JJ, Khan N, Hussain F (2022) Efficient deployment of deep learning models on autonomous robots in the ROS environment. Deep Learn Appl 3:215\u2013243. https:\/\/doi.org\/10.1007\/978-981-16-3357-7_9","journal-title":"Deep Learn Appl"},{"key":"5448_CR15","first-page":"6906","volume":"9","author":"S Stanton","year":"2021","unstructured":"Stanton S, Izmailov P, Kirichenko P et al (2021) Does knowledge distillation really work? Adv Neural Inf Process Syst 9:6906\u20136919","journal-title":"Adv Neural Inf Process Syst"},{"key":"5448_CR16","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/3446776","volume":"64","author":"C Zhang","year":"2021","unstructured":"Zhang C, Bengio S, Hardt M et al (2021) Understanding deep learning (still) requires rethinking generalization. Commun ACM 64:107\u2013115. https:\/\/doi.org\/10.1145\/3446776","journal-title":"Commun ACM"},{"key":"5448_CR17","unstructured":"Oymak S, Soltanolkotabi M (2019) Overparameterized nonlinear learning: Gradient descent takes the shortest path? In: 36th Int Conf Mach Learn ICML 2019 2019-June:8707\u20138747"},{"key":"5448_CR18","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-023-01792-z","author":"J Gou","year":"2023","unstructured":"Gou J, Xiong X, Yu B et al (2023) Multi-target knowledge distillation via student self-reflection. Int J Comput Vis. https:\/\/doi.org\/10.1007\/s11263-023-01792-z","journal-title":"Int J Comput Vis"},{"key":"5448_CR19","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1016\/j.compind.2019.02.003","volume":"108","author":"S Coulibaly","year":"2019","unstructured":"Coulibaly S, Kamsu-Foguem B, Kamissoko D, Traore D (2019) Deep neural networks with transfer learning in millet crop images. Comput Ind 108:115\u2013120. https:\/\/doi.org\/10.1016\/j.compind.2019.02.003","journal-title":"Comput Ind"},{"key":"5448_CR20","unstructured":"Hinton G, Vinyals O, Dean J (2015) Distilling the knowledge in a neural network"},{"key":"5448_CR21","doi-asserted-by":"publisher","first-page":"7204","DOI":"10.1002\/int.22586","volume":"36","author":"Q Zheng","year":"2021","unstructured":"Zheng Q, Zhao P, Zhang D, Wang H (2021) MR-DCAE: manifold regularization-based deep convolutional autoencoder for unauthorized broadcasting identification. Int J Intell Syst 36:7204\u20137238. https:\/\/doi.org\/10.1002\/int.22586","journal-title":"Int J Intell Syst"},{"key":"5448_CR22","doi-asserted-by":"publisher","first-page":"1298","DOI":"10.1109\/LCOMM.2022.3145647","volume":"26","author":"Q Zheng","year":"2022","unstructured":"Zheng Q, Zhao P, Wang H et al (2022) Fine-grained modulation classification using multi-scale radio transformer with dual-channel representation. IEEE Commun Lett 26:1298\u20131302. https:\/\/doi.org\/10.1109\/LCOMM.2022.3145647","journal-title":"IEEE Commun Lett"},{"key":"5448_CR23","first-page":"2654","volume":"3","author":"LJ Ba","year":"2014","unstructured":"Ba LJ, Caruana R (2014) Do deep nets really need to be deep? Adv Neural Inf Process Syst 3:2654\u20132662","journal-title":"Adv Neural Inf Process Syst"},{"key":"5448_CR24","doi-asserted-by":"publisher","DOI":"10.3389\/fneur.2017.00715","author":"J Zhang","year":"2017","unstructured":"Zhang J (2017) Multivariate analysis and machine learning in cerebral palsy research. Front Neurol. https:\/\/doi.org\/10.3389\/fneur.2017.00715","journal-title":"Front Neurol"},{"key":"5448_CR25","unstructured":"Krizhevsky A (2009) Learning multiple layers of features from tiny images. In: \u2026 Sci Dep Univ Toronto, Tech \u2026 1\u201360"},{"key":"5448_CR26","unstructured":"Le Y, Yang X (2015) Tiny imagenet visual recognition challenge. Stanford CS231N"},{"key":"5448_CR27","first-page":"1","volume":"2019","author":"B Neyshabur","year":"2018","unstructured":"Neyshabur B, Li Z, Bhojanapalli S et al (2018) Towards Understanding the role of over-parametrization in generalization of neural networks. Iclr 2019:1\u201320","journal-title":"Iclr"},{"key":"5448_CR28","doi-asserted-by":"publisher","first-page":"793","DOI":"10.1007\/s11045-019-00686-z","volume":"31","author":"Q Zheng","year":"2020","unstructured":"Zheng Q, Tian X, Yang M et al (2020) PAC-Bayesian framework based drop-path method for 2D discriminative convolutional network pruning. Multidimens Syst Signal Process 31:793\u2013827. https:\/\/doi.org\/10.1007\/s11045-019-00686-z","journal-title":"Multidimens Syst Signal Process"},{"key":"5448_CR29","unstructured":"Simonyan K, Zisserman A (2015) Very deep convolutional networks for large-scale image recognition. In: 3rd Int Conf Learn Represent ICLR 2015\u2014Conf Track Proc 14"},{"key":"5448_CR30","doi-asserted-by":"publisher","unstructured":"Ahn S, Hu SX, Damianou A, et al (2019) Variational information distillation for knowledge transfer. In: Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit. 2019-June: 9155\u20139163. https:\/\/doi.org\/10.1109\/CVPR.2019.00938","DOI":"10.1109\/CVPR.2019.00938"},{"key":"5448_CR31","doi-asserted-by":"publisher","unstructured":"Guo Q, Wang X, Wu Y, et al (2020) Online knowledge distillation via collaborative learning. In: Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit. p 11017\u201311026. https:\/\/doi.org\/10.1109\/CVPR42600.2020.01103","DOI":"10.1109\/CVPR42600.2020.01103"},{"key":"5448_CR32","doi-asserted-by":"publisher","unstructured":"Chen D, Mei JP, Wang C, et al (2020) Online knowledge distillation with diverse peers. In: AAAI 2020\u201434th AAAI Conference on Artificial Intelligence. p 3430\u20133437. https:\/\/doi.org\/10.1609\/aaai.v34i04.5746","DOI":"10.1609\/aaai.v34i04.5746"},{"key":"5448_CR33","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1016\/j.neucom.2021.04.102","volume":"454","author":"T Wen","year":"2021","unstructured":"Wen T, Lai S, Qian X (2021) Preparing lessons: Improve knowledge distillation with better supervision. Neurocomputing 454:25\u201333. https:\/\/doi.org\/10.1016\/j.neucom.2021.04.102","journal-title":"Neurocomputing"},{"key":"5448_CR34","doi-asserted-by":"publisher","unstructured":"Yun S, Park J, Lee K, Shin J (2020) Regularizing class-wise predictions via self-knowledge distillation. Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit 13873\u201313882. DOI: https:\/\/doi.org\/10.1109\/CVPR42600.2020.01389","DOI":"10.1109\/CVPR42600.2020.01389"},{"key":"5448_CR35","doi-asserted-by":"publisher","first-page":"104709","DOI":"10.1016\/j.bspc.2023.104709","volume":"84","author":"S Zhou","year":"2023","unstructured":"Zhou S, Tian S, Yu L et al (2023) FixMatch-LS: semi-supervised skin lesion classification with label smoothing. Biomed Signal Process Control 84:104709. https:\/\/doi.org\/10.1016\/j.bspc.2023.104709","journal-title":"Biomed Signal Process Control"},{"key":"5448_CR36","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2022.108846","author":"Y Cao","year":"2022","unstructured":"Cao Y, Wan Q, Shen W, Gao L (2022) Informative knowledge distillation for image anomaly segmentation. Knowledge-Based Syst. https:\/\/doi.org\/10.1016\/j.knosys.2022.108846","journal-title":"Knowledge-Based Syst"},{"key":"5448_CR37","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2022.110143","author":"S Suh","year":"2023","unstructured":"Suh S, Rey VFLP (2023) Transformer-based adversarial learning for human activity recognition using wearable sensors via self-knowledge distillation. Knowledge-Based Syst. https:\/\/doi.org\/10.1016\/j.knosys.2022.110143","journal-title":"Knowledge-Based Syst"},{"key":"5448_CR38","doi-asserted-by":"crossref","unstructured":"Zheng Z PX (2022) Self-guidance: improve deep neural network generalization via knowledge distillation. In: Proc IEEE\/CVF Winter Conf Appl Comput Vis. p 3203\u20133212","DOI":"10.1109\/WACV51458.2022.00351"},{"key":"5448_CR39","doi-asserted-by":"publisher","first-page":"5093","DOI":"10.1016\/j.procs.2021.09.287","volume":"192","author":"O Moutik","year":"2021","unstructured":"Moutik O, Tigani S, Saadane RCA (2021) Hybrid deep learning vision-based models for human object interaction detection by knowledge distillation. Proc Comput Sci 192:5093\u20135103","journal-title":"Proc Comput Sci"},{"key":"5448_CR40","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2021.103341","author":"W Wu","year":"2022","unstructured":"Wu W, Zhou K, Chen XD, Yong JH (2022) Light-weight shadow detection via GCN-based annotation strategy and knowledge distillation. Comput Vis Image Underst. https:\/\/doi.org\/10.1016\/j.cviu.2021.103341","journal-title":"Comput Vis Image Underst"},{"key":"5448_CR41","unstructured":"Zhu X, Gong S, others (2018) Knowledge distillation by on-the-fly native ensemble. Adv Neural Inf Process Syst. p 7517\u20137527"},{"key":"5448_CR42","doi-asserted-by":"crossref","unstructured":"Qing H, Tang J, Yang X, Huang X, Zhu HJN (2022) Stimulates potential for knowledge distillation. In: Artificial Neural Networks and Machine Learning. Artif Neural Networks Mach Learn 31st Int Conf Artif Neural Networks. p 187\u2013198","DOI":"10.1007\/978-3-031-15937-4_16"},{"key":"5448_CR43","doi-asserted-by":"publisher","first-page":"103632","DOI":"10.1016\/j.cviu.2023.103632","volume":"18","author":"DL Borza","year":"2023","unstructured":"Borza DL, Ileni TA, Marinescu AIDS (2023) Teacher or supervisor? Effective online knowledge distillation via guided collaborative learning. Comput Vis Image Underst 18:103632","journal-title":"Comput Vis Image Underst"},{"key":"5448_CR44","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2023.01.063","author":"S Zhang","year":"2023","unstructured":"Zhang S, Chen C, Hu XPS (2023) Balanced knowledge distillation for long-tailed learning. Neurocomputing. https:\/\/doi.org\/10.1016\/j.neucom.2023.01.063","journal-title":"Neurocomputing"},{"key":"5448_CR45","unstructured":"Welling M (2007) Fisher linear discriminant analysis max. In: 2007 9th Int Symp Signal Process its Appl ISSPA 2007, Proc"},{"key":"5448_CR46","doi-asserted-by":"publisher","DOI":"10.1186\/s13321-017-0226-y","author":"A Koutsoukas","year":"2017","unstructured":"Koutsoukas A, Monaghan KJ, Li X, Huan J (2017) Deep-learning: Investigating deep neural networks hyper-parameters and comparison of performance to shallow methods for modeling bioactivity data. J Cheminform. https:\/\/doi.org\/10.1186\/s13321-017-0226-y","journal-title":"J Cheminform"},{"key":"5448_CR47","unstructured":"Dorfer M, Kelz R, Widmer G (2016) Deep linear discriminant analysis. In: 4th Int Conf Learn Represent ICLR 2016\u2014Conf Track Proc"},{"key":"5448_CR48","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. Proc IEEE Comput Soc Conf Comput Vis Pattern Recognit 2016-Decem: 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"5448_CR49","doi-asserted-by":"crossref","unstructured":"Zhang Y, Xiang T, Hospedales TM, Lu H (2018) Deep mutual learning. In: Proceedings of the IEEE Computer Society Conference on Computer Vision and Pattern Recognition. IEEE conference on computer vision and pattern recognition, p 4320\u20134328","DOI":"10.1109\/CVPR.2018.00454"},{"key":"5448_CR50","unstructured":"Kim J, Park SU, Kwak N (2018) Paraphrasing complex network: Network compression via factor transfer. Adv Neural Inf Process Syst. P 2760\u20132769"}],"container-title":["The Journal of Supercomputing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-023-05448-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11227-023-05448-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-023-05448-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,10,20]],"date-time":"2023-10-20T21:07:13Z","timestamp":1697836033000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11227-023-05448-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,17]]},"references-count":50,"journal-issue":{"issue":"18","published-print":{"date-parts":[[2023,12]]}},"alternative-id":["5448"],"URL":"https:\/\/doi.org\/10.1007\/s11227-023-05448-0","relation":{},"ISSN":["0920-8542","1573-0484"],"issn-type":[{"value":"0920-8542","type":"print"},{"value":"1573-0484","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,6,17]]},"assertion":[{"value":"29 May 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 June 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}]}}