{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,3]],"date-time":"2026-06-03T19:28:09Z","timestamp":1780514889877,"version":"3.54.1"},"reference-count":83,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2025,3,28]],"date-time":"2025-03-28T00:00:00Z","timestamp":1743120000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,3,28]],"date-time":"2025-03-28T00:00:00Z","timestamp":1743120000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Sci. China Inf. Sci."],"published-print":{"date-parts":[[2025,9]]},"DOI":"10.1007\/s11432-023-4283-3","type":"journal-article","created":{"date-parts":[[2025,4,4]],"date-time":"2025-04-04T17:33:42Z","timestamp":1743788022000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Self-knowledge distillation with dimensional history knowledge"],"prefix":"10.1007","volume":"68","author":[{"given":"Wenke","family":"Huang","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mang","family":"Ye","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Zekun","family":"Shi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"He","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Bo","family":"Du","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,3,28]]},"reference":[{"key":"4283_CR1","first-page":"1097","volume-title":"Proceedings of Conference on Neural Information Processing Systems (NeurIPS)","author":"A Krizhevsky","year":"2012","unstructured":"Krizhevsky A, Sutskever I, Hinton G E. Imagenet classification with deep convolutional neural networks. In: Proceedings of Conference on Neural Information Processing Systems (NeurIPS), 2012. 1097\u20131105"},{"key":"4283_CR2","first-page":"770","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"K He","year":"2016","unstructured":"He K, Zhang X, Ren S, et al. Deep residual learning for image recognition. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2016. 770\u2013778"},{"key":"4283_CR3","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"A Dosovitskiy","year":"2021","unstructured":"Dosovitskiy A, Beyer L, Kolesnikov A, et al. An image is worth 16\u00d716 words: transformers for image recognition at scale. In: Proceedings of International Conference on Learning Representations (ICLR), 2021"},{"key":"4283_CR4","first-page":"11976","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"Z Liu","year":"2022","unstructured":"Liu Z, Mao H, Wu C Y, et al. A convnet for the 2020s. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022. 11976\u201311986"},{"key":"4283_CR5","doi-asserted-by":"publisher","first-page":"9387","DOI":"10.1109\/TPAMI.2024.3418862","volume":"46","author":"W Huang","year":"2024","unstructured":"Huang W, Ye M, Shi Z, et al. Federated learning for generalization, robustness, fairness: a survey and benchmark. IEEE Trans Pattern Anal Mach Intell, 2024, 46: 9387\u20139406","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4283_CR6","doi-asserted-by":"publisher","first-page":"770","DOI":"10.1109\/TKDE.2004.11","volume":"16","author":"Z-H Zhou","year":"2004","unstructured":"Zhou Z-H, Jiang Y. NeC4.5: neural ensemble based C4.5. IEEE Trans Knowl Data Eng, 2004, 16: 770\u2013773","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"4283_CR7","doi-asserted-by":"publisher","first-page":"535","DOI":"10.1145\/1150402.1150464","volume-title":"Proceedings of ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","author":"C Bucilu\u0103","year":"2006","unstructured":"Bucilu\u0103 C, Caruana R, Niculescu-Mizil A. Model compression. In: Proceedings of ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, 2006. 535\u2013541"},{"key":"4283_CR8","unstructured":"Hinton G, Vinyals O, Dean J. Distilling the knowledge in a neural network. 2015. ArXiv:1503.02531"},{"key":"4283_CR9","first-page":"2023","volume":"16","author":"V Vapnik","year":"2015","unstructured":"Vapnik V, Izmailov R. Learning using privileged information: similarity control and knowledge transfer. J Mach Learn Res, 2015, 16: 2023\u20132049","journal-title":"J Mach Learn Res"},{"key":"4283_CR10","first-page":"5900","volume-title":"Proceedings of IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)","author":"Z Tang","year":"2016","unstructured":"Tang Z, Wang D, Zhang Z. Recurrent neural network training with dark knowledge transfer. In: Proceedings of IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2016. 5900\u20135904"},{"key":"4283_CR11","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"D Lopez-Paz","year":"2016","unstructured":"Lopez-Paz D, Bottou L, Sch\u00f6lkopf B, et al. Unifying distillation and privileged information. In: Proceedings of International Conference on Learning Representations (ICLR), 2016"},{"key":"4283_CR12","doi-asserted-by":"publisher","first-page":"1789","DOI":"10.1007\/s11263-021-01453-z","volume":"129","author":"J Gou","year":"2021","unstructured":"Gou J, Yu B, Maybank S J, et al. Knowledge distillation: a survey. Int J Comput Vis, 2021, 129: 1789\u20131819","journal-title":"Int J Comput Vis"},{"key":"4283_CR13","doi-asserted-by":"publisher","first-page":"3048","DOI":"10.1109\/TPAMI.2021.3055564","volume":"44","author":"L Wang","year":"2022","unstructured":"Wang L, Yoon K J. Knowledge distillation and student-teacher learning for visual intelligence: a review and new outlooks. IEEE Trans Pattern Anal Mach Intell, 2022, 44: 3048\u20133068","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4283_CR14","first-page":"4794","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"J H Cho","year":"2019","unstructured":"Cho J H, Hariharan B. On the efficacy of knowledge distillation. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2019. 4794\u20134802"},{"key":"4283_CR15","first-page":"5191","volume-title":"Proceedings of Association for the Advancement of Artificial Intelligence (AAAI)","author":"S I Mirzadeh","year":"2020","unstructured":"Mirzadeh S I, Farajtabar M, Li A, et al. Improved knowledge distillation via teacher assistant. In: Proceedings of Association for the Advancement of Artificial Intelligence (AAAI), 2020. 5191\u20135198"},{"key":"4283_CR16","first-page":"13292","volume-title":"Proceedings of Conference on Neural Information Processing Systems (NeurIPS)","author":"D Y Park","year":"2021","unstructured":"Park D Y, Cha M H, Kim D, et al. Learning student-friendly teacher networks for knowledge distillation. In: Proceedings of Conference on Neural Information Processing Systems (NeurIPS), 2021. 13292\u201313303"},{"key":"4283_CR17","first-page":"5057","volume-title":"Proceedings of IEEE International Conference on Computer Vision (ICCV)","author":"Y Zhu","year":"2021","unstructured":"Zhu Y, Wang Y. Student customized knowledge distillation: bridging the gap between student and teacher. In: Proceedings of IEEE International Conference on Computer Vision (ICCV), 2021. 5057\u20135066"},{"key":"4283_CR18","volume-title":"Proceedings of Association for the Advancement of Artificial Intelligence (AAAI)","author":"C Yang","year":"2018","unstructured":"Yang C, Xie L, Qiao S, et al. Knowledge distillation in generations: more tolerant teachers educate better students. In: Proceedings of Association for the Advancement of Artificial Intelligence (AAAI), 2018"},{"key":"4283_CR19","first-page":"4320","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"Y Zhang","year":"2018","unstructured":"Zhang Y, Xiang T, Hospedales T M, et al. Deep mutual learning. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2018. 4320\u20134328"},{"key":"4283_CR20","first-page":"11020","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"Q Guo","year":"2020","unstructured":"Guo Q, Wang X, Wu Y, et al. Online knowledge distillation via collaborative learning. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2020. 11020\u201311029"},{"key":"4283_CR21","first-page":"3430","volume-title":"Proceedings of Association for the Advancement of Artificial Intelligence (AAAI)","author":"D Chen","year":"2020","unstructured":"Chen D, Mei J P, Wang C, et al. Online knowledge distillation with diverse peers. In: Proceedings of Association for the Advancement of Artificial Intelligence (AAAI), 2020. 3430\u20133437"},{"key":"4283_CR22","first-page":"10302","volume-title":"Proceedings of Association for the Advancement of Artificial Intelligence (AAAI)","author":"G Wu","year":"2021","unstructured":"Wu G, Gong S. Peer collaborative learning for online knowledge distillation. In: Proceedings of Association for the Advancement of Artificial Intelligence (AAAI), 2021. 10302\u201310310"},{"key":"4283_CR23","first-page":"1607","volume-title":"Proceedings of International Conference on Machine Learning (ICML)","author":"T Furlanello","year":"2018","unstructured":"Furlanello T, Lipton Z, Tschannen M, et al. Born again neural networks. In: Proceedings of International Conference on Machine Learning (ICML), 2018. 1607\u20131616"},{"key":"4283_CR24","first-page":"2859","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"C Yang","year":"2019","unstructured":"Yang C, Xie L, Su C, et al. Snapshot distillation: teacher-student optimization in one generation. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2019. 2859\u20132868"},{"key":"4283_CR25","first-page":"6567","volume-title":"Proceedings of IEEE International Conference on Computer Vision (ICCV)","author":"K Kim","year":"2021","unstructured":"Kim K, Ji B, Yoon D, et al. Self-knowledge distillation with progressive refinement of targets. In: Proceedings of IEEE International Conference on Computer Vision (ICCV), 2021. 6567\u20136576"},{"key":"4283_CR26","first-page":"11943","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"Y Shen","year":"2022","unstructured":"Shen Y, Xu L, Yang Y, et al. Self-distillation from the last mini-batch for consistency regularization. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022. 11943\u201311952"},{"key":"4283_CR27","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"H Zhou","year":"2021","unstructured":"Zhou H, Song L, Chen J, et al. Rethinking soft labels for knowledge distillation: a bias-variance tradeoff perspective. In: Proceedings of International Conference on Learning Representations (ICLR), 2021"},{"key":"4283_CR28","volume-title":"Sensory Communication. Cambridge: MIT Press","author":"H B Barlow","year":"1961","unstructured":"Barlow H B. Possible principles underlying the transformation of sensory messages. In: Sensory Communication. Cambridge: MIT Press, 1961"},{"key":"4283_CR29","first-page":"1597","volume-title":"Proceedings of International Conference on Machine Learning (ICML)","author":"T Chen","year":"2020","unstructured":"Chen T, Kornblith S, Norouzi M, et al. A simple framework for contrastive learning of visual representations. In: Proceedings of International Conference on Machine Learning (ICML), 2020. 1597\u20131607"},{"key":"4283_CR30","first-page":"9729","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"K He","year":"2020","unstructured":"He K, Fan H, Wu Y, et al. Momentum contrast for unsupervised visual representation learning. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2020. 9729\u20139738"},{"key":"4283_CR31","first-page":"6210","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"M Ye","year":"2019","unstructured":"Ye M, Zhang X, Yuen P C, et al. Unsupervised embedding learning via invariant and spreading instance feature. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2019. 6210\u20136219"},{"key":"4283_CR32","doi-asserted-by":"publisher","first-page":"6946","DOI":"10.1109\/TGRS.2020.3030990","volume":"59","author":"X Feng","year":"2020","unstructured":"Feng X, Han J, Yao X, et al. TCANet: triple context-aware network for weakly supervised object detection in remote sensing images. IEEE Trans Geosci Remote Sens, 2020, 59: 6946\u20136955","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"4283_CR33","doi-asserted-by":"publisher","first-page":"8002","DOI":"10.1109\/TGRS.2020.2985989","volume":"58","author":"X Feng","year":"2020","unstructured":"Feng X, Han J, Yao X, et al. Progressive contextual instance refinement for weakly supervised object detection in remote sensing images. IEEE Trans Geosci Remote Sens, 2020, 58: 8002\u20138012","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"4283_CR34","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"W Huang","year":"2022","unstructured":"Huang W, Ye M, Du B. Learn from others and be yourself in heterogeneous federated learning. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022"},{"key":"4283_CR35","doi-asserted-by":"publisher","first-page":"712","DOI":"10.1109\/TPAMI.2023.3327373","volume":"46","author":"W Huang","year":"2024","unstructured":"Huang W, Ye M, Shi Z, et al. Generalizable heterogeneous federated cross-correlation and instance similarity learning. IEEE Trans Pattern Anal Mach Intell, 2024, 46: 712\u2013728","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4283_CR36","volume-title":"Proceedings of International Conference on Machine Learning (ICML)","author":"J Zbontar","year":"2021","unstructured":"Zbontar J, Jing L, Misra I, et al. Barlow twins: self-supervised learning via redundancy reduction. In: Proceedings of International Conference on Machine Learning (ICML), 2021"},{"key":"4283_CR37","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"A Bardes","year":"2022","unstructured":"Bardes A, Ponce J, LeCun Y. VICReg: variance-invariance-covariance regularization for self-supervised learning. In: Proceedings of International Conference on Learning Representations (ICLR), 2022"},{"key":"4283_CR38","first-page":"16600","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"S Zhang","year":"2022","unstructured":"Zhang S, Qiu L, Zhu F, et al. Align representations with base: a new approach to self-supervised learning. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022. 16600\u201316609"},{"key":"4283_CR39","volume-title":"Proceedings of Conference on Neural Information Processing Systems (NeurIPS)","author":"J Li","year":"2022","unstructured":"Li J, Qiang W, Zhang Y, et al. MetaMask: revisiting dimensional confounder for self-supervised learning. In: Proceedings of Conference on Neural Information Processing Systems (NeurIPS), 2022"},{"key":"4283_CR40","series-title":"Dissertation for Ph.D. Degree","volume-title":"Learning multiple layers of features from tiny images","author":"A Krizhevsky","year":"2009","unstructured":"Krizhevsky A, Hinton G. Learning multiple layers of features from tiny images. Dissertation for Ph.D. Degree. Toronto: University of Toronto, 2009"},{"key":"4283_CR41","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky O, Deng J, Su H, et al. ImageNet large scale visual recognition challenge. Int J Comput Vis, 2015, 115: 211\u2013252","journal-title":"Int J Comput Vis"},{"key":"4283_CR42","first-page":"1492","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"S Xie","year":"2017","unstructured":"Xie S, Girshick R, Doll\u00e1r P, et al. Aggregated residual transformations for deep neural networks. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2017. 1492\u20131500"},{"key":"4283_CR43","unstructured":"Howard A G, Zhu M, Chen B, et al. MobileNets: efficient convolutional neural networks for mobile vision applications. 2017. ArXiv:1704.04861"},{"key":"4283_CR44","first-page":"6105","volume-title":"Proceedings of International Conference on Machine Learning (ICML)","author":"M Tan","year":"2019","unstructured":"Tan M, Le Q. EfficientNet: rethinking model scaling for convolutional neural networks. In: Proceedings of International Conference on Machine Learning (ICML), 2019. 6105\u20136114"},{"key":"4283_CR45","first-page":"3903","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"L Yuan","year":"2020","unstructured":"Yuan L, Tay F E, Li G, et al. Revisiting knowledge distillation via label smoothing regularization. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2020. 3903\u20133911"},{"key":"4283_CR46","first-page":"6290","volume-title":"Proceedings of IEEE International Conference on Computer Vision (ICCV)","author":"Y Kim","year":"2021","unstructured":"Kim Y, Park J, Jang Y, et al. Distilling global and local with densely connected relations. In: Proceedings of IEEE International Conference on Computer Vision (ICCV), 2021. 6290\u20136300"},{"key":"4283_CR47","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"B Zhao","year":"2022","unstructured":"Zhao B, Cui Q, Song R, et al. Decoupled knowledge distillation. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022"},{"key":"4283_CR48","doi-asserted-by":"publisher","first-page":"7296","DOI":"10.1109\/TCSVT.2023.3279281","volume":"33","author":"S Xu","year":"2023","unstructured":"Xu S, Zhang S, Liu J, et al. Generative data free model quantization with knowledge matching for classification. IEEE Trans Circuits Syst Video Technol, 2023, 33: 7296\u20137309","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"4283_CR49","unstructured":"Tang J, Shivanna R, Zhao Z, et al. Understanding and improving knowledge distillation. 2020. ArXiv:2002.03532"},{"key":"4283_CR50","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"A Romero","year":"2015","unstructured":"Romero A, Ballas N, Kahou S E, et al. FitNets: hints for thin deep nets. In: Proceedings of International Conference on Learning Representations (ICLR), 2015"},{"key":"4283_CR51","volume-title":"Proceedings of International Conference on Learning Representations (ICLR)","author":"N Komodakis","year":"2017","unstructured":"Komodakis N, Zagoruyko S. Paying more attention to attention: improving the performance of convolutional neural networks via attention transfer. In: Proceedings of International Conference on Learning Representations (ICLR), 2017"},{"key":"4283_CR52","first-page":"1921","volume-title":"Proceedings of IEEE International Conference on Computer Vision (ICCV)","author":"B Heo","year":"2019","unstructured":"Heo B, Kim J, Yun S, et al. A comprehensive overhaul of feature distillation. In: Proceedings of IEEE International Conference on Computer Vision (ICCV), 2019. 1921\u20131930"},{"key":"4283_CR53","first-page":"588","volume-title":"Proceedings of European Conference on Computer Vision (ECCV)","author":"G Xu","year":"2020","unstructured":"Xu G, Liu Z, Li X, et al. Knowledge distillation meets self-supervision. In: Proceedings of European Conference on Computer Vision (ECCV), 2020. 588\u2013604"},{"key":"4283_CR54","first-page":"5008","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"P Chen","year":"2021","unstructured":"Chen P, Liu S, Zhao H, et al. Distilling knowledge via knowledge review. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2021. 5008\u20135017"},{"key":"4283_CR55","volume-title":"Proceedings of European Conference on Computer Vision (ECCV)","author":"Z Yang","year":"2022","unstructured":"Yang Z, Li Z, Shao M, et al. Masked generative distillation. In: Proceedings of European Conference on Computer Vision (ECCV), 2022"},{"key":"4283_CR56","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1016\/j.neunet.2021.01.022","volume":"138","author":"Z Xie","year":"2021","unstructured":"Xie Z, Wen Z, Wang Y, et al. Towards effective deep transfer via attentive feature alignment. Neural Netws, 2021, 138: 98\u2013109","journal-title":"Neural Netws"},{"key":"4283_CR57","first-page":"625","volume-title":"Proceedings of European Conference on Computer Vision (ECCV)","author":"Z Xie","year":"2020","unstructured":"Xie Z, Wen Z, Liu J, et al. Deep transferring quantization. In: Proceedings of European Conference on Computer Vision (ECCV), 2020. 625\u2013642"},{"key":"4283_CR58","first-page":"4133","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"J Yim","year":"2017","unstructured":"Yim J, Joo D, Bae J, et al. A gift from knowledge distillation: fast optimization, network minimization and transfer learning. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2017. 4133\u20134141"},{"key":"4283_CR59","first-page":"3967","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"W Park","year":"2019","unstructured":"Park W, Kim D, Lu Y, et al. Relational knowledge distillation. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2019. 3967\u20133976"},{"key":"4283_CR60","first-page":"9260","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"J Zhu","year":"2021","unstructured":"Zhu J, Tang S, Chen D, et al. Complementary relation contrastive distillation. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2021. 9260\u20139269"},{"key":"4283_CR61","doi-asserted-by":"publisher","first-page":"1817","DOI":"10.1109\/TPAMI.2022.3160328","volume":"45","author":"H J Ye","year":"2023","unstructured":"Ye H J, Lu S, Zhan D C. Generalized knowledge distillation via relationship matching. IEEE Trans Pattern Anal Mach Intell, 2023, 45: 1817\u20131834","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4283_CR62","first-page":"1355","volume-title":"Proceedings of IEEE International Conference on Computer Vision (ICCV)","author":"M Phuong","year":"2019","unstructured":"Phuong M, Lampert C H. Distillation-based training for multi-exit architectures. In: Proceedings of IEEE International Conference on Computer Vision (ICCV), 2019. 1355\u20131364"},{"key":"4283_CR63","first-page":"1013","volume-title":"Proceedings of IEEE International Conference on Computer Vision (ICCV)","author":"Y Hou","year":"2019","unstructured":"Hou Y, Ma Z, Liu C, et al. Learning lightweight lane detection CNNs by self attention distillation. In: Proceedings of IEEE International Conference on Computer Vision (ICCV), 2019. 1013\u20131021"},{"key":"4283_CR64","first-page":"3713","volume-title":"Proceedings of IEEE International Conference on Computer Vision (ICCV)","author":"L Zhang","year":"2019","unstructured":"Zhang L, Song J, Gao A, et al. Be your own teacher: improve the performance of convolutional neural networks via self distillation. In: Proceedings of IEEE International Conference on Computer Vision (ICCV), 2019. 3713\u20133722"},{"key":"4283_CR65","first-page":"10664","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"M Ji","year":"2021","unstructured":"Ji M, Shin S, Hwang S, et al. Refine myself by teaching myself: feature refinement via self-knowledge distillation. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2021. 10664\u201310673"},{"key":"4283_CR66","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1016\/j.inffus.2022.09.007","volume":"90","author":"Z Long","year":"2023","unstructured":"Long Z, Ma F, Sun B, et al. Diversified branch fusion for self-knowledge distillation. Inf Fusion, 2023, 90: 12\u201322","journal-title":"Inf Fusion"},{"key":"4283_CR67","first-page":"5565","volume-title":"Proceedings of Association for the Advancement of Artificial Intelligence (AAAI)","author":"T B Xu","year":"2019","unstructured":"Xu T B, Liu C L. Data-distortion guided self-distillation for deep neural networks. In: Proceedings of Association for the Advancement of Artificial Intelligence (AAAI), 2019. 5565\u20135572"},{"key":"4283_CR68","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"S Yun","year":"2020","unstructured":"Yun S, Park J, Lee K, et al. Regularizing class-wise predictions via self-knowledge distillation. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2020"},{"key":"4283_CR69","volume-title":"Proceedings of European Conference on Computer Vision (ECCV)","author":"C Yang","year":"2022","unstructured":"Yang C, An Z, Zhou H, et al. MixSKD: self-knowledge distillation from mixup for image recognition. In: Proceedings of European Conference on Computer Vision (ECCV), 2022"},{"key":"4283_CR70","unstructured":"Ge Y, Choi C L, Zhang X, et al. Self-distillation with batch knowledge ensembling improves ImageNet classification. 2021. ArXiv:2104.13298"},{"key":"4283_CR71","first-page":"2818","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"C Szegedy","year":"2016","unstructured":"Szegedy C, Vanhoucke V, Ioffe S, et al. Rethinking the inception architecture for computer vision. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2016. 2818\u20132826"},{"key":"4283_CR72","volume-title":"Proceedings of Conference on Neural Information Processing Systems (NeurIPS)","author":"R M\u00fcller","year":"2019","unstructured":"M\u00fcller R, Kornblith S, Hinton G E. When does label smoothing help? In: Proceedings of Conference on Neural Information Processing Systems (NeurIPS), 2019"},{"key":"4283_CR73","volume-title":"Proceedings of European Conference on Computer Vision (ECCV)","author":"J Liang","year":"2022","unstructured":"Liang J, Li L, Bing Z, et al. Efficient one pass self-distillation with Zipf\u2019s label smoothing. In: Proceedings of European Conference on Computer Vision (ECCV), 2022"},{"key":"4283_CR74","doi-asserted-by":"publisher","first-page":"109541","DOI":"10.1016\/j.patcog.2023.109541","volume":"140","author":"Y Cho","year":"2023","unstructured":"Cho Y, Ham G, Lee J H, et al. Ambiguity-aware robust teacher (ART): enhanced self-knowledge distillation framework with pruned teacher network. Pattern Recogn, 2023, 140: 109541","journal-title":"Pattern Recogn"},{"key":"4283_CR75","doi-asserted-by":"publisher","first-page":"103771","DOI":"10.1016\/j.cviu.2023.103771","volume":"235","author":"F Liu","year":"2023","unstructured":"Liu F, Wang Y, Li Z, et al. GEIKD: self-knowledge distillation based on gated ensemble networks and influences-based label noise removal. Comput Vision Image Understanding, 2023, 235: 103771","journal-title":"Comput Vision Image Understanding"},{"key":"4283_CR76","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1007\/s10479-005-5724-z","volume":"134","author":"P T de Boer","year":"2005","unstructured":"de Boer P T, Kroese D P, Mannor S, et al. A tutorial on the cross-entropy method. Ann Oper Res, 2005, 134: 19\u201367","journal-title":"Ann Oper Res"},{"key":"4283_CR77","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1214\/aoms\/1177729694","volume":"22","author":"S Kullback","year":"1951","unstructured":"Kullback S, Leibler R A. On Information and Sufficiency. Ann Math Statist, 1951, 22: 79\u201386","journal-title":"Ann Math Statist"},{"key":"4283_CR78","first-page":"16570","volume-title":"Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","author":"X Wang","year":"2022","unstructured":"Wang X, Fan H, Tian Y, et al. On the importance of asymmetry for Siamese representation learning. In: Proceedings of IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2022. 16570\u201316579"},{"key":"4283_CR79","first-page":"2184","volume-title":"Proceedings of Conference on Neural Information Processing Systems (NeurIPS)","author":"Z Zhang","year":"2020","unstructured":"Zhang Z, Sabuncu M. Self-distillation as instance-specific label smoothing. In: Proceedings of Conference on Neural Information Processing Systems (NeurIPS), 2020. 2184\u20132195"},{"key":"4283_CR80","first-page":"21271","volume-title":"Proceedings of Conference on Neural Information Processing Systems (NeurIPS)","author":"J B Grill","year":"2020","unstructured":"Grill J B, Strub F, Altch\u00e9 F, et al. Bootstrap your own latent\u2014a new approach to self-supervised learning. In: Proceedings of Conference on Neural Information Processing Systems (NeurIPS), 2020. 21271\u201321284"},{"key":"4283_CR81","first-page":"9650","volume-title":"Proceedings of IEEE International Conference on Computer Vision (ICCV)","author":"M Caron","year":"2021","unstructured":"Caron M, Touvron H, Misra I, et al. Emerging properties in self-supervised vision transformers. In: Proceedings of IEEE International Conference on Computer Vision (ICCV), 2021. 9650\u20139660"},{"key":"4283_CR82","volume-title":"Proceedings of Conference on Neural Information Processing Systems (NeurIPS)","author":"A Paszke","year":"2019","unstructured":"Paszke A, Gross S, Massa F, et al. PyTorch: an imperative style, high-performance deep learning library. In: Proceedings of Conference on Neural Information Processing Systems (NeurIPS), 2019"},{"key":"4283_CR83","doi-asserted-by":"publisher","first-page":"400","DOI":"10.1214\/aoms\/1177729586","volume":"22","author":"H Robbins","year":"1951","unstructured":"Robbins H, Monro S. A stochastic approximation method. Ann Math Statist, 1951, 22: 400\u2013407","journal-title":"Ann Math Statist"}],"container-title":["Science China Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-023-4283-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11432-023-4283-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-023-4283-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,5]],"date-time":"2025-04-05T22:12:27Z","timestamp":1743891147000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11432-023-4283-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,28]]},"references-count":83,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2025,9]]}},"alternative-id":["4283"],"URL":"https:\/\/doi.org\/10.1007\/s11432-023-4283-3","relation":{},"ISSN":["1674-733X","1869-1919"],"issn-type":[{"value":"1674-733X","type":"print"},{"value":"1869-1919","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3,28]]},"assertion":[{"value":"17 September 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 March 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 August 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 March 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"192101"}}