{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T11:59:51Z","timestamp":1781006391626,"version":"3.54.1"},"reference-count":50,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100003725","name":"National Research Foundation of Korea","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003725","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100010418","name":"Institute of Information & Communications Technology Planning & Evaluation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100010418","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100023231","name":"National Institute for International Education","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100023231","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Knowledge-Based Systems"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1016\/j.knosys.2026.116101","type":"journal-article","created":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T06:24:41Z","timestamp":1777875881000},"page":"116101","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["RTKD: Responsive Teacher Knowledge Distillation with heterogeneous students"],"prefix":"10.1016","volume":"345","author":[{"given":"Geonyeong","family":"Son","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8623-3088","authenticated-orcid":false,"given":"Misuk","family":"Kim","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"78","reference":[{"key":"10.1016\/j.knosys.2026.116101_b1","series-title":"Scaling laws for neural language models","author":"Kaplan","year":"2020"},{"key":"10.1016\/j.knosys.2026.116101_b2","first-page":"13693","article-title":"Energy and policy considerations for modern deep learning research","volume":"vol. 34","author":"Strubell","year":"2020"},{"key":"10.1016\/j.knosys.2026.116101_b3","series-title":"Efficient large language models: A survey","author":"Wan","year":"2023"},{"key":"10.1016\/j.knosys.2026.116101_b4","series-title":"Distilling the knowledge in a neural network","author":"Hinton","year":"2015"},{"key":"10.1016\/j.knosys.2026.116101_b5","unstructured":"A. Sengupta, S. Dixit, M.S. Akhtar, T. Chakraborty, A good learner can teach better: Teacher-student collaborative knowledge distillation, in: The Twelfth International Conference on Learning Representations, 2023."},{"key":"10.1016\/j.knosys.2026.116101_b6","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2024.102586","article-title":"Multi-level knowledge distillation via dynamic decision boundaries exploration and exploitation","volume":"112","author":"Tao","year":"2024","journal-title":"Inf. Fusion"},{"issue":"3","key":"10.1016\/j.knosys.2026.116101_b7","doi-asserted-by":"crossref","first-page":"228","DOI":"10.1080\/0969594X.2021.1884042","article-title":"A systematic review on factors influencing teachers\u2019 intentions and implementations regarding formative assessment","volume":"28","author":"Yan","year":"2021","journal-title":"Assess. Educ.: Princ. Policy & Pr."},{"issue":"17","key":"10.1016\/j.knosys.2026.116101_b8","doi-asserted-by":"crossref","DOI":"10.3390\/su16177826","article-title":"A systematic review of meta-analyses on the impact of formative assessment on K-12 students\u2019 learning: Toward sustainable quality education","volume":"16","author":"Sortwell","year":"2024","journal-title":"Sustainability"},{"key":"10.1016\/j.knosys.2026.116101_b9","article-title":"Measuring adaptive teaching in classroom discourse: Effects on student learning in elementary science education","volume":"vol. 7","author":"Hardy","year":"2022"},{"key":"10.1016\/j.knosys.2026.116101_b10","doi-asserted-by":"crossref","DOI":"10.3389\/fpsyg.2019.03087","article-title":"The power of feedback revisited: A meta-analysis of educational feedback research","volume":"10","author":"Wisniewski","year":"2020","journal-title":"Front. Psychol."},{"key":"10.1016\/j.knosys.2026.116101_b11","series-title":"Learning to teach with student feedback","author":"Liu","year":"2021"},{"key":"10.1016\/j.knosys.2026.116101_b12","doi-asserted-by":"crossref","DOI":"10.1109\/TMM.2024.3372833","article-title":"Reciprocal teacher-student learning via forward and feedback knowledge distillation","author":"Gou","year":"2024","journal-title":"IEEE Trans. Multimed."},{"key":"10.1016\/j.knosys.2026.116101_b13","series-title":"Visible Learning: a Synthesis of Over 800 Meta-Analyses Relating to Achievement","author":"Hattie","year":"2008"},{"issue":"1","key":"10.1016\/j.knosys.2026.116101_b14","doi-asserted-by":"crossref","first-page":"7","DOI":"10.1080\/0969595980050102","article-title":"Assessment and classroom learning","volume":"5","author":"Black","year":"1998","journal-title":"Assess. Educ.: Princ. Policy & Pr."},{"key":"10.1016\/j.knosys.2026.116101_b15","series-title":"Embedded Formative Assessment","author":"Wiliam","year":"2011"},{"key":"10.1016\/j.knosys.2026.116101_b16","series-title":"The Reflective Practitioner: How Professionals Think in Action","author":"Sch\u00f6n","year":"2017"},{"key":"10.1016\/j.knosys.2026.116101_b17","unstructured":"M.P.V. Kumar, M.M.S. Vani, A Cyber Security Knowledge Graph for Advanced Persistent Threat Organization Attribution."},{"key":"10.1016\/j.knosys.2026.116101_b18","doi-asserted-by":"crossref","DOI":"10.1109\/TKDE.2024.3474792","article-title":"Threatinsight: Innovating early threat detection through threat-intelligence-driven analysis and attribution","author":"Wang","year":"2024","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"10.1016\/j.knosys.2026.116101_b19","unstructured":"Y. Zhou, Z. Wang, Y. Jiang, B. Ma, R. Wang, Y. Liu, Y. Zhao, Z. Tian, AEKG4APT: An AI-Enhanced Knowledge Graph for Advanced Persistent Threats with Large Language Model Analysis, ACM Trans. Intell. Syst. Technol.."},{"issue":"5","key":"10.1016\/j.knosys.2026.116101_b20","first-page":"4754","article-title":"Dynamic prototype network based on sample adaptation for few-shot malware detection","volume":"35","author":"Chai","year":"2022","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"10.1016\/j.knosys.2026.116101_b21","article-title":"Malfscil: A few-shot class-incremental learning approach for malware detection","author":"Chai","year":"2024","journal-title":"IEEE Trans. Inf. Forensics Secur."},{"key":"10.1016\/j.knosys.2026.116101_b22","series-title":"Fitnets: Hints for thin deep nets","author":"Romero","year":"2014"},{"key":"10.1016\/j.knosys.2026.116101_b23","doi-asserted-by":"crossref","unstructured":"W. Park, D. Kim, Y. Lu, M. Cho, Relational knowledge distillation, in: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2019, pp. 3967\u20133976.","DOI":"10.1109\/CVPR.2019.00409"},{"key":"10.1016\/j.knosys.2026.116101_b24","series-title":"Contrastive representation distillation","author":"Tian","year":"2019"},{"key":"10.1016\/j.knosys.2026.116101_b25","doi-asserted-by":"crossref","unstructured":"F. Tung, G. Mori, Similarity-preserving knowledge distillation, in: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 2019, pp. 1365\u20131374.","DOI":"10.1109\/ICCV.2019.00145"},{"key":"10.1016\/j.knosys.2026.116101_b26","series-title":"Patient knowledge distillation for bert model compression","author":"Sun","year":"2019"},{"key":"10.1016\/j.knosys.2026.116101_b27","series-title":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","first-page":"1001","article-title":"Multi-granularity structural knowledge distillation for language model compression","author":"Liu","year":"2022"},{"key":"10.1016\/j.knosys.2026.116101_b28","series-title":"Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","first-page":"8449","article-title":"AD-KD: Attribution-driven knowledge distillation for language model compression","author":"Wu","year":"2023"},{"key":"10.1016\/j.knosys.2026.116101_b29","first-page":"5191","article-title":"Improved knowledge distillation via teacher assistant","volume":"vol. 34","author":"Mirzadeh","year":"2020"},{"key":"10.1016\/j.knosys.2026.116101_b30","series-title":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","first-page":"7037","article-title":"BERT learns to teach: Knowledge distillation with meta learning","author":"Zhou","year":"2022"},{"key":"10.1016\/j.knosys.2026.116101_b31","series-title":"International Conference on Machine Learning","first-page":"1126","article-title":"Model-agnostic meta-learning for fast adaptation of deep networks","author":"Finn","year":"2017"},{"key":"10.1016\/j.knosys.2026.116101_b32","series-title":"Findings of the Association for Computational Linguistics","first-page":"883","article-title":"COM2SENSE: A commonsense reasoning benchmark with complementary sentences","author":"Singh","year":"2021"},{"key":"10.1016\/j.knosys.2026.116101_b33","series-title":"Findings of the Association for Computational Linguistics","first-page":"470","article-title":"Generating deep questions with commonsense reasoning ability from the text by disentangled adversarial inference","author":"Yu","year":"2023"},{"key":"10.1016\/j.knosys.2026.116101_b34","series-title":"Commonsense reasoning for conversational ai: A survey of the state of the art","author":"Richardson","year":"2023"},{"key":"10.1016\/j.knosys.2026.116101_b35","first-page":"8082","article-title":"Qasc: A dataset for question answering via sentence composition","volume":"vol. 34","author":"Khot","year":"2020"},{"key":"10.1016\/j.knosys.2026.116101_b36","series-title":"Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing","first-page":"2381","article-title":"Can a suit of armor conduct electricity? A new dataset for open book question answering","author":"Mihaylov","year":"2018"},{"key":"10.1016\/j.knosys.2026.116101_b37","series-title":"Proceedings of the 3rd Workshop on Evaluating Vector Space Representations for NLP","first-page":"63","article-title":"CODAH: An adversarially-authored question answering dataset for common sense","author":"Chen","year":"2019"},{"key":"10.1016\/j.knosys.2026.116101_b38","series-title":"Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing","first-page":"93","article-title":"SWAG: A large-scale adversarial dataset for grounded commonsense inference","author":"Zellers","year":"2018"},{"key":"10.1016\/j.knosys.2026.116101_b39","series-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)","first-page":"4149","article-title":"CommonsenseQA: A question answering challenge targeting commonsense knowledge","author":"Talmor","year":"2019"},{"key":"10.1016\/j.knosys.2026.116101_b40","article-title":"Conceptnet 5.5: An open multilingual graph of general knowledge","volume":"vol. 31","author":"Speer","year":"2017"},{"key":"10.1016\/j.knosys.2026.116101_b41","series-title":"Think you have solved question answering? Try ARC, the AI2 reasoning challenge","author":"Clark","year":"2018"},{"key":"10.1016\/j.knosys.2026.116101_b42","series-title":"Two is better than many? binary classification as an effective approach to multi-choice question answering","author":"Ghosal","year":"2022"},{"key":"10.1016\/j.knosys.2026.116101_b43","series-title":"Bart: Denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension","author":"Lewis","year":"2019"},{"key":"10.1016\/j.knosys.2026.116101_b44","series-title":"Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers)","first-page":"1112","article-title":"A broad-coverage challenge corpus for sentence understanding through inference","author":"Williams","year":"2018"},{"key":"10.1016\/j.knosys.2026.116101_b45","doi-asserted-by":"crossref","unstructured":"J. Devlin, M.-W. Chang, K. Lee, K. Toutanova, Bert: Pre-training of deep bidirectional transformers for language understanding, in: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), 2019, pp. 4171\u20134186.","DOI":"10.18653\/v1\/N19-1423"},{"key":"10.1016\/j.knosys.2026.116101_b46","series-title":"Well-read students learn better: The impact of student initialization on knowledge distillation, 13","first-page":"3","author":"Turc","year":"2019"},{"key":"10.1016\/j.knosys.2026.116101_b47","first-page":"8024","article-title":"PyTorch: An imperative style, high-performance deep learning library","volume":"vol. 32","author":"Paszke","year":"2019"},{"key":"10.1016\/j.knosys.2026.116101_b48","series-title":"Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations","first-page":"38","article-title":"Transformers: State-of-the-art natural language processing","author":"Wolf","year":"2020"},{"key":"10.1016\/j.knosys.2026.116101_b49","unstructured":"B. Dolan, C. Brockett, Automatically constructing a corpus of sentential paraphrases, in: Third International Workshop on Paraphrasing, IWP2005, 2005."},{"key":"10.1016\/j.knosys.2026.116101_b50","series-title":"Machine Learning Challenges Workshop","first-page":"177","article-title":"The pascal recognising textual entailment challenge","author":"Dagan","year":"2005"}],"container-title":["Knowledge-Based Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0950705126008270?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0950705126008270?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T11:22:01Z","timestamp":1781004121000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0950705126008270"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6]]},"references-count":50,"alternative-id":["S0950705126008270"],"URL":"https:\/\/doi.org\/10.1016\/j.knosys.2026.116101","relation":{},"ISSN":["0950-7051"],"issn-type":[{"value":"0950-7051","type":"print"}],"subject":[],"published":{"date-parts":[[2026,6]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"RTKD: Responsive Teacher Knowledge Distillation with heterogeneous students","name":"articletitle","label":"Article Title"},{"value":"Knowledge-Based Systems","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.knosys.2026.116101","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier B.V. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"116101"}}