{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,8]],"date-time":"2026-06-08T12:59:56Z","timestamp":1780923596151,"version":"3.54.1"},"reference-count":61,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/100007219","name":"Shanghai Municipal Natural Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100007219","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Knowledge-Based Systems"],"published-print":{"date-parts":[[2026,7]]},"DOI":"10.1016\/j.knosys.2026.116262","type":"journal-article","created":{"date-parts":[[2026,5,23]],"date-time":"2026-05-23T06:50:40Z","timestamp":1779519040000},"page":"116262","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["Multi-Scale Attention-Relation-Based Knowledge Distillation for real-time intrusion detection system in IoT networks"],"prefix":"10.1016","volume":"347","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-8012-7963","authenticated-orcid":false,"given":"Jianheng","family":"Tong","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2637-6765","authenticated-orcid":false,"given":"Ying","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"78","reference":[{"issue":"12","key":"10.1016\/j.knosys.2026.116262_b1","doi-asserted-by":"crossref","first-page":"9531","DOI":"10.1109\/JIOT.2020.3007130","article-title":"Deep-learning-enabled security issues in the internet of things","volume":"8","author":"Lv","year":"2020","journal-title":"IEEE Internet Things J."},{"key":"10.1016\/j.knosys.2026.116262_b2","series-title":"2021 International Conference on Advancements in Electrical, Electronics, Communication, Computing and Automation","first-page":"1","article-title":"Intrusion detection and prevention in networks using machine learning and deep learning approaches: a review","author":"Abraham","year":"2021"},{"issue":"7","key":"10.1016\/j.knosys.2026.116262_b3","doi-asserted-by":"crossref","first-page":"6481","DOI":"10.1109\/JIOT.2019.2958185","article-title":"Anomaly detection for IoT time-series data: A survey","volume":"7","author":"Cook","year":"2019","journal-title":"IEEE Internet Things J."},{"issue":"6","key":"10.1016\/j.knosys.2026.116262_b4","doi-asserted-by":"crossref","first-page":"4937","DOI":"10.1109\/JIOT.2020.2971463","article-title":"Sybil attack in RPL-based internet of things: Analysis and defenses","volume":"7","author":"Pu","year":"2020","journal-title":"IEEE Internet Things J."},{"key":"10.1016\/j.knosys.2026.116262_b5","doi-asserted-by":"crossref","first-page":"15881","DOI":"10.1007\/s11042-018-6338-1","article-title":"Cyber forensics framework for big data analytics in IoT environment using machine learning","volume":"79","author":"Chhabra","year":"2020","journal-title":"Multimedia Tools Appl."},{"key":"10.1016\/j.knosys.2026.116262_b6","doi-asserted-by":"crossref","DOI":"10.1016\/j.jclepro.2020.121571","article-title":"Towards automated aquaponics: A review on monitoring, IoT, and smart systems","volume":"263","author":"Yanes","year":"2020","journal-title":"J. Clean. Prod."},{"key":"10.1016\/j.knosys.2026.116262_b7","doi-asserted-by":"crossref","first-page":"78847","DOI":"10.1109\/ACCESS.2020.2990195","article-title":"A review of insider threat detection approaches with IoT perspective","volume":"8","author":"Kim","year":"2020","journal-title":"IEEE Access"},{"issue":"15","key":"10.1016\/j.knosys.2026.116262_b8","doi-asserted-by":"crossref","first-page":"12251","DOI":"10.1109\/JIOT.2021.3060878","article-title":"Semi-supervised spatiotemporal deep learning for intrusions detection in IoT networks","volume":"8","author":"Abdel-Basset","year":"2021","journal-title":"IEEE Internet Things J."},{"key":"10.1016\/j.knosys.2026.116262_b9","doi-asserted-by":"crossref","DOI":"10.1016\/j.jnca.2023.103760","article-title":"Deep transfer learning for intrusion detection in industrial control networks: A comprehensive review","volume":"220","author":"Kheddar","year":"2023","journal-title":"J. Netw. Comput. Appl."},{"key":"10.1016\/j.knosys.2026.116262_b10","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2025.103347","article-title":"Transformers and large language models for efficient intrusion detection systems: A comprehensive survey","volume":"124","author":"Kheddar","year":"2025","journal-title":"Inf. Fusion"},{"issue":"1","key":"10.1016\/j.knosys.2026.116262_b11","first-page":"857","article-title":"Self-supervised learning: Generative or contrastive","volume":"35","author":"Liu","year":"2021","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"4","key":"10.1016\/j.knosys.2026.116262_b12","doi-asserted-by":"crossref","first-page":"2860","DOI":"10.1109\/TII.2020.3015026","article-title":"An adaptive trust boundary protection for iIoT networks using deep-learning feature-extraction-based semisupervised model","volume":"17","author":"Hassan","year":"2020","journal-title":"IEEE Trans. Ind. Informatics"},{"key":"10.1016\/j.knosys.2026.116262_b13","doi-asserted-by":"crossref","first-page":"1965","DOI":"10.1109\/TIFS.2025.3539100","article-title":"Intrusion detection for internet of things: an anchor graph clustering approach","volume":"20","author":"Wu","year":"2025","journal-title":"IEEE Trans. Inf. Forensics Secur."},{"key":"10.1016\/j.knosys.2026.116262_b14","doi-asserted-by":"crossref","first-page":"5668","DOI":"10.1109\/TIFS.2024.3402148","article-title":"Online self-supervised deep learning for intrusion detection systems","volume":"19","author":"Nak\u0131p","year":"2024","journal-title":"IEEE Trans. Inf. Forensics Secur."},{"key":"10.1016\/j.knosys.2026.116262_b15","article-title":"Attention is all you need","author":"Vaswani","year":"2017","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.knosys.2026.116262_b16","first-page":"11106","article-title":"Informer: Beyond efficient transformer for long sequence time-series forecasting","volume":"vol. 35","author":"Zhou","year":"2021"},{"key":"10.1016\/j.knosys.2026.116262_b17","series-title":"International Conference on Machine Learning","first-page":"27268","article-title":"Fedformer: Frequency enhanced decomposed transformer for long-term series forecasting","author":"Zhou","year":"2022"},{"key":"10.1016\/j.knosys.2026.116262_b18","series-title":"Distilling the knowledge in a neural network","author":"Hinton","year":"2015"},{"key":"10.1016\/j.knosys.2026.116262_b19","doi-asserted-by":"crossref","unstructured":"W. Park, D. Kim, Y. Lu, M. Cho, Relational knowledge distillation, in: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2019, pp. 3967\u20133976.","DOI":"10.1109\/CVPR.2019.00409"},{"key":"10.1016\/j.knosys.2026.116262_b20","article-title":"Crossformer++: A versatile vision transformer hinging on cross-scale attention","author":"Wang","year":"2023","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.knosys.2026.116262_b21","series-title":"The Twelfth International Conference on Learning Representations","article-title":"ModernTCN: A modern pure convolution structure for general time series analysis","author":"donghao","year":"2024"},{"key":"10.1016\/j.knosys.2026.116262_b22","series-title":"Rwkv-7\u201d goose\u201d with expressive dynamic state evolution","author":"Peng","year":"2025"},{"key":"10.1016\/j.knosys.2026.116262_b23","series-title":"Retentive network: A successor to transformer for large language models","author":"Sun","year":"2023"},{"key":"10.1016\/j.knosys.2026.116262_b24","doi-asserted-by":"crossref","unstructured":"B. Peng, X. Jin, J. Liu, D. Li, Y. Wu, Y. Liu, S. Zhou, Z. Zhang, Correlation Congruence for Knowledge Distillation, in: Proceedings of the IEEE\/CVF International Conference on Computer Vision, ICCV, 2019.","DOI":"10.1109\/ICCV.2019.00511"},{"issue":"1","key":"10.1016\/j.knosys.2026.116262_b25","first-page":"857","article-title":"Self-supervised learning: Generative or contrastive","volume":"35","author":"Liu","year":"2021","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"10.1016\/j.knosys.2026.116262_b26","doi-asserted-by":"crossref","first-page":"261","DOI":"10.1016\/j.neucom.2022.03.048","article-title":"Efficient time series anomaly detection by multiresolution self-supervised discriminative network","volume":"491","author":"Huang","year":"2022","journal-title":"Neurocomputing"},{"issue":"8","key":"10.1016\/j.knosys.2026.116262_b27","doi-asserted-by":"crossref","first-page":"6247","DOI":"10.1109\/JIOT.2020.3024800","article-title":"Intrusion detection for cyber\u2013physical systems using generative adversarial networks in fog environment","volume":"8","author":"de Araujo-Filho","year":"2020","journal-title":"IEEE Internet Things J."},{"issue":"11","key":"10.1016\/j.knosys.2026.116262_b28","doi-asserted-by":"crossref","first-page":"9389","DOI":"10.1109\/TNNLS.2022.3159538","article-title":"Self-supervised attentive generative adversarial networks for video anomaly detection","volume":"34","author":"Huang","year":"2022","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"issue":"1","key":"10.1016\/j.knosys.2026.116262_b29","article-title":"Deep semisupervised learning-based network anomaly detection in heterogeneous information systems.","volume":"70","author":"Lutsiv","year":"2022","journal-title":"Comput. Mater. Contin."},{"key":"10.1016\/j.knosys.2026.116262_b30","doi-asserted-by":"crossref","DOI":"10.1016\/j.engappai.2025.111973","article-title":"A network intrusion detection system based on self-supervised learning of traffic differentiation in internet of things","volume":"160","author":"Chen","year":"2025","journal-title":"Eng. Appl. Artif. Intell."},{"key":"10.1016\/j.knosys.2026.116262_b31","doi-asserted-by":"crossref","DOI":"10.1016\/j.compeleceng.2025.110753","article-title":"Low-latency and interpretable intrusion detection for iIoT using self-supervised learning with entropy-based masking","volume":"128","author":"Khan","year":"2025","journal-title":"Comput. Electr. Eng."},{"key":"10.1016\/j.knosys.2026.116262_b32","unstructured":"T. Dao, A. Gu, Transformers are SSMs: Generalized Models and Efficient Algorithms Through Structured State Space Duality, in: Forty-First International Conference on Machine Learning."},{"key":"10.1016\/j.knosys.2026.116262_b33","series-title":"xLSTM: Extended long short-term memory","author":"Beck","year":"2024"},{"key":"10.1016\/j.knosys.2026.116262_b34","series-title":"Fitnets: Hints for thin deep nets","author":"Romero","year":"2014"},{"key":"10.1016\/j.knosys.2026.116262_b35","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/j.ins.2021.10.043","article-title":"Online knowledge distillation with elastic peer","volume":"583","author":"Tan","year":"2022","journal-title":"Inform. Sci."},{"key":"10.1016\/j.knosys.2026.116262_b36","doi-asserted-by":"crossref","unstructured":"J. Zhu, S. Tang, D. Chen, S. Yu, Y. Liu, M. Rong, A. Yang, X. Wang, Complementary relation contrastive distillation, in: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2021, pp. 9260\u20139269.","DOI":"10.1109\/CVPR46437.2021.00914"},{"key":"10.1016\/j.knosys.2026.116262_b37","doi-asserted-by":"crossref","unstructured":"S. Zhou, Y. Wang, D. Chen, J. Chen, X. Wang, C. Wang, J. Bu, Distilling holistic knowledge with graph neural networks, in: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 2021, pp. 10387\u201310396.","DOI":"10.1109\/ICCV48922.2021.01022"},{"key":"10.1016\/j.knosys.2026.116262_b38","series-title":"International Conference on Knowledge Science, Engineering and Management","first-page":"357","article-title":"Knowledge distillation via channel correlation structure","author":"Li","year":"2021"},{"issue":"2","key":"10.1016\/j.knosys.2026.116262_b39","doi-asserted-by":"crossref","first-page":"1817","DOI":"10.1109\/TPAMI.2022.3160328","article-title":"Generalized knowledge distillation via relationship matching","volume":"45","author":"Ye","year":"2022","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"5","key":"10.1016\/j.knosys.2026.116262_b40","doi-asserted-by":"crossref","first-page":"7099","DOI":"10.1109\/TII.2022.3209672","article-title":"Multilevel attention-based sample correlations for knowledge distillation","volume":"19","author":"Gou","year":"2022","journal-title":"IEEE Trans. Ind. Informatics"},{"key":"10.1016\/j.knosys.2026.116262_b41","doi-asserted-by":"crossref","DOI":"10.1016\/j.engappai.2025.112356","article-title":"Research on lightweight network for real-time detection of steel structure corrosion based on knowledge distillation","volume":"162","author":"Hou","year":"2025","journal-title":"Eng. Appl. Artif. Intell."},{"key":"10.1016\/j.knosys.2026.116262_b42","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2026.104158","article-title":"A novel knowledge distillation and hybrid explainability approach for phenology stage classification from multi-source time series","author":"Ullah","year":"2026","journal-title":"Inf. Fusion"},{"issue":"20","key":"10.1016\/j.knosys.2026.116262_b43","first-page":"64","article-title":"Review of attention mechanism in convolutional neural networks","volume":"57","author":"Zhang","year":"2021","journal-title":"Comput. Eng. Appl."},{"key":"10.1016\/j.knosys.2026.116262_b44","series-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition","first-page":"7132","article-title":"Squeeze-and-excitation networks","author":"Hu","year":"2018"},{"key":"10.1016\/j.knosys.2026.116262_b45","series-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition","first-page":"11534","article-title":"ECA-net: Efficient channel attention for deep convolutional neural networks","author":"Wang","year":"2020"},{"key":"10.1016\/j.knosys.2026.116262_b46","unstructured":"Y. Liu, T. Hu, H. Zhang, H. Wu, S. Wang, L. Ma, M. Long, iTransformer: Inverted Transformers Are Effective for Time Series Forecasting, in: The Twelfth International Conference on Learning Representations."},{"key":"10.1016\/j.knosys.2026.116262_b47","series-title":"Eagle and finch: RWKV with matrix-valued states and dynamic recurrence","author":"Peng","year":"2024"},{"key":"10.1016\/j.knosys.2026.116262_b48","unstructured":"Z. Qiu, Z. Wang, B. Zheng, Z. Huang, K. Wen, S. Yang, R. Men, L. Yu, F. Huang, S. Huang, et al., Gated Attention for Large Language Models: Non-linearity, Sparsity, and Attention-Sink-Free, in: The Thirty-Ninth Annual Conference on Neural Information Processing Systems, 2025."},{"key":"10.1016\/j.knosys.2026.116262_b49","doi-asserted-by":"crossref","unstructured":"Q. Fan, H. Huang, Y. Ai, R. He, Rectifying magnitude neglect in linear attention, in: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 2025, pp. 21505\u201321514.","DOI":"10.1109\/ICCV51701.2025.01997"},{"key":"10.1016\/j.knosys.2026.116262_b50","first-page":"22419","article-title":"Autoformer: Decomposition transformers with auto-correlation for long-term series forecasting","volume":"vol. 34","author":"Wu","year":"2021"},{"key":"10.1016\/j.knosys.2026.116262_b51","series-title":"Less is more: Fast multivariate time series forecasting with light sampling-oriented mlp structures","author":"Zhang","year":"2022"},{"key":"10.1016\/j.knosys.2026.116262_b52","series-title":"The Eleventh International Conference on Learning Representations","article-title":"TimesNet: Temporal 2D-variation modeling for general time series analysis","author":"Wu","year":"2023"},{"key":"10.1016\/j.knosys.2026.116262_b53","series-title":"The Eleventh International Conference on Learning Representations","article-title":"MICN: Multi-scale local and global context modeling for long-term series forecasting","author":"Wang","year":"2023"},{"key":"10.1016\/j.knosys.2026.116262_b54","series-title":"13th International Conference on Learning Representations, ICLR 2025","first-page":"18810","article-title":"Towards a general time series anomaly detector with adaptive bottlenecks and dual adversarial decoders","author":"Shentu","year":"2025"},{"key":"10.1016\/j.knosys.2026.116262_b55","doi-asserted-by":"crossref","unstructured":"Z. Liang, D. Cai, C. Zhang, Z. Liang, C. Liang, B. Zheng, S. Qiu, J. Wang, H. Wang, KDSelector: A Knowledge-Enhanced and Data-Efficient Model Selector Learning Framework for Time Series Anomaly Detection, in: Companion of the 2025 International Conference on Management of Data, 2025, pp. 175\u2013178.","DOI":"10.1145\/3722212.3725110"},{"key":"10.1016\/j.knosys.2026.116262_b56","doi-asserted-by":"crossref","unstructured":"Y. Xie, H. Zhang, M.A. Babar, Multivariate time series anomaly detection by capturing coarse-grained intra-and inter-variate dependencies, in: Proceedings of the ACM on Web Conference 2025, 2025, pp. 697\u2013705.","DOI":"10.1145\/3696410.3714941"},{"key":"10.1016\/j.knosys.2026.116262_b57","unstructured":"Y. Tian, D. Krishnan, P. Isola, Contrastive Representation Distillation, in: International Conference on Learning Representations."},{"key":"10.1016\/j.knosys.2026.116262_b58","unstructured":"N. Komodakis, S. Zagoruyko, Paying more attention to attention: improving the performance of convolutional neural networks via attention transfer, in: ICLR, 2017."},{"key":"10.1016\/j.knosys.2026.116262_b59","doi-asserted-by":"crossref","unstructured":"S. Ahn, S.X. Hu, A. Damianou, N.D. Lawrence, Z. Dai, Variational Information Distillation for Knowledge Transfer, in: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR, 2019.","DOI":"10.1109\/CVPR.2019.00938"},{"key":"10.1016\/j.knosys.2026.116262_b60","series-title":"Proceedings of the IEEE\/CVF International Conference on Computer Vision","first-page":"1365","article-title":"Similarity-preserving knowledge distillation","author":"Tung","year":"2019"},{"key":"10.1016\/j.knosys.2026.116262_b61","series-title":"TimeDistill: Efficient long-term time series forecasting with MLP via cross-architecture distillation","author":"Ni","year":"2025"}],"container-title":["Knowledge-Based Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0950705126009883?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0950705126009883?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,6,8]],"date-time":"2026-06-08T12:04:35Z","timestamp":1780920275000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0950705126009883"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,7]]},"references-count":61,"alternative-id":["S0950705126009883"],"URL":"https:\/\/doi.org\/10.1016\/j.knosys.2026.116262","relation":{},"ISSN":["0950-7051"],"issn-type":[{"value":"0950-7051","type":"print"}],"subject":[],"published":{"date-parts":[[2026,7]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Multi-Scale Attention-Relation-Based Knowledge Distillation for real-time intrusion detection system in IoT networks","name":"articletitle","label":"Article Title"},{"value":"Knowledge-Based Systems","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.knosys.2026.116262","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier B.V. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"116262"}}