{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,14]],"date-time":"2026-04-14T20:00:15Z","timestamp":1776196815631,"version":"3.50.1"},"reference-count":53,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100021171","name":"Basic and Applied Basic Research Foundation of Guangdong Province","doi-asserted-by":"publisher","award":["2024A15150 11466"],"award-info":[{"award-number":["2024A15150 11466"]}],"id":[{"id":"10.13039\/501100021171","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100010256","name":"Guangzhou Municipal Science and Technology Project","doi-asserted-by":"publisher","award":["2023B01J0037"],"award-info":[{"award-number":["2023B01J0037"]}],"id":[{"id":"10.13039\/501100010256","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62271214"],"award-info":[{"award-number":["62271214"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Advanced Engineering Informatics"],"published-print":{"date-parts":[[2026,9]]},"DOI":"10.1016\/j.aei.2026.104660","type":"journal-article","created":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T13:46:19Z","timestamp":1775310379000},"page":"104660","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"PA","title":["Multimodal Generalized Defect Category Discovery in industrial scenarios via defect-aware representation guided calibrated clustering"],"prefix":"10.1016","volume":"74","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9562-5198","authenticated-orcid":false,"given":"Hao","family":"Cheng","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8603-6132","authenticated-orcid":false,"given":"Jiaxiang","family":"Luo","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0001-8652-1653","authenticated-orcid":false,"given":"Zilong","family":"Huang","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.aei.2026.104660_b1","doi-asserted-by":"crossref","DOI":"10.1016\/j.compind.2023.103990","article-title":"Industrial anomaly detection with domain shift: A real-world dataset and masked multi-scale reconstruction","volume":"151","author":"Zhang","year":"2023","journal-title":"Comput. Ind."},{"issue":"12","key":"10.1016\/j.aei.2026.104660_b2","doi-asserted-by":"crossref","first-page":"7448","DOI":"10.1109\/TII.2019.2958826","article-title":"PGA-Net: Pyramid feature fusion and global context attention network for automated surface defect detection","volume":"16","author":"Dong","year":"2020","journal-title":"IEEE Trans. Ind. Inf."},{"issue":"3","key":"10.1016\/j.aei.2026.104660_b3","first-page":"2271","article-title":"Unsupervised saliency detection of rail surface defects using stereoscopic images","volume":"17","author":"Niu","year":"2021","journal-title":"IEEE Trans. Ind. Inf."},{"key":"10.1016\/j.aei.2026.104660_b4","series-title":"Proc. Int. Joint Conf. Comput. Vis. Imag. Comput. Graph. Theory Appl.","first-page":"202","article-title":"The mvtec 3D-AD dataset for unsupervised 3D anomaly detection and localization","author":"Bergmann.","year":"2022"},{"key":"10.1016\/j.aei.2026.104660_b5","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2025.103240","article-title":"CPIR: Multimodal industrial anomaly detection via latent bridged cross-modal prediction and intra-modal reconstruction","volume":"65","author":"Shangguan","year":"2025","journal-title":"Adv. Eng. Inf."},{"key":"10.1016\/j.aei.2026.104660_b6","series-title":"Proc. IEEE Winter Conf. Appl. Comput. Vis.","first-page":"2592","article-title":"Asymmetric student-teacher networks for industrial anomaly detection","author":"Rudolph","year":"2023"},{"issue":"3","key":"10.1016\/j.aei.2026.104660_b7","doi-asserted-by":"crossref","first-page":"3986","DOI":"10.1109\/TII.2023.3318302","article-title":"A discrepancy aware framework for robust anomaly detection","volume":"20","author":"Cai","year":"2024","journal-title":"IEEE Trans. Ind. Inf."},{"key":"10.1016\/j.aei.2026.104660_b8","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"14298","article-title":"Towards total recall in industrial anomaly detection","author":"Roth","year":"2022"},{"key":"10.1016\/j.aei.2026.104660_b9","series-title":"Proc. IEEE Winter Conf. Appl. Comput. Vis","first-page":"5468","article-title":"Anomaly clustering: Grouping images into coherent clusters of anomaly types","author":"Sohn","year":"2023"},{"key":"10.1016\/j.aei.2026.104660_b10","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2025.103138","article-title":"Geometric spatial constraints network for slender and tiny surface defect detection","volume":"65","author":"Pu","year":"2025","journal-title":"Adv. Eng. Inf."},{"issue":"6","key":"10.1016\/j.aei.2026.104660_b11","doi-asserted-by":"crossref","first-page":"4874","DOI":"10.1109\/TMECH.2022.3167412","article-title":"Collaborative learning attention network based on RGB image and depth image for surface defect inspection of no-service rail","volume":"27","author":"Wang","year":"2022","journal-title":"IEEE-ASME Trans. Mechatron."},{"issue":"3","key":"10.1016\/j.aei.2026.104660_b12","doi-asserted-by":"crossref","first-page":"1694","DOI":"10.1109\/TII.2021.3085848","article-title":"Attention network for rail surface defect detection via consistency of intersection-over-union (IoU)-guided center-point estimation","volume":"18","author":"Ni","year":"2021","journal-title":"IEEE Trans. Ind. Inf."},{"key":"10.1016\/j.aei.2026.104660_b13","first-page":"1","article-title":"SMD anomaly detection: A self-supervised texture\u2013structure anomaly detection framework","volume":"71","author":"Luo","year":"2022","journal-title":"IEEE Trans. Instrum. Meas."},{"key":"10.1016\/j.aei.2026.104660_b14","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"7482","article-title":"Generalized category discovery","author":"Vaze","year":"2022"},{"key":"10.1016\/j.aei.2026.104660_b15","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"16590","article-title":"Parametric classification for generalized category discovery: A baseline study","author":"Wen","year":"2023"},{"key":"10.1016\/j.aei.2026.104660_b16","series-title":"Proc. Int. Conf. Learn. Represent.","first-page":"16028","article-title":"DebGCD: Debiased learning with distribution guidance for generalized category discovery","author":"Liu","year":"2025"},{"key":"10.1016\/j.aei.2026.104660_b17","doi-asserted-by":"crossref","first-page":"58625","DOI":"10.52202\/075280-2555","article-title":"Towards distribution-agnostic generalized category discovery","volume":"36","author":"Bai","year":"2023","journal-title":"Adv. Neural Inf. Process. Syst."},{"issue":"7","key":"10.1016\/j.aei.2026.104660_b18","doi-asserted-by":"crossref","first-page":"6022","DOI":"10.1109\/TPAMI.2025.3557502","article-title":"ProtoGCD: Unified and unbiased prototype learning for generalized category discovery","volume":"47","author":"Ma","year":"2025","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.aei.2026.104660_b19","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"4755","article-title":"AnomalyNCD: Towards novel anomaly class discovery in industrial scenarios","author":"Huang","year":"2025"},{"key":"10.1016\/j.aei.2026.104660_b20","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"7579","article-title":"Dynamic conceptional contrastive learning for generalized category discovery","author":"Pu","year":"2023"},{"key":"10.1016\/j.aei.2026.104660_b21","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"4182","article-title":"Uninformed students: Student-teacher anomaly detection with discriminative latent embeddings","author":"Bergmann","year":"2020"},{"key":"10.1016\/j.aei.2026.104660_b22","series-title":"Proc. IEEE Winter Conf. Appl. Comput. Vis.","first-page":"1906","article-title":"Same same but DifferNet: Semi-supervised defect detection with normalizing flows","author":"Rudolph","year":"2021"},{"key":"10.1016\/j.aei.2026.104660_b23","doi-asserted-by":"crossref","DOI":"10.1016\/j.patcog.2020.107706","article-title":"Reconstruction by inpainting for visual anomaly detection","volume":"112","author":"Zavrtanik","year":"2021","journal-title":"Pattern Recognit."},{"key":"10.1016\/j.aei.2026.104660_b24","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1016\/j.neucom.2020.11.018","article-title":"Unsupervised anomaly segmentation via deep feature reconstruction","volume":"424","author":"Shi","year":"2021","journal-title":"Neurocomputing"},{"key":"10.1016\/j.aei.2026.104660_b25","series-title":"Proc. AAAI Conf. Artif. Intell.","first-page":"8472","article-title":"A diffusion-based framework for multi-class anomaly detection","volume":"vol. 38","author":"He","year":"2024"},{"key":"10.1016\/j.aei.2026.104660_b26","doi-asserted-by":"crossref","first-page":"1329","DOI":"10.1109\/TIP.2023.3242775","article-title":"LSNet: Lightweight spatial boosting network for detecting salient objects in RGB-thermal images","volume":"32","author":"Zhou","year":"2023","journal-title":"IEEE Trans. Image Process."},{"key":"10.1016\/j.aei.2026.104660_b27","doi-asserted-by":"crossref","first-page":"3027","DOI":"10.1109\/TIP.2023.3275538","article-title":"WaveNet: Wavelet network with knowledge distillation for RGB-T salient object detection","volume":"32","author":"Zhou","year":"2023","journal-title":"IEEE Trans. Image Process."},{"issue":"3","key":"10.1016\/j.aei.2026.104660_b28","doi-asserted-by":"crossref","first-page":"1224","DOI":"10.1109\/TCSVT.2021.3077058","article-title":"ECFFNet: Effective and consistent feature fusion network for RGB-T salient object detection","volume":"32","author":"Zhou","year":"2022","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"10.1016\/j.aei.2026.104660_b29","doi-asserted-by":"crossref","first-page":"2192","DOI":"10.1109\/TMM.2021.3077767","article-title":"CCAFNet: Crossflow and cross-scale adaptive fusion network for detecting salient objects in RGB-D images","volume":"24","author":"Zhou","year":"2022","journal-title":"IEEE Trans. Multimed."},{"key":"10.1016\/j.aei.2026.104660_b30","first-page":"1","article-title":"RCNet: Dual-network resonance collaboration via mutual learning for RGB-D road defect detection","author":"Zhou","year":"2025","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"issue":"7","key":"10.1016\/j.aei.2026.104660_b31","doi-asserted-by":"crossref","first-page":"9276","DOI":"10.1109\/JIOT.2024.3506624","article-title":"Hybrid knowledge distillation for RGB-T crowd density estimation in smart surveillance systems","volume":"12","author":"Zhou","year":"2025","journal-title":"IEEE Internet Things J."},{"issue":"8","key":"10.1016\/j.aei.2026.104660_b32","doi-asserted-by":"crossref","first-page":"4140","DOI":"10.1109\/TCSI.2024.3521933","article-title":"Knowledge distillation and contrastive learning for detecting visible-infrared transmission lines using separated stagger registration network","volume":"72","author":"Zhou","year":"2025","journal-title":"IEEE Trans. Circuits Syst. I. Regul. Pap."},{"key":"10.1016\/j.aei.2026.104660_b33","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"19606","article-title":"Winclip: Zero-\/few-shot anomaly classification and segmentation","author":"Jeong","year":"2023"},{"key":"10.1016\/j.aei.2026.104660_b34","doi-asserted-by":"crossref","unstructured":"Y. Cao, J. Zhang, L. Frittoli, Y. Cheng, W. Shen, G. Boracchi, Adaclip: Adapting clip with hybrid learnable prompts for zero-shot anomaly detection, in: Proc. Eur. Conf. Comput. Vis., 2024, pp. 55\u201372.","DOI":"10.1007\/978-3-031-72761-0_4"},{"key":"10.1016\/j.aei.2026.104660_b35","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"8032","article-title":"Multimodal industrial anomaly detection via hybrid fusion","author":"Wang","year":"2023"},{"key":"10.1016\/j.aei.2026.104660_b36","unstructured":"Y.-M. Chu, C. Liu, T.-I. Hsieh, H.-T. Chen, T.-L. Liu, Shape-Guided Dual-Memory Learning for 3D Anomaly Detection, in: Proc. Int. Conf. Mach. Learn., 2023, pp. 6185\u20136194."},{"key":"10.1016\/j.aei.2026.104660_b37","doi-asserted-by":"crossref","unstructured":"A. Costanzino, P.Z. Ramirez, G. Lisanti, L. Di Stefano, Multimodal industrial anomaly detection by crossmodal feature mapping, in: Proc. IEEE Conf. Comput. Vis. Pattern Recognit., 2024, pp. 17234\u201317243.","DOI":"10.1109\/CVPR52733.2024.01631"},{"issue":"6","key":"10.1016\/j.aei.2026.104660_b38","doi-asserted-by":"crossref","first-page":"5000","DOI":"10.1109\/TII.2025.3552723","article-title":"Multimodal industrial anomaly detection via uni-modal and cross-modal fusion","volume":"21","author":"Cheng","year":"2025","journal-title":"IEEE Trans. Ind. Inf."},{"key":"10.1016\/j.aei.2026.104660_b39","unstructured":"A. Radford, J.W. Kim, C. Hallacy, A. Ramesh, G. Goh, S. Agarwal, G. Sastry, A. Askell, P. Mishkin, J. Clark, et al., Learning transferable visual models from natural language supervision, in: Proc. Int. Conf. Mach. Learn., 2021, pp. 8748\u20138763."},{"issue":"1","key":"10.1016\/j.aei.2026.104660_b40","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1023\/A:1011126920638","article-title":"Representing and recognizing the visual appearance of materials using three-dimensional textons","volume":"43","author":"Leung","year":"2001","journal-title":"Int. J. Comput. Vis."},{"key":"10.1016\/j.aei.2026.104660_b41","series-title":"Proc. IEEE Int. Conf. Comput. Vis.","first-page":"9864","article-title":"Invariant information clustering for unsupervised image classification and segmentation","author":"Ji","year":"2019"},{"key":"10.1016\/j.aei.2026.104660_b42","doi-asserted-by":"crossref","unstructured":"C. Niu, J. Zhang, G. Wang, J. Liang, Gatcluster: Self-supervised gaussian-attention network for image clustering, in: Proc. Eur. Conf. Comput. Vis., 2020, pp. 735\u2013751.","DOI":"10.1007\/978-3-030-58595-2_44"},{"key":"10.1016\/j.aei.2026.104660_b43","doi-asserted-by":"crossref","unstructured":"W. Van Gansbeke, S. Vandenhende, S. Georgoulis, M. Proesmans, L. Van Gool, Scan: Learning to classify images without labels, in: Proc. Eur. Conf. Comput. Vis, 2020, pp. 268\u2013285.","DOI":"10.1007\/978-3-030-58607-2_16"},{"key":"10.1016\/j.aei.2026.104660_b44","doi-asserted-by":"crossref","unstructured":"Y. Pang, W. Wang, F.E. Tay, W. Liu, Y. Tian, L. Yuan, Masked autoencoders for point cloud self-supervised learning, in: Proc. Eur. Conf. Comput. Vis., 2022, pp. 604\u2013621.","DOI":"10.1007\/978-3-031-20086-1_35"},{"issue":"1","key":"10.1016\/j.aei.2026.104660_b45","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/2733381","article-title":"Hierarchical density estimates for data clustering, visualization, and outlier detection","volume":"10","author":"Campello","year":"2015","journal-title":"ACM Trans. Knowl. Discov. Data"},{"key":"10.1016\/j.aei.2026.104660_b46","article-title":"Co-regularized multi-view spectral clustering","volume":"24","author":"Kumar","year":"2011","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.aei.2026.104660_b47","doi-asserted-by":"crossref","unstructured":"L. Bonfiglioli, M. Toschi, D. Silvestri, N. Fioraio, D. De Gregorio, The Eyecandies Dataset for Unsupervised Multimodal Anomaly Detection and Localization, in: Proceedings of the 16th Asian Conference on Computer Vision, 2022, ACCV.","DOI":"10.1007\/978-3-031-26348-4_27"},{"key":"10.1016\/j.aei.2026.104660_b48","series-title":"Proc. IEEE Conf. Comput. Vis. Pattern Recognit.","first-page":"9584","article-title":"MVTec AD \u2014 A comprehensive real-world dataset for unsupervised anomaly detection","author":"Bergmann","year":"2019"},{"key":"10.1016\/j.aei.2026.104660_b49","series-title":"Proc. IEEE Int. Conf. Comput. Vis.","first-page":"9630","article-title":"Emerging properties in self-supervised vision transformers","author":"Caron","year":"2021"},{"key":"10.1016\/j.aei.2026.104660_b50","doi-asserted-by":"crossref","DOI":"10.1016\/j.compind.2023.103990","article-title":"Industrial anomaly detection with domain shift: A real-world dataset and masked multi-scale reconstruction","volume":"151","author":"Zhang","year":"2023","journal-title":"Comput. Ind."},{"key":"10.1016\/j.aei.2026.104660_b51","unstructured":"X. Li, Z. Huang, F. Xue, Y. Zhou, Musc: Zero-shot industrial anomaly classification and segmentation with mutual scoring of the unlabeled images, in: The Twelfth International Conference on Learning Representations, 2024."},{"key":"10.1016\/j.aei.2026.104660_b52","doi-asserted-by":"crossref","first-page":"5606","DOI":"10.1109\/TIP.2024.3448263","article-title":"Target before shooting: Accurate anomaly detection and localization under one millisecond via cascade patch retrieval","volume":"33","author":"Li","year":"2024","journal-title":"IEEE Trans. Image Process."},{"key":"10.1016\/j.aei.2026.104660_b53","series-title":"Adv. Neural Inf. Process. Syst.","first-page":"30402","article-title":"Real3D-AD: A dataset of point cloud anomaly detection","volume":"vol. 36","author":"Liu","year":"2023"}],"container-title":["Advanced Engineering Informatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1474034626003526?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1474034626003526?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,4,14]],"date-time":"2026-04-14T19:06:52Z","timestamp":1776193612000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1474034626003526"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,9]]},"references-count":53,"alternative-id":["S1474034626003526"],"URL":"https:\/\/doi.org\/10.1016\/j.aei.2026.104660","relation":{},"ISSN":["1474-0346"],"issn-type":[{"value":"1474-0346","type":"print"}],"subject":[],"published":{"date-parts":[[2026,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Multimodal Generalized Defect Category Discovery in industrial scenarios via defect-aware representation guided calibrated clustering","name":"articletitle","label":"Article Title"},{"value":"Advanced Engineering Informatics","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.aei.2026.104660","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Ltd. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"104660"}}