{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T14:18:30Z","timestamp":1778249910631,"version":"3.51.4"},"reference-count":40,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Expert Systems with Applications"],"published-print":{"date-parts":[[2026,9]]},"DOI":"10.1016\/j.eswa.2026.132502","type":"journal-article","created":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T17:52:20Z","timestamp":1777571540000},"page":"132502","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["Adaptive frequency modulated transformer for industrial surface defect detection"],"prefix":"10.1016","volume":"325","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-6119-4738","authenticated-orcid":false,"given":"Lei","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4007-4501","authenticated-orcid":false,"given":"Xiaoqian","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-7445-9593","authenticated-orcid":false,"given":"Zejun","family":"Huang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-3286-7227","authenticated-orcid":false,"given":"Shijie","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-1025-0236","authenticated-orcid":false,"given":"Huan","family":"Yuan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-9132-938X","authenticated-orcid":false,"given":"Wenlong","family":"Qiu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/j.eswa.2026.132502_bib0001","doi-asserted-by":"crossref","DOI":"10.1115\/1.4049535","article-title":"Image-based surface defect detection using deep learning: A review","volume":"21","author":"Bhatt","year":"2021","journal-title":"Journal of Computing and Information Science in Engineering"},{"key":"10.1016\/j.eswa.2026.132502_bib0002","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","first-page":"6154","article-title":"Cascade R-CNN: Delving into high quality object detection","author":"Cai","year":"2018"},{"key":"10.1016\/j.eswa.2026.132502_bib0003","series-title":"European conference on computer vision","first-page":"213","article-title":"End-to-end object detection with transformers","author":"Carion","year":"2020"},{"key":"10.1016\/j.eswa.2026.132502_bib0004","unstructured":"Zhu, X., Su, W., Lu, L., Li, B., Wang, X., & Dai, J. (2020). Deformable DETR: Deformable transformers for end-to-end object detection. arXiv: 2010.04159."},{"key":"10.1016\/j.eswa.2026.132502_bib0005","series-title":"Computer vision and pattern recognition","first-page":"1","article-title":"YOLOv3: An incremental improvement","author":"Farhadi","year":"2018"},{"key":"10.1016\/j.eswa.2026.132502_bib0006","series-title":"2021 IEEE\/CVF international conference on computer vision (ICCV)","first-page":"3490","article-title":"Tood: Task-aligned one-stage object detection","author":"Feng","year":"2021"},{"key":"10.1016\/j.eswa.2026.132502_bib0007","series-title":"Proceedings of the IEEE international conference on computer vision","first-page":"1440","article-title":"Fast R-CNN","author":"Girshick","year":"2015"},{"key":"10.1016\/j.eswa.2026.132502_bib0008","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","first-page":"580","article-title":"Rich feature hierarchies for accurate object detection and semantic segmentation","author":"Girshick","year":"2014"},{"issue":"6","key":"10.1016\/j.eswa.2026.132502_bib0009","doi-asserted-by":"crossref","first-page":"610","DOI":"10.1109\/TSMC.1973.4309314","article-title":"Textural features for image classification","volume":"SMC-3","author":"Haralick","year":"1973","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics"},{"key":"10.1016\/j.eswa.2026.132502_bib0010","series-title":"Proceedings of the IEEE international conference on computer vision","first-page":"2961","article-title":"Mask R-CNN","author":"He","year":"2017"},{"key":"10.1016\/j.eswa.2026.132502_bib0011","unstructured":"Jocher, G. (2020). YOLOv5 by Ultralytics. https:\/\/github.com\/ultralytics\/yolov5. 10.5281\/zenodo.3908559."},{"key":"10.1016\/j.eswa.2026.132502_bib0012","unstructured":"Jocher, G., Chaurasia, A., & Qiu, J. (2023). Ultralytics YOLOv8. https:\/\/github.com\/ultralytics\/ultralytics. Accessed: [Insert Access Date]."},{"key":"10.1016\/j.eswa.2026.132502_bib0013","unstructured":"Jocher, G., & Qiu, J. (2024). Ultralytics YOLOv11. https:\/\/github.com\/ultralytics\/ultralytics. Version 11.0.0, License: AGPL-3.0."},{"key":"10.1016\/j.eswa.2026.132502_bib0014","series-title":"Proceedings of the 2022 conference of the North American chapter of the association for computational linguistics: Human language technologies","first-page":"4296","article-title":"FNet: Mixing tokens with fourier transforms","author":"Lee-Thorp","year":"2022"},{"key":"10.1016\/j.eswa.2026.132502_bib0015","unstructured":"Li, C., Li, L., Jiang, H., Weng, K., Geng, Y., Li, L., Ke, Z., Li, Q., Cheng, M., Nie, W. et al. (2022). YOLOv6: A single-stage object detection framework for industrial applications. arXiv: 2209.02976."},{"key":"10.1016\/j.eswa.2026.132502_bib0016","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","first-page":"2117","article-title":"Feature pyramid networks for object detection","author":"Lin","year":"2017"},{"key":"10.1016\/j.eswa.2026.132502_bib0017","series-title":"Proceedings of the IEEE international conference on computer vision","first-page":"2980","article-title":"Focal loss for dense object detection","author":"Lin","year":"2017"},{"key":"10.1016\/j.eswa.2026.132502_bib0018","series-title":"European conference on computer vision","first-page":"21","article-title":"SSD: Single shot multibox detector","author":"Liu","year":"2016"},{"key":"10.1016\/j.eswa.2026.132502_bib0019","series-title":"Proceedings of the IEEE\/CVF international conference on computer vision","first-page":"10012","article-title":"Swin transformer: Hierarchical vision transformer using shifted windows","author":"Liu","year":"2021"},{"key":"10.1016\/j.eswa.2026.132502_bib0020","doi-asserted-by":"crossref","first-page":"626","DOI":"10.1109\/TIM.2019.2963555","article-title":"Automated visual defect detection for flat steel surface: A survey","volume":"69","author":"Luo","year":"2020","journal-title":"IEEE Transactions on Instrumentation and Measurement"},{"key":"10.1016\/j.eswa.2026.132502_bib0021","doi-asserted-by":"crossref","first-page":"837","DOI":"10.1109\/34.531803","article-title":"Texture features for browsing and retrieval of image data","volume":"18","author":"Manjunath","year":"2002","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"10.1016\/j.eswa.2026.132502_bib0022","series-title":"Proceedings of the IEEE\/CVF international conference on computer vision","first-page":"3651","article-title":"Conditional detr for fast training convergence","author":"Meng","year":"2021"},{"key":"10.1016\/j.eswa.2026.132502_bib0023","doi-asserted-by":"crossref","first-page":"971","DOI":"10.1109\/TPAMI.2002.1017623","article-title":"Multiresolution gray-scale and rotation invariant texture classification with local binary patterns","volume":"24","author":"Ojala","year":"2002","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"10.1016\/j.eswa.2026.132502_bib0024","series-title":"2025 IEEE\/CVF winter conference on applications of computer vision (wacv)","first-page":"9543","article-title":"SpectFormer: Frequency and attention is what you need in a vision transformer","author":"Patro","year":"2025"},{"key":"10.1016\/j.eswa.2026.132502_bib0025","series-title":"Proceedings of the IEEE\/CVF international conference on computer vision","first-page":"783","article-title":"FCANet: Frequency channel attention networks","author":"Qin","year":"2021"},{"key":"10.1016\/j.eswa.2026.132502_bib0026","series-title":"Advances in neural information processing systems","first-page":"980","article-title":"Global filter networks for image classification","volume":"vol. 34","author":"Rao","year":"2021"},{"key":"10.1016\/j.eswa.2026.132502_bib0027","series-title":"Proceedings of the IEEE\/CVF international conference on computer vision","first-page":"4308","article-title":"Learning frequency-aware dynamic network for efficient super-resolution","author":"Xie","year":"2021"},{"key":"10.1016\/j.eswa.2026.132502_bib0028","series-title":"Advances in neural information processing systems","article-title":"Faster R-CNN: Towards real-time object detection with region proposal networks","volume":"vol. 28","author":"Ren","year":"2015"},{"key":"10.1016\/j.eswa.2026.132502_bib0029","doi-asserted-by":"crossref","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","article-title":"Faster R-CNN: Towards real-time object detection with region proposal networks","volume":"39","author":"Ren","year":"2016","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"10.1016\/j.eswa.2026.132502_bib0030","doi-asserted-by":"crossref","first-page":"759","DOI":"10.1007\/s10845-019-01476-x","article-title":"Segmentation-based deep-learning approach for surface-defect detection","volume":"31","author":"Tabernik","year":"2020","journal-title":"Journal of Intelligent Manufacturing"},{"key":"10.1016\/j.eswa.2026.132502_bib0031","series-title":"Proceedings of the IEEE\/CVF international conference on computer vision","first-page":"9627","article-title":"FCOS: Fully convolutional one-stage object detection","author":"Tian","year":"2019"},{"key":"10.1016\/j.eswa.2026.132502_bib0032","unstructured":"Wang, A., Chen, H., L.L., & et al. (2024a). YOLOv10: Real-time end-to-end object detection. arXiv preprint arXiv: 2405.14458."},{"key":"10.1016\/j.eswa.2026.132502_bib0033","series-title":"European conference on computer vision","first-page":"1","article-title":"YOLOv9: Learning what you want to learn using programmable gradient information","author":"Wang","year":"2024"},{"key":"10.1016\/j.eswa.2026.132502_bib0034","doi-asserted-by":"crossref","first-page":"144","DOI":"10.1016\/j.jmsy.2018.01.003","article-title":"Deep learning for smart manufacturing: Methods and applications","volume":"48","author":"Wang","year":"2018","journal-title":"Journal of Manufacturing Systems"},{"key":"10.1016\/j.eswa.2026.132502_bib0035","doi-asserted-by":"crossref","first-page":"1","DOI":"10.5565\/rev\/elcvia.268","article-title":"A review of recent advances in surface defect detection using texture analysis techniques","author":"Xie","year":"2008","journal-title":"ELCVIA: Electronic letters on computer vision and image analysis"},{"key":"10.1016\/j.eswa.2026.132502_bib0036","doi-asserted-by":"crossref","first-page":"284","DOI":"10.1109\/TSM.2010.2046108","article-title":"A wavelet-based approach in detecting visual defects on semiconductor wafer dies","volume":"23","author":"Yeh","year":"2010","journal-title":"IEEE Transactions on Semiconductor Manufacturing"},{"key":"10.1016\/j.eswa.2026.132502_bib0037","unstructured":"Zhang, H., Li, F., Liu, S., Zhang, L., Su, H., Zhu, J., Ni, L., & Shum, H. (2022). DINO: DETR with improved denoising anchor boxes for end-to-end object detection. arXiv: 2203.03605."},{"key":"10.1016\/j.eswa.2026.132502_bib0038","series-title":"Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","first-page":"8514","article-title":"VarifocalNet: An IoU-aware dense object detector","author":"Zhang","year":"2021"},{"key":"10.1016\/j.eswa.2026.132502_bib0039","series-title":"Advances in neural information processing systems","first-page":"15475","article-title":"Rest: An efficient transformer for visual recognition","volume":"vol. 34","author":"Zhang","year":"2021"},{"key":"10.1016\/j.eswa.2026.132502_bib0040","series-title":"Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","first-page":"16965","article-title":"DETRS beat yolos on real-time object detection","author":"Zhao","year":"2024"}],"container-title":["Expert Systems with Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0957417426014156?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0957417426014156?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T14:04:24Z","timestamp":1778249064000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0957417426014156"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,9]]},"references-count":40,"alternative-id":["S0957417426014156"],"URL":"https:\/\/doi.org\/10.1016\/j.eswa.2026.132502","relation":{},"ISSN":["0957-4174"],"issn-type":[{"value":"0957-4174","type":"print"}],"subject":[],"published":{"date-parts":[[2026,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Adaptive frequency modulated transformer for industrial surface defect detection","name":"articletitle","label":"Article Title"},{"value":"Expert Systems with Applications","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.eswa.2026.132502","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Ltd. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"132502"}}