{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,16]],"date-time":"2026-05-16T01:39:45Z","timestamp":1778895585137,"version":"3.51.4"},"reference-count":33,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T00:00:00Z","timestamp":1762473600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T00:00:00Z","timestamp":1762473600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Shandong Province Natural Science Foundation of China","award":["ZR2022ME194"],"award-info":[{"award-number":["ZR2022ME194"]}]},{"name":"Shandong Energy Group Technology Project","award":["YK2023B47-R45"],"award-info":[{"award-number":["YK2023B47-R45"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Real-Time Image Proc"],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1007\/s11554-025-01800-0","type":"journal-article","created":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T11:30:40Z","timestamp":1762515040000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["A lightweight transformer-based framework for real-time foreign object detection in complex railway environments"],"prefix":"10.1007","volume":"23","author":[{"given":"Zhe","family":"Dong","sequence":"first","affiliation":[]},{"given":"Qing","family":"Yang","sequence":"additional","affiliation":[]},{"given":"HaoLin","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Heng","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"Dexin","family":"Gao","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,11,7]]},"reference":[{"issue":"1","key":"1800_CR1","doi-asserted-by":"publisher","first-page":"136","DOI":"10.1186\/s44147-025-00708-7","volume":"72","author":"H Niu","year":"2025","unstructured":"Niu, H., Feng, D., Hou, T.: Research on foreign object intrusion detection in railway tracks based on MSL-YOLO. J. Eng. Appl. Sci. 72(1), 136 (2025)","journal-title":"J. Eng. Appl. Sci."},{"key":"1800_CR2","doi-asserted-by":"crossref","unstructured":"Qu, Y., Wang, B., Qiu, R., Zheng, C.: The research and realization of contactless collision early warning assistant system. In: Proceedings of the 2015 International Conference on Electrical and Information Technologies for Rail Transportation: Transportation, pp. 147\u2013154 (2016)","DOI":"10.1007\/978-3-662-49370-0_15"},{"issue":"2","key":"1800_CR3","doi-asserted-by":"publisher","first-page":"316","DOI":"10.1007\/s11367-021-02012-x","volume":"27","author":"C Liljenstr\u00f6m","year":"2022","unstructured":"Liljenstr\u00f6m, C., Bj\u00f6rklund, A., Toller, S.: Including maintenance in life cycle assessment of road and rail infrastructure\u2014a literature review. Int. J. Life Cycle Assess. 27(2), 316\u2013341 (2022)","journal-title":"Int. J. Life Cycle Assess."},{"key":"1800_CR4","doi-asserted-by":"crossref","unstructured":"Girshick, R.: Fast R-CNN. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1440\u20131448 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"key":"1800_CR5","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster R-CNN: towards real-time object detection with region proposal networks. In: Advances in Neural Information Processing Systems, vol. 28 (2015)"},{"key":"1800_CR6","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.-Y., Berg, A. C.: SSD: single shot multibox detector. In: European Conference on Computer Vision, pp. 21\u201337 (2016)","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"1800_CR7","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"1800_CR8","first-page":"107984","volume":"37","author":"A Wang","year":"2024","unstructured":"Wang, A., Chen, H., Liu, L., Chen, K., Lin, Z., Han, J., et al.: YOLOv10: real-time end-to-end object detection. Adv. Neural. Inf. Process. Syst. 37, 107984\u2013108011 (2024)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1800_CR9","unstructured":"Li, C., Li, L., Jiang, H., Weng, K., Geng, Y., Li, L., Ke, Z., Li, Q., Cheng, M., Nie, W. et al.: YOLOv6: a single-stage object detection framework for industrial applications. arXiv preprint arXiv:2209.02976 (2022)"},{"key":"1800_CR10","doi-asserted-by":"publisher","first-page":"24330","DOI":"10.1109\/TITS.2022.3203715","volume":"23","author":"J Shen","year":"2022","unstructured":"Shen, J., Zhou, W., Liu, N., Sun, H., Li, D., Zhang, Y.: An anchor-free lightweight deep convolutional network for vehicle detection in aerial images. IEEE Trans. Intell. Transp. Syst. 23, 24330\u201324342 (2022)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"1800_CR11","first-page":"1","volume":"73","author":"J Shen","year":"2024","unstructured":"Shen, J., Liu, N., Sun, H., Li, D., Zhang, Y.: An instrument indication acquisition algorithm based on lightweight deep convolutional neural network and hybrid attention fine-grained features. IEEE Trans. Instrum. Meas. 73, 1\u201316 (2024)","journal-title":"IEEE Trans. Instrum. Meas."},{"key":"1800_CR12","first-page":"1","volume":"71","author":"J Shen","year":"2021","unstructured":"Shen, J., Liu, N., Xu, C., Sun, H., Xiao, Y., Li, D., Zhang, Y.: Finger vein recognition algorithm based on lightweight deep convolutional neural network. IEEE Trans. Instrum. Meas. 71, 1\u201313 (2021)","journal-title":"IEEE Trans. Instrum. Meas."},{"issue":"5","key":"1800_CR13","doi-asserted-by":"publisher","first-page":"368","DOI":"10.1007\/s11760-025-03958-3","volume":"19","author":"W Gu","year":"2025","unstructured":"Gu, W., Gao, W., Zou, Y., Ma, S.: ATW-YOLO: reconstructing the downsampling process and attention mechanism of YOLO network for rail foreign body detection. SIViP 19(5), 368 (2025)","journal-title":"SIViP"},{"key":"1800_CR14","doi-asserted-by":"crossref","unstructured":"Liu, Z., Li, P.: Detection of foreign object encroachment limit in railroad based on improved YOLOv11 algorithm. In: 2025 IEEE 7th International Conference on Communications, Information System and Computer Engineering (CISCE), pp. 908\u2013912 (2025)","DOI":"10.1109\/CISCE65916.2025.11064992"},{"key":"1800_CR15","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A. N., Kaiser, \u0141., Polosukhin, I.: Attention is all you need. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"issue":"12","key":"1800_CR16","doi-asserted-by":"publisher","first-page":"24330","DOI":"10.1109\/TITS.2022.3203715","volume":"23","author":"J Shen","year":"2022","unstructured":"Shen, J., Zhou, W., Liu, N., Sun, H., Li, D., Zhang, Y.: An anchor-free lightweight deep convolutional network for vehicle detection in aerial images. IEEE Trans. Intell. Transp. Syst. 23(12), 24330\u201324342 (2022)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"1800_CR17","doi-asserted-by":"crossref","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers. In: European Conference on Computer Vision, pp. 213\u2013229 (2020)","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"1800_CR18","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Lv, W., Xu, S., Wei, J., Wang, G., Dang, Q., Liu, Y., Chen, J.: DETRs beat YOLOs on real-time object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16965\u201316974 (2024)","DOI":"10.1109\/CVPR52733.2024.01605"},{"key":"1800_CR19","doi-asserted-by":"crossref","unstructured":"Liu, X., Huang, R., Cai, J., Yang, X., Xie, Z.: Feasibility analysis of RT-DETR in the context of foreign object intrusion at railway boundaries. In: International Conference on Electrical and Information Technologies for Rail Transportation, pp. 538\u2013545 (2023)","DOI":"10.1007\/978-981-99-9319-2_60"},{"issue":"4","key":"1800_CR20","doi-asserted-by":"publisher","first-page":"146","DOI":"10.1007\/s11554-024-01530-9","volume":"21","author":"C Yu","year":"2024","unstructured":"Yu, C., Chen, X.: Railway rutting defects detection based on improved RT-DETR. J. Real-Time Image Proc. 21(4), 146 (2024)","journal-title":"J. Real-Time Image Proc."},{"key":"1800_CR21","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2025.3589159","author":"P Li","year":"2025","unstructured":"Li, P., Peng, Y., Wang, S.-M., Zhong, C.: Improved RT-DETR framework for railway obstacle detection. IEEE Access (2025). https:\/\/doi.org\/10.1109\/ACCESS.2025.3589159","journal-title":"IEEE Access"},{"key":"1800_CR22","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"1800_CR23","doi-asserted-by":"crossref","unstructured":"Yao, T., Li, Y., Pan, Y., Mei, T.: HGNet: learning hierarchical geometry from points, edges, and surfaces. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 21846\u201321855 (2023)","DOI":"10.1109\/CVPR52729.2023.02092"},{"key":"1800_CR24","doi-asserted-by":"publisher","first-page":"1169","DOI":"10.1109\/TIP.2020.3042065","volume":"30","author":"T Wu","year":"2020","unstructured":"Wu, T., Tang, S., Zhang, R., Cao, J., Zhang, Y.: CGNet: a light-weight context guided network for semantic segmentation. IEEE Trans. Image Process. 30, 1169\u20131179 (2020)","journal-title":"IEEE Trans. Image Process."},{"key":"1800_CR25","doi-asserted-by":"crossref","unstructured":"Liu, W., Lu, H., Fu, H., Cao, Z.: Learning to upsample by learning to sample. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6027\u20136037 (2023)","DOI":"10.1109\/ICCV51070.2023.00554"},{"issue":"2","key":"1800_CR26","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham, M., Van Gool, L., Williams, C.K.I., Winn, J., Zisserman, A.: The PASCAL visual object classes (VOC) challenge. Int. J. Comput. Vis. 88(2), 303\u2013338 (2010)","journal-title":"Int. J. Comput. Vis."},{"key":"1800_CR27","first-page":"9969","volume":"35","author":"Y Tang","year":"2022","unstructured":"Tang, Y., Han, K., Guo, J., Xu, C., Xu, C., Wang, Y.: GhostNetV2: enhance cheap operation with long-range attention. Adv. Neural. Inf. Process. Syst. 35, 9969\u20139982 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1800_CR28","unstructured":"Narayanan, M.: SENetV2: aggregated dense layer for channelwise and global representations. arXiv preprint arXiv:2311.10807 (2023)"},{"key":"1800_CR29","doi-asserted-by":"crossref","unstructured":"Wang, J., Chen, K., Xu, R., Liu, Z., Loy, C.C., Lin, D.: CARAFE: content-aware reassembly of features. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3007\u20133016 (2019)","DOI":"10.1109\/ICCV.2019.00310"},{"key":"1800_CR30","doi-asserted-by":"crossref","unstructured":"Tan, M., Pang, R., Le, Q. V.: EfficientDet: scalable and efficient object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10781\u201310790 (2020)","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"1800_CR31","unstructured":"Xu, X., Jiang, Y., Chen, W., Huang, Y., Zhang, Y., Sun, X.: DAMO-YOLO: a report on real-time object detection design. arXiv preprint arXiv:2211.15444 (2022)"},{"key":"1800_CR32","doi-asserted-by":"crossref","unstructured":"Yang, Z., Guan, Q., Zhao, K., Yang, J., Xu, X., Long, H., Tang, Y.: Multi-branch auxiliary fusion YOLO with re-parameterization heterogeneous convolutional for accurate object detection. In: Chinese Conference on Pattern Recognition and Computer Vision (PRCV), pp. 492\u2013505 (2024)","DOI":"10.1007\/978-981-97-8858-3_34"},{"key":"1800_CR33","doi-asserted-by":"crossref","unstructured":"Varghese, R., Sambath, M.: YOLOv8: a novel object detection algorithm with enhanced performance and robustness. In: 2024 International Conference on Advances in Data Engineering and Intelligent Computing Systems (ADICS), pp. 1\u20136 (2024)","DOI":"10.1109\/ADICS58448.2024.10533619"}],"container-title":["Journal of Real-Time Image Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-025-01800-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11554-025-01800-0","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-025-01800-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,6]],"date-time":"2026-02-06T16:48:20Z","timestamp":1770396500000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11554-025-01800-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,7]]},"references-count":33,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,2]]}},"alternative-id":["1800"],"URL":"https:\/\/doi.org\/10.1007\/s11554-025-01800-0","relation":{},"ISSN":["1861-8200","1861-8219"],"issn-type":[{"value":"1861-8200","type":"print"},{"value":"1861-8219","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,11,7]]},"assertion":[{"value":"26 September 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 November 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 November 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"The type of research in this paper does not involve ethical issues. Informed consent was obtained from all authors for the publication of this article.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}}],"article-number":"3"}}