{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,15]],"date-time":"2026-01-15T07:51:03Z","timestamp":1768463463083,"version":"3.49.0"},"reference-count":52,"publisher":"Springer Science and Business Media LLC","issue":"10","license":[{"start":{"date-parts":[[2025,9,1]],"date-time":"2025-09-01T00:00:00Z","timestamp":1756684800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,9,1]],"date-time":"2025-09-01T00:00:00Z","timestamp":1756684800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62372242"],"award-info":[{"award-number":["62372242"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Complex Intell. Syst."],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1007\/s40747-025-02072-8","type":"journal-article","created":{"date-parts":[[2025,9,1]],"date-time":"2025-09-01T07:33:01Z","timestamp":1756711981000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Starnet-tex: lightweight real-time text detection via middle-order enhanced contextual attention"],"prefix":"10.1007","volume":"11","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-1661-8714","authenticated-orcid":false,"given":"Zheng","family":"Hu","sequence":"first","affiliation":[]},{"given":"Yingnan","family":"Zhao","sequence":"additional","affiliation":[]},{"given":"Zuguo","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Jielin","family":"Jiang","sequence":"additional","affiliation":[]},{"given":"Xiaolong","family":"Xu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,9,1]]},"reference":[{"issue":"3","key":"2072_CR1","doi-asserted-by":"publisher","first-page":"3229","DOI":"10.1007\/s40747-022-00916-1","volume":"9","author":"H Heng","year":"2023","unstructured":"Heng H, Li P, Guan T, Yang T (2023) Scene text recognition via context modeling for low-quality image in logistics industry. Complex Intell Syst 9(3):3229\u20133248","journal-title":"Complex Intell Syst"},{"issue":"1","key":"2072_CR2","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1007\/s11263-020-01369-0","volume":"129","author":"S Long","year":"2021","unstructured":"Long S, He X, Yao C (2021) Scene text detection and recognition: the deep learning era. Int J Comput Vis 129(1):161\u2013184","journal-title":"Int J Comput Vis"},{"key":"2072_CR3","doi-asserted-by":"crossref","unstructured":"Xiong B, Grauman K (2016) Text detection in stores using a repetition prior. In: 2016 IEEE Winter Conference on Applications of Computer Vision (WACV), pp. 1\u20139. IEEE","DOI":"10.1109\/WACV.2016.7477575"},{"key":"2072_CR4","doi-asserted-by":"crossref","unstructured":"Liao M, Shi B, Bai X, Wang X, Liu W (2017) Textboxes: A fast text detector with a single deep neural network. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 31","DOI":"10.1609\/aaai.v31i1.11196"},{"key":"2072_CR5","doi-asserted-by":"crossref","unstructured":"Jiang Y, Zhu X, Wang X, Yang S, Li W, Wang H, Fu P, Luo Z (2017) R2cnn: Rotational region cnn for orientation robust scene text detection. arXiv preprint arXiv:1706.09579","DOI":"10.1109\/ICPR.2018.8545598"},{"key":"2072_CR6","doi-asserted-by":"crossref","unstructured":"He W, Zhang X-Y, Yin F, Liu C-L (2017) Deep direct regression for multi-oriented scene text detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 745\u2013753","DOI":"10.1109\/ICCV.2017.87"},{"key":"2072_CR7","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu C-Y, Berg AC (2016) Ssd: Single shot multibox detector. In: Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14, pp. 21\u201337. Springer","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"2072_CR8","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in neural information processing systems 28"},{"key":"2072_CR9","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2024.126159","volume":"267","author":"B Zhu","year":"2025","unstructured":"Zhu B, Chen X, Tang Q, Chen CP, Liu F (2025) Ek-net++: real-time scene text detection with expand kernel distance and epoch adaptive weight. Expert Syst Appl 267:126159","journal-title":"Expert Syst Appl"},{"key":"2072_CR10","doi-asserted-by":"crossref","unstructured":"Deng D, Liu H, Li X, Cai D (2018) Pixellink: Detecting scene text via instance segmentation. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 32","DOI":"10.1609\/aaai.v32i1.12269"},{"key":"2072_CR11","doi-asserted-by":"crossref","unstructured":"Wang K, Liew JH, Zou Y, Zhou D, Feng J (2019) Panet: Few-shot image semantic segmentation with prototype alignment. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9197\u20139206","DOI":"10.1109\/ICCV.2019.00929"},{"key":"2072_CR12","doi-asserted-by":"crossref","unstructured":"Liao M, Wan Z, Yao C, Chen K, Bai X (2020) Real-time scene text detection with differentiable binarization. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 34, pp. 11474\u201311481","DOI":"10.1609\/aaai.v34i07.6812"},{"key":"2072_CR13","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"2072_CR14","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Doll\u00e1r P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2117\u20132125","DOI":"10.1109\/CVPR.2017.106"},{"issue":"1","key":"2072_CR15","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1007\/s40747-023-01134-z","volume":"10","author":"H Chen","year":"2024","unstructured":"Chen H, Qiu Y, Jiang M, Lin J, Chen P (2024) Kernel-mask knowledge distillation for efficient and accurate arbitrary-shaped text detection. Complex Intell Syst 10(1):75\u201386","journal-title":"Complex Intell Syst"},{"key":"2072_CR16","doi-asserted-by":"crossref","unstructured":"Wang W, Xie E, Song X, Zang Y, Wang W, Lu T, Yu G, Shen C (2019) Efficient and accurate arbitrary-shaped text detection with pixel aggregation network. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 8440\u20138449","DOI":"10.1109\/ICCV.2019.00853"},{"key":"2072_CR17","doi-asserted-by":"crossref","unstructured":"Zhao Y, Cai Y, Wu W, Wang W (2023) Explore faster localization learning for scene text detection. In: 2023 IEEE International Conference on Multimedia and Expo (ICME), pp. 156\u2013161. IEEE","DOI":"10.1109\/ICME55011.2023.00035"},{"key":"2072_CR18","doi-asserted-by":"crossref","unstructured":"Li X, Wang W, Hu X, Yang J (2019) Selective kernel networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 510\u2013519","DOI":"10.1109\/CVPR.2019.00060"},{"key":"2072_CR19","doi-asserted-by":"crossref","unstructured":"Li J, Wen Y, He L (2023) Scconv: Spatial and channel reconstruction convolution for feature redundancy. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6153\u20136162","DOI":"10.1109\/CVPR52729.2023.00596"},{"key":"2072_CR20","doi-asserted-by":"publisher","first-page":"337","DOI":"10.1016\/j.patcog.2019.02.002","volume":"90","author":"Y Liu","year":"2019","unstructured":"Liu Y, Jin L, Zhang S, Luo C, Zhang S (2019) Curved scene text detection via transverse and longitudinal sequence connection. Pattern Recogn 90:337\u2013345","journal-title":"Pattern Recogn"},{"key":"2072_CR21","doi-asserted-by":"crossref","unstructured":"Ch\u2019ng CK, Chan CS (2017) Total-text: A comprehensive dataset for scene text detection and recognition. In: 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR), vol. 1, pp. 935\u2013942. IEEE","DOI":"10.1109\/ICDAR.2017.157"},{"key":"2072_CR22","doi-asserted-by":"crossref","unstructured":"Karatzas D, Gomez-Bigorda L, Nicolaou A, Ghosh S, Bagdanov A, Iwamura M, Matas J, Neumann L, Chandrasekhar VR, Lu S et al (2015) Icdar 2015 competition on robust reading. In: 2015 13th International Conference on Document Analysis and Recognition (ICDAR), pp. 1156\u20131160. IEEE","DOI":"10.1109\/ICDAR.2015.7333942"},{"key":"2072_CR23","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2022.117564","volume":"205","author":"D Zhong","year":"2022","unstructured":"Zhong D, Lyu S, Shivakumara P, Pal U, Lu Y (2022) Text proposals with location-awareness-attention network for arbitrarily shaped scene text detection and recognition. Expert Syst Appl 205:117564","journal-title":"Expert Syst Appl"},{"key":"2072_CR24","doi-asserted-by":"crossref","unstructured":"Zheng J, Fan H, Zhang L (2024) Kernel adaptive convolution for scene text detection via distance map prediction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5957\u20135966","DOI":"10.1109\/CVPR52733.2024.00569"},{"issue":"3","key":"2072_CR25","doi-asserted-by":"publisher","first-page":"1815","DOI":"10.1109\/TCSVT.2023.3299087","volume":"34","author":"Z Shao","year":"2023","unstructured":"Shao Z, Su Y, Zhou Y, Meng F, Zhu H, Liu B, Yao R (2023) Ct-net: arbitrary-shaped text detection via contour transformer. IEEE Trans Circ Syst Video Technol 34(3):1815\u20131826","journal-title":"IEEE Trans Circ Syst Video Technol"},{"key":"2072_CR26","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11263-015-0823-z","volume":"116","author":"M Jaderberg","year":"2016","unstructured":"Jaderberg M, Simonyan K, Vedaldi A, Zisserman A (2016) Reading text in the wild with convolutional neural networks. Int J Comput Vis 116:1\u201320","journal-title":"Int J Comput Vis"},{"key":"2072_CR27","doi-asserted-by":"crossref","unstructured":"Duan C, Fu P, Guo S, Jiang Q, Wei X (2024) Odm: A text-image further alignment pre-training approach for scene text detection and spotting. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 15587\u201315597","DOI":"10.1109\/CVPR52733.2024.01476"},{"issue":"11","key":"2072_CR28","doi-asserted-by":"publisher","first-page":"3111","DOI":"10.1109\/TMM.2018.2818020","volume":"20","author":"J Ma","year":"2018","unstructured":"Ma J, Shao W, Ye H, Wang L, Wang H, Zheng Y, Xue X (2018) Arbitrary-oriented scene text detection via rotation proposals. IEEE Trans Multimedia 20(11):3111\u20133122","journal-title":"IEEE Trans Multimedia"},{"key":"2072_CR29","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I (2017) Attention is all you need. Adv Neural Inf Process Syst 30"},{"key":"2072_CR30","doi-asserted-by":"crossref","unstructured":"Zhang X, Su Y, Tripathi S, Tu Z (2022) Text spotting transformers. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9519\u20139528","DOI":"10.1109\/CVPR52688.2022.00930"},{"key":"2072_CR31","doi-asserted-by":"crossref","unstructured":"Wang W, Xie E, Li X, Hou W, Lu T, Yu G, Shao S (2019) Shape robust text detection with progressive scale expansion network. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9336\u20139345","DOI":"10.1109\/CVPR.2019.00956"},{"key":"2072_CR32","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2021.107767","volume":"236","author":"Y Zhong","year":"2022","unstructured":"Zhong Y, Cheng X, Chen T, Zhang J, Zhou Z, Huang G (2022) Prpn: progressive region prediction network for natural scene text detection. Knowl-Based Syst 236:107767","journal-title":"Knowl-Based Syst"},{"issue":"1","key":"2072_CR33","doi-asserted-by":"publisher","first-page":"919","DOI":"10.1109\/TPAMI.2022.3155612","volume":"45","author":"M Liao","year":"2022","unstructured":"Liao M, Zou Z, Wan Z, Yao C, Bai X (2022) Real-time scene text detection with differentiable binarization and adaptive scale fusion. IEEE Trans Pattern Anal Mach Intell 45(1):919\u2013931","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"2072_CR34","doi-asserted-by":"crossref","unstructured":"Zhang H, Yao Q, Yang M, Xu Y, Bai X (2020) Autostr: efficient backbone search for scene text recognition. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XXIV 16, pp. 751\u2013767. Springer","DOI":"10.1007\/978-3-030-58586-0_44"},{"issue":"5","key":"2072_CR35","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3526217","volume":"22","author":"K Manjari","year":"2023","unstructured":"Manjari K, Verma M, Singal G, Namasudra S (2023) Qest: quantized and efficient scene text detector using deep learning. ACM Trans Asian Low-Resour Lang Inf Process 22(5):1\u201318","journal-title":"ACM Trans Asian Low-Resour Lang Inf Process"},{"key":"2072_CR36","doi-asserted-by":"crossref","unstructured":"Zhou X, Yao C, Wen H, Wang Y, Zhou S, He W, Liang J (2017) East: an efficient and accurate scene text detector. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5551\u20135560","DOI":"10.1109\/CVPR.2017.283"},{"key":"2072_CR37","doi-asserted-by":"crossref","unstructured":"Liu Z, Lin G, Yang S, Feng J, Lin W, Goh WL (2018) Learning markov clustering networks for scene text detection. arXiv preprint arXiv:1805.08365","DOI":"10.1109\/CVPR.2018.00725"},{"key":"2072_CR38","doi-asserted-by":"crossref","unstructured":"Ma X, Dai X, Bai Y, Wang Y, Fu Y (2024) Rewrite the stars. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5694\u20135703","DOI":"10.1109\/CVPR52733.2024.00544"},{"key":"2072_CR39","doi-asserted-by":"crossref","unstructured":"Cai X, Lai Q, Wang Y, Wang W, Sun Z, Yao Y (2024) Poly kernel inception network for remote sensing detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 27706\u201327716","DOI":"10.1109\/CVPR52733.2024.02617"},{"key":"2072_CR40","doi-asserted-by":"crossref","unstructured":"Wang Y, Li Y, Wang G, Liu X (2024) Multi-scale attention network for single image super-resolution. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5950\u20135960","DOI":"10.1109\/CVPRW63382.2024.00602"},{"key":"2072_CR41","doi-asserted-by":"crossref","unstructured":"Li Y, Hou Q, Zheng Z, Cheng M-M, Yang J, Li X (2023) Large selective kernel network for remote sensing object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 16794\u201316805","DOI":"10.1109\/ICCV51070.2023.01540"},{"key":"2072_CR42","unstructured":"Li S, Wang Z, Liu Z, Tan C, Lin H, Wu D, Chen Z, Zheng J, Li SZ (2022) Moganet: Multi-order gated aggregation network. arXiv preprint arXiv:2211.03295"},{"key":"2072_CR43","doi-asserted-by":"crossref","unstructured":"Milletari F, Navab N, Ahmadi S-A (2016) V-net: Fully convolutional neural networks for volumetric medical image segmentation. In: 2016 Fourth International Conference on 3D Vision (3DV), pp. 565\u2013571. Ieee","DOI":"10.1109\/3DV.2016.79"},{"key":"2072_CR44","doi-asserted-by":"crossref","unstructured":"Shrivastava A, Gupta A, Girshick R (2016) Training region-based object detectors with online hard example mining. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 761\u2013769","DOI":"10.1109\/CVPR.2016.89"},{"key":"2072_CR45","doi-asserted-by":"crossref","unstructured":"Gupta A, Vedaldi A, Zisserman A (2016) Synthetic data for text localisation in natural images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2315\u20132324","DOI":"10.1109\/CVPR.2016.254"},{"key":"2072_CR46","doi-asserted-by":"crossref","unstructured":"Shi B, Bai X, Belongie S (2017) Detecting oriented text in natural images by linking segments. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2550\u20132558","DOI":"10.1109\/CVPR.2017.371"},{"key":"2072_CR47","doi-asserted-by":"crossref","unstructured":"Zhao H, Shi J, Qi X, Wang X, Jia J (2017) Pyramid scene parsing network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2881\u20132890","DOI":"10.1109\/CVPR.2017.660"},{"key":"2072_CR48","doi-asserted-by":"crossref","unstructured":"Hu J, Shen L, Sun G (2018) Squeeze-and-excitation networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7132\u20137141","DOI":"10.1109\/CVPR.2018.00745"},{"key":"2072_CR49","doi-asserted-by":"crossref","unstructured":"Woo S, Park J, Lee J-Y, Kweon IS (2018) Cbam: Convolutional block attention module. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 3\u201319","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"2072_CR50","doi-asserted-by":"crossref","unstructured":"Zhu Y, Chen J, Liang L, Kuang Z, Jin L, Zhang W (2021) Fourier contour embedding for arbitrary-shaped text detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3123\u20133131","DOI":"10.1109\/CVPR46437.2021.00314"},{"key":"2072_CR51","unstructured":"Luo W, Li Y, Urtasun R, Zemel R (2016) Understanding the effective receptive field in deep convolutional neural networks. Advances in neural information processing systems 29"},{"key":"2072_CR52","doi-asserted-by":"crossref","unstructured":"Liu Z, Lin Y, Cao Y, Hu H, Wei Y, Zhang Z, Lin S, Guo B (2021) Swin transformer: Hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 10012\u201310022","DOI":"10.1109\/ICCV48922.2021.00986"}],"container-title":["Complex &amp; Intelligent Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s40747-025-02072-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s40747-025-02072-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s40747-025-02072-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,25]],"date-time":"2025-09-25T13:34:29Z","timestamp":1758807269000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s40747-025-02072-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,1]]},"references-count":52,"journal-issue":{"issue":"10","published-print":{"date-parts":[[2025,10]]}},"alternative-id":["2072"],"URL":"https:\/\/doi.org\/10.1007\/s40747-025-02072-8","relation":{},"ISSN":["2199-4536","2198-6053"],"issn-type":[{"value":"2199-4536","type":"print"},{"value":"2198-6053","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,1]]},"assertion":[{"value":"24 March 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 August 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 September 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"432"}}