{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,2]],"date-time":"2026-02-02T07:09:27Z","timestamp":1770016167464,"version":"3.49.0"},"reference-count":48,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T00:00:00Z","timestamp":1769904000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"the Henan Provincial Key R&D Special Project \u201dKey Technology Research and Demonstration Applications of Large Multi- modal Self-Training Models Based on Domestic Chips\u2019","award":["231111212000"],"award-info":[{"award-number":["231111212000"]}]},{"name":"the Graduate Innovation Fund of Zhengzhou University of Aeronautical Industry Managemen","award":["2025CX117"],"award-info":[{"award-number":["2025CX117"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-026-21227-4","type":"journal-article","created":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T20:59:22Z","timestamp":1769979562000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["High-precision YOLOv5 object detection technology based on multi-module collaborative optimization"],"prefix":"10.1007","volume":"85","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-6236-9850","authenticated-orcid":false,"given":"Yong","family":"Yang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tianci","family":"Wan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Menglu","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lingling","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,2,1]]},"reference":[{"issue":"4","key":"21227_CR1","doi-asserted-by":"publisher","first-page":"1064","DOI":"10.3390\/s25041064","volume":"25","author":"H Xu","year":"2025","unstructured":"Xu H, Yang L, Zhao S, Tao S, Tian X, Liu K (2025) Sps-rcnn: Semantic-guided proposal sampling for 3d object detection from lidar point clouds. Sensors 25(4):1064","journal-title":"Sensors"},{"key":"21227_CR2","doi-asserted-by":"crossref","unstructured":"Sasirekha R, Surya V, Nandhini P, Preethy\u00a0Jemima P, Bhanushree T, Hanitha G (2025) Ensemble of fast r-cnn with bi-lstm for object detection. In: 2025 6th International Conference on Mobile Computing and Sustainable Informatics (ICMCSI), pp 1200\u20131206. IEEE","DOI":"10.1109\/ICMCSI64620.2025.10883212"},{"key":"21227_CR3","doi-asserted-by":"crossref","unstructured":"Zhong Z, Lai J, Zhong Y, Xu Y, Cui F (2025) Enhancing lunar dem data using super-resolution techniques and optimizing the faster r-cnn network for sub-kilometer crater detection. Icarus 116483","DOI":"10.1016\/j.icarus.2025.116483"},{"issue":"4","key":"21227_CR4","doi-asserted-by":"publisher","first-page":"592","DOI":"10.1007\/s11227-025-07078-0","volume":"81","author":"A Gheibi-Fetrat","year":"2025","unstructured":"Gheibi-Fetrat A, Serajeh Hassani F, Mohammadi-Lak M, Mirzaei A, Akbarzadeh N, Kheyrati-Fard MR, Hosseini M, Javadi Nezhad A, Tavakkol A, Lee JA et al (2025) A survey of ssd simulators and emulators. J Supercomput 81(4):592","journal-title":"J Supercomput"},{"key":"21227_CR5","doi-asserted-by":"crossref","unstructured":"Gao C, Gao J, Cao L, Zhao L, Gao S (2025) Research on improvement strategy of detr real-time object detection algorithm for small devices. In: Fourth International Conference on Computer Vision, Application, and Algorithm (CVAA 2024), vol 13486, pp 307\u2013313. SPIE","DOI":"10.1117\/12.3055829"},{"issue":"1","key":"21227_CR6","doi-asserted-by":"publisher","first-page":"7969","DOI":"10.1038\/s41598-025-92143-0","volume":"15","author":"Y Alhwaiti","year":"2025","unstructured":"Alhwaiti Y, Khan M, Asim M, Siddiqi MH, Ishaq M, Alruwaili M (2025) Leveraging yolo deep learning models to enhance plant disease identification. Sci Rep 15(1):7969","journal-title":"Sci Rep"},{"key":"21227_CR7","doi-asserted-by":"crossref","unstructured":"Woo S, Park J, Lee J-Y, Kweon IS (2018) Cbam: Convolutional block attention module. In: Proceedings of the European Conference on Computer Vision (ECCV), pp 3\u201319","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"21227_CR8","unstructured":"Yang L, Zhang R-Y, Li L, Xie X (2021) Simam: A simple, parameter-free attention module for convolutional neural networks. In: International Conference on Machine Learning, pp 11863\u201311874. PMLR"},{"key":"21227_CR9","doi-asserted-by":"crossref","unstructured":"Lee Y, Park J (2020) Centermask: Real-time anchor-free instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 13906\u201313915","DOI":"10.1109\/CVPR42600.2020.01392"},{"key":"21227_CR10","unstructured":"Li X, Hu X, Yang J (2019) Spatial group-wise enhance: Improving semantic feature learning in convolutional networks. arXiv preprint arXiv:1905.09646"},{"issue":"3","key":"21227_CR11","doi-asserted-by":"publisher","first-page":"62","DOI":"10.1007\/s11554-024-01436-6","volume":"21","author":"H Li","year":"2024","unstructured":"Li H, Li J, Wei H, Liu Z, Zhan Z, Ren Q (2024) Slim-neck by gsconv: A lightweight-design for real-time detector architectures. J Real-Time Image Proc 21(3):62","journal-title":"J Real-Time Image Proc"},{"key":"21227_CR12","doi-asserted-by":"crossref","unstructured":"Qin D, Leichner C, Delakis M, Fornoni M, Luo S, Yang F, Wang W, Banbury C, Ye C, Akin B et al (2024) Mobilenetv4: universal models for the mobile ecosystem. In: European Conference on Computer Vision, pp 78\u201396. Springer","DOI":"10.1007\/978-3-031-73661-2_5"},{"key":"21227_CR13","doi-asserted-by":"crossref","unstructured":"Koonce B (2021) Mobilenetv3. In: Convolutional Neural Networks with Swift for Tensorflow: Image Recognition and Dataset Categorization, pp 125\u2013144. Springer, ???","DOI":"10.1007\/978-1-4842-6168-2_11"},{"key":"21227_CR14","unstructured":"Chen Y, Kalantidis Y, Li J, Yan S, Feng J (2018) A$$\\hat{~}$$ 2-nets: Double attention networks. Adv Neural Inf Process Syst 31"},{"key":"21227_CR15","first-page":"7050","volume":"36","author":"H Chen","year":"2023","unstructured":"Chen H, Wang Y, Guo J, Tao D (2023) Vanillanet: the power of minimalism in deep learning. Adv Neural Inf Process Syst 36:7050\u20137064","journal-title":"Adv Neural Inf Process Syst"},{"key":"21227_CR16","doi-asserted-by":"crossref","unstructured":"Zhang X, Zhou X, Lin M, Sun J (2018) Shufflenet: An extremely efficient convolutional neural network for mobile devices. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 6848\u20136856","DOI":"10.1109\/CVPR.2018.00716"},{"key":"21227_CR17","doi-asserted-by":"crossref","unstructured":"Gong Y, Yu X, Ding Y, Peng X, Zhao J, Han Z (2021) Effective fusion factor in fpn for tiny object detection. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp 1160\u20131168","DOI":"10.1109\/WACV48630.2021.00120"},{"key":"21227_CR18","doi-asserted-by":"crossref","unstructured":"Chen J, Mai H, Luo L, Chen X, Wu K (2021) Effective feature fusion network in bifpn for small object detection. In: 2021 IEEE International Conference on Image Processing (ICIP), pp 699\u2013703","DOI":"10.1109\/ICIP42928.2021.9506347"},{"key":"21227_CR19","doi-asserted-by":"crossref","unstructured":"Wang C-Y, Liao H-YM, Wu Y-H, Chen P-Y, Hsieh J-W, Yeh I-H (2020) Cspnet: A new backbone that can enhance learning capability of cnn. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, pp 390\u2013391","DOI":"10.1109\/CVPRW50498.2020.00203"},{"issue":"5","key":"21227_CR20","doi-asserted-by":"publisher","first-page":"241","DOI":"10.1007\/s00530-024-01447-0","volume":"30","author":"S Peng","year":"2024","unstructured":"Peng S, Fan X, Tian S, Yu L (2024) Ps-yolo: a small object detector based on efficient convolution and multi-scale feature fusion. Multimedia Syst 30(5):241","journal-title":"Multimedia Syst"},{"key":"21227_CR21","doi-asserted-by":"publisher","first-page":"106442","DOI":"10.1016\/j.engappai.2023.106442","volume":"123","author":"D Wan","year":"2023","unstructured":"Wan D, Lu R, Shen S, Xu T, Lang X, Ren Z (2023) Mixed local channel attention for object detection. Eng Appl Artif Intell 123:106442","journal-title":"Eng Appl Artif Intell"},{"key":"21227_CR22","doi-asserted-by":"crossref","unstructured":"Liu Y, Hu Y, Cao G, Wang J (2025) Senet: Super-resolution enhancement network for crowd counting. Patt Recogn 111420","DOI":"10.1016\/j.patcog.2025.111420"},{"issue":"2","key":"21227_CR23","doi-asserted-by":"publisher","first-page":"243","DOI":"10.1080\/14693062.2023.2200758","volume":"24","author":"G Magacho","year":"2024","unstructured":"Magacho G, Espagne E, Godin A (2024) Impacts of the cbam on eu trade partners: consequences for developing countries. Clim Pol 24(2):243\u2013259","journal-title":"Clim Pol"},{"key":"21227_CR24","unstructured":"Yang L, Zhang R-Y, Li L, Xie X (2021) Simam: A simple, parameter-free attention module for convolutional neural networks. In: International Conference on Machine Learning, pp 11863\u201311874. PMLR"},{"key":"21227_CR25","unstructured":"Wei H, Liu X, Xu S, Dai Z, Dai Y, Xu X (2022) Dwrseg: Rethinking efficient acquisition of multi-scale contextual information for real-time semantic segmentation. arXiv preprint arXiv:2212.01173"},{"key":"21227_CR26","unstructured":"Jiang Y, Tan Z, Wang J, Sun X, Lin M, Li H (2022) Giraffedet: A heavy-neck paradigm for object detection. arXiv preprint arXiv:2202.04256"},{"key":"21227_CR27","doi-asserted-by":"crossref","unstructured":"Misra D, Nalamada T, Arasanipalai AU, Hou Q (2021) Rotate to attend: Convolutional triplet attention module. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp 3139\u20133148","DOI":"10.1109\/WACV48630.2021.00318"},{"key":"21227_CR28","unstructured":"Jocher G, Stoken A, Borovec J, Changyu L, Hogan A, Diaconu L, Poznanski J, Yu L, Rai P, Ferriday R et al (2020) ultralytics\/yolov5: v3. 0. Zenodo"},{"key":"21227_CR29","doi-asserted-by":"crossref","unstructured":"Bhatt R, Malik K, Indra G (2024) Asl detection in real-time using tensorflow. In: 2024 IEEE International Conference on Interdisciplinary Approaches in Technology and Management for Social Innovation (IATMSI), vol 2, pp 1\u20136. IEEE","DOI":"10.1109\/IATMSI60426.2024.10503138"},{"key":"21227_CR30","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1016\/j.neucom.2018.03.030","volume":"299","author":"X Sun","year":"2018","unstructured":"Sun X, Wu P, Hoi SC (2018) Face detection using deep learning: An improved faster rcnn approach. Neurocomputing 299:42\u201350","journal-title":"Neurocomputing"},{"key":"21227_CR31","unstructured":"Redmon J, Farhadi A (2018) Yolov3: An incremental improvement. arXiv preprint arXiv:1804.02767"},{"issue":"22","key":"21227_CR32","doi-asserted-by":"publisher","first-page":"7308","DOI":"10.3390\/s24227308","volume":"24","author":"M Hu","year":"2024","unstructured":"Hu M, Zhang Y, Jiao T, Xue H, Wu X, Luo J, Han S, Lv H (2024) An enhanced feature-fusion network for small-scale pedestrian detection on edge devices. Sensors 24(22):7308","journal-title":"Sensors"},{"key":"21227_CR33","unstructured":"Bochkovskiy A, Wang C-Y, Liao H-YM (2020) Yolov4: Optimal speed and accuracy of object detection. arXiv preprint arXiv:2004.10934"},{"key":"21227_CR34","unstructured":"Li C, Li L, Jiang H, Weng K, Geng Y, Li L, Ke Z, Li Q, Cheng M, Nie W et al (2022) Yolov6: A single-stage object detection framework for industrial applications. arXiv preprint arXiv:2209.02976"},{"key":"21227_CR35","doi-asserted-by":"crossref","unstructured":"Wang C-Y, Bochkovskiy A, Liao H-YM (2023) Yolov7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 7464\u20137475","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"21227_CR36","unstructured":"Zhu X, Su W, Lu L, Li B, Wang X, Dai J (2020) Deformable detr: Deformable transformers for end-to-end object detection. arXiv preprint arXiv:2010.04159"},{"key":"21227_CR37","doi-asserted-by":"crossref","unstructured":"Sohan M, Sai\u00a0Ram T, Rami\u00a0Reddy CV (2024) A review on yolov8 and its advancements. In: International Conference on Data Intelligence and Cognitive Informatics, pp 529\u2013545. Springer","DOI":"10.1007\/978-981-99-7962-2_39"},{"key":"21227_CR38","doi-asserted-by":"crossref","unstructured":"Senhua et al (2024) Multi-scale context-aware network for continuous sign language recognition. Virt Real Intell Hardw 6(4):323\u2013337","DOI":"10.1016\/j.vrih.2023.06.011"},{"key":"21227_CR39","doi-asserted-by":"crossref","unstructured":"Keskin C et al (2012) Hand pose estimation and hand shape classification using multi-layered randomized decision forests. In: Computer Vision\u2013ECCV 2012: 12th European Conference on Computer Vision, Florence, Italy, Proceedings, Part VI, pp 852\u2013863. Springer","DOI":"10.1007\/978-3-642-33783-3_61"},{"key":"21227_CR40","doi-asserted-by":"crossref","unstructured":"Tao et al (2020) American sign language alphabet recognition using convolutional neural networks with multiview augmentation and inference fusion. Eng Appl Artif Intell 76:202\u2013213","DOI":"10.1016\/j.engappai.2018.09.006"},{"key":"21227_CR41","doi-asserted-by":"crossref","unstructured":"Rahman MM, Islam MS, Rahman MH, Sassi R, Rivolta MW, Aktaruzzaman M (2019) A new benchmark on american sign language recognition using convolutional neural network. In: 2019 International Conference on Sustainable Technologies for Industry 4.0 (STI), pp 1\u20136","DOI":"10.1109\/STI47673.2019.9067974"},{"key":"21227_CR42","doi-asserted-by":"crossref","unstructured":"Aly et al (2019) User-independent american sign language alphabet recognition based on depth image and pcanet features. IEEE Access 7:123138\u2013123150","DOI":"10.1109\/ACCESS.2019.2938829"},{"key":"21227_CR43","doi-asserted-by":"crossref","unstructured":"Chandra A, Ranjan A, Sahu DP, Prakash S, Yang T, Rathore RS, Vajpayee A (2024) An efficient model for american sign language recognition using deep-neural networks. In: 2024 International Conference on Decision Aid Sciences and Applications (DASA), pp 1\u20135","DOI":"10.1109\/DASA63652.2024.10836568"},{"key":"21227_CR44","doi-asserted-by":"crossref","unstructured":"Kothadiya et al (2022) Deepsign: Sign language detection and recognition using deep learning. Electronics 11(11):1780","DOI":"10.3390\/electronics11111780"},{"key":"21227_CR45","doi-asserted-by":"crossref","unstructured":"Ravinder et al (2023) An approach for gesture recognition based on a lightweight convolutional neural network. Intern J Artif Intell Tools 32(03):2340014","DOI":"10.1142\/S0218213023400146"},{"key":"21227_CR46","doi-asserted-by":"crossref","unstructured":"Alsharif et al (2023) Deep learning technology to recognize american sign language alphabet. Sensors 23(18):7970","DOI":"10.3390\/s23187970"},{"key":"21227_CR47","doi-asserted-by":"crossref","unstructured":"Poornima et al (2024) Hand and sign recognition of alphabets using yolov5. SN Comput Sci 5(3):311","DOI":"10.1007\/s42979-024-02628-4"},{"key":"21227_CR48","doi-asserted-by":"crossref","unstructured":"Jia et al (2024) Slr-yolo: An improved yolov8 network for real-time sign language recognition. J Intell Fuzzy Syst 46(1):1663\u20131680","DOI":"10.3233\/JIFS-235132"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-026-21227-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-026-21227-4","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-026-21227-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,1]],"date-time":"2026-02-01T20:59:28Z","timestamp":1769979568000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-026-21227-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,1]]},"references-count":48,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2026,2]]}},"alternative-id":["21227"],"URL":"https:\/\/doi.org\/10.1007\/s11042-026-21227-4","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,1]]},"assertion":[{"value":"26 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 October 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 November 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 February 2026","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"We have no competing interest to disclose.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interests"}},{"value":"No ethical clearance is required.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}}],"article-number":"69"}}