{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,15]],"date-time":"2026-05-15T17:51:09Z","timestamp":1778867469339,"version":"3.51.4"},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T00:00:00Z","timestamp":1757376000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T00:00:00Z","timestamp":1757376000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Xiamen University Malaysia","award":["XMUMRF\/2022-C10\/IECE\/0040"],"award-info":[{"award-number":["XMUMRF\/2022-C10\/IECE\/0040"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SIViP"],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1007\/s11760-025-04637-z","type":"journal-article","created":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T10:44:37Z","timestamp":1757414677000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["EV2M-YOLOv8: enhancing AI computer vision with EfficientNetV2 and multi-head self-attention for low-complexity agricultural crop, chilli maturity detection"],"prefix":"10.1007","volume":"19","author":[{"given":"Yap Miao","family":"Rong","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tan Jian","family":"Ding","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lee Yan","family":"Kang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mohammadmadhi","family":"Ariannejad","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lin","family":"Anzhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,9,9]]},"reference":[{"key":"4637_CR1","doi-asserted-by":"publisher","unstructured":"Cao, Y., Li, S., Liu, Y., Yan, Z., Dai, Y., Yu, P.S., Sun, L.: A Comprehensive survey of ai-generated content (AIGC): a history of generative AI from GAN to ChatGPT. arXiv. (2023). https:\/\/doi.org\/10.48550\/arXiv.2303.04226","DOI":"10.48550\/arXiv.2303.04226"},{"key":"4637_CR2","doi-asserted-by":"publisher","first-page":"2695","DOI":"10.1007\/s11760-023-02941-0","volume":"18","author":"J Chen","year":"2023","unstructured":"Chen, J., Wen, R., Ma, L.: Small object detection model for UAV aerial image based on YOLOv7. Signal Image Video Process. 18, 2695\u20132707 (2023). https:\/\/doi.org\/10.1007\/s11760-023-02941-0","journal-title":"Signal Image Video Process."},{"issue":"2","key":"4637_CR3","doi-asserted-by":"publisher","first-page":"715","DOI":"10.1109\/tcsvt.2020.2987465","volume":"31","author":"X Chen","year":"2020","unstructured":"Chen, X., Li, H., Wu, Q., Ngan, K.N., Xu, L.: High-quality R-CNN object detection using multi-path detection calibration network. IEEE Trans. Circuits Syst. Video Technol. 31(2), 715\u2013727 (2020). https:\/\/doi.org\/10.1109\/tcsvt.2020.2987465","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"issue":"2","key":"4637_CR4","doi-asserted-by":"publisher","first-page":"2249","DOI":"10.32604\/csse.2023.032231","volume":"45","author":"S Devi","year":"2023","unstructured":"Devi, S., Vijay, R., Sivakumar, P.: EfficientNetV2 model for plant disease classification and pest recognition. Comput. Syst. Sci. Eng. 45(2), 2249\u20132263 (2023)","journal-title":"Comput. Syst. Sci. Eng."},{"key":"4637_CR5","doi-asserted-by":"publisher","DOI":"10.1007\/s11760-025-04059-x","volume":"19","author":"Z Gao","year":"2025","unstructured":"Gao, Z., Meng, Q., Wang, J., Bu, F.: Lao-yolo: improved yoloV10 model for lightweight aerial object detection. Signal Image Video Process. 19, 451 (2025). https:\/\/doi.org\/10.1007\/s11760-025-04059-x","journal-title":"Signal Image Video Process."},{"key":"4637_CR6","doi-asserted-by":"publisher","DOI":"10.1080\/21642583.2024.2394428","author":"W Hao","year":"2024","unstructured":"Hao, W., Zhang, L., Xu, S., Han, M., Li, F., Yang, H.: YOLOv5-MHSA-DS: an efficient pig detection and counting method. Syst. Sci. Control Eng. (2024). https:\/\/doi.org\/10.1080\/21642583.2024.2394428","journal-title":"Syst. Sci. Control Eng."},{"key":"4637_CR7","doi-asserted-by":"publisher","unstructured":"Hollard, L., Mohimont, L., Gaveau, N., Luiz Angelo Steffenel.: LeYOLO, New scalable and efficient CNN architecture for object detection. ArXiv, pp. 1\u201334. (2024). https:\/\/doi.org\/10.48550\/arxiv.2406.14239","DOI":"10.48550\/arxiv.2406.14239"},{"key":"4637_CR8","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1007\/s11760-023-02728-3","volume":"18","author":"Z Hong","year":"2023","unstructured":"Hong, Z., Hamdan, E., Zhao, Y., Ye, T., Pan, H., Cetin, A.E.: Wildfire detection via transfer learning: a survey. Signal Image Video Process. 18, 207\u2013214 (2023). https:\/\/doi.org\/10.1007\/s11760-023-02728-3","journal-title":"Signal Image Video Process."},{"key":"4637_CR9","doi-asserted-by":"publisher","unstructured":"Hussain, M.: YOLOv5, YOLOv8 and YOLOv10: the go-to detectors for real-time vision. ArXiv, pp. 1\u201312. (2024). https:\/\/doi.org\/10.48550\/arXiv.2407.02988","DOI":"10.48550\/arXiv.2407.02988"},{"key":"4637_CR10","unstructured":"Jocher, G., Qiu, J., Chaurasia, A.: Ultralytics YOLO (Version 8.0.0). GitHub. (2023). https:\/\/github.com\/ultralytics\/ultralytics"},{"key":"4637_CR11","doi-asserted-by":"publisher","DOI":"10.1007\/s11760-025-03952-9","volume":"19","author":"MH Junos","year":"2025","unstructured":"Junos, M.H., Zulkifli, S., Bakar, E.A., Hawary, A.F., Khairuddin, A.S.M.: YOLO-ME: an enhanced lightweight YOLOv7 tiny model for efficient object detection in aerial imagery. Signal Image Video Process. 19, 312 (2025). https:\/\/doi.org\/10.1007\/s11760-025-03952-9","journal-title":"Signal Image Video Process."},{"key":"4637_CR12","doi-asserted-by":"publisher","first-page":"1444","DOI":"10.1016\/j.procs.2020.03.355","volume":"167","author":"AI Khan","year":"2020","unstructured":"Khan, A.I., Al-Habsi, S.: Machine learning in computer vision. Procedia Comput. Sci. 167, 1444\u20131451 (2020). https:\/\/doi.org\/10.1016\/j.procs.2020.03.355","journal-title":"Procedia Comput. Sci."},{"key":"4637_CR13","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/ICIRCA51532.2021.9544598","volume":"2021","author":"NM Krishna","year":"2021","unstructured":"Krishna, N.M., Reddy, R.Y., Reddy, M.S.C., Madhav, K.P., Sudham, G.: Object Detection and Tracking Using Yolo. Third International Conference on Inventive Research in Computing Applications (ICIRCA) 2021, 1\u20137 (2021). https:\/\/doi.org\/10.1109\/ICIRCA51532.2021.9544598","journal-title":"Third International Conference on Inventive Research in Computing Applications (ICIRCA)"},{"key":"4637_CR14","doi-asserted-by":"publisher","unstructured":"Li, Y., Dua, A., & Ren, F.: Light-weight RetinaNet for object detection on edge devices. In: 2020 IEEE 6th World Forum on Internet of Things (WF-IoT), pp. 1\u20136. (2020) https:\/\/doi.org\/10.1109\/wf-iot48130.2020.9221150","DOI":"10.1109\/wf-iot48130.2020.9221150"},{"key":"4637_CR15","unstructured":"Lin, D.T.T: labelImg. GitHub. (2023). https:\/\/github.com\/HumanSignal\/labelImg"},{"key":"4637_CR16","doi-asserted-by":"publisher","unstructured":"Mahendru, M., Dubey, S.K.: Real time object detection with audio feedback using Yolo vs. Yolo_v3. In: 2021 11th International Conference on Cloud Computing, Data Science & Engineering (Confluence), pp\/ 734\u2013740. (2021). https:\/\/doi.org\/10.1109\/Confluence51648.2021.9377064","DOI":"10.1109\/Confluence51648.2021.9377064"},{"key":"4637_CR17","doi-asserted-by":"publisher","unstructured":"Muhammad Rusydan, M.K., Shahrani, S., Farah Yasmin, A.R:. Photovoltaic (PV) module defect image classification analysis using EfficientNetV2 architectures. In: 2023 IEEE 14th Control and System Graduate Research Colloquium (ICSGRC), pp. 236\u2013241. (2023) https:\/\/doi.org\/10.1109\/icsgrc57744.2023.10215491","DOI":"10.1109\/icsgrc57744.2023.10215491"},{"key":"4637_CR18","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1016\/j.biosystemseng.2020.12.002","volume":"202","author":"S Parvathi","year":"2021","unstructured":"Parvathi, S., Tamil Selvi, S.: Detection of maturity stages of coconuts in complex background using faster R-CNN model. Biosyst. Eng. 202, 119\u2013132 (2021). https:\/\/doi.org\/10.1016\/j.biosystemseng.2020.12.002","journal-title":"Biosyst. Eng."},{"key":"4637_CR19","doi-asserted-by":"publisher","DOI":"10.1016\/j.rineng.2025.104869","volume":"26","author":"LT Ramos","year":"2025","unstructured":"Ramos, L.T., Casas, E., Romero, C., Rivas-Echeverr\u00eda, F., Bendek, E.: A study of YOLO architectures for wildfire and smoke detection in ground and aerial imagery. Results Eng. 26, 104869 (2025). https:\/\/doi.org\/10.1016\/j.rineng.2025.104869","journal-title":"Results Eng."},{"key":"4637_CR20","unstructured":"RangeKing.: Brief summary of YOLOv8 model structure, issue no. 189 ultralytics\/ultralytics. GitHub. https:\/\/github.com\/ultralytics\/ultralytics\/issues\/189"},{"key":"4637_CR21","doi-asserted-by":"publisher","DOI":"10.1007\/s11760-025-04038-2","volume":"19","author":"S Rong","year":"2025","unstructured":"Rong, S., Hamdan, E., Cetin, A.E.: Multi-resolution training improves robustness against adversarial attacks. Signal Image Video Process. 19, 481 (2025). https:\/\/doi.org\/10.1007\/s11760-025-04038-2","journal-title":"Signal Image Video Process."},{"key":"4637_CR22","doi-asserted-by":"publisher","unstructured":"Sikindar, S., Prasanna, M.S.L., Osama, S., Sahithi, P.: Detection and prediction of pests based on leaf images using efficient Net V2. In: 2024 2nd International Conference on Sustainable Computing and Smart Systems (ICSCSS), pp. 1186\u20131192. (2024) https:\/\/doi.org\/10.1109\/icscss60660.2024.10624916","DOI":"10.1109\/icscss60660.2024.10624916"},{"key":"4637_CR23","doi-asserted-by":"crossref","unstructured":"Sun, J., Xie, Y., Zhang, S., Chen, L., Zhang, G., Bao, H., Zhou, X.: You don\u2019t only look once: constructing spatial-temporal memory for integrated 3D object detection and tracking. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 3185\u20133194. (2021). https:\/\/ieeexplore.ieee.org\/document\/9710513","DOI":"10.1109\/ICCV48922.2021.00317"},{"issue":"11","key":"4637_CR24","doi-asserted-by":"publisher","first-page":"8210","DOI":"10.1109\/tnnls.2022.3144163","volume":"34","author":"H Tan","year":"2023","unstructured":"Tan, H., Liu, X., Tian, S., Yin, B., Li, X.: MHSA-net: multihead self-attention network for occluded person re-identification. IEEE Trans. Neural Netw. Learn. Syst. 34(11), 8210\u20138224 (2023). https:\/\/doi.org\/10.1109\/tnnls.2022.3144163","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"4637_CR25","doi-asserted-by":"publisher","unstructured":"Tan, M., Le, Q.V.: EfficientNetV2: Smaller models and faster training. Arxiv.org, pp. 1\u201311. (2021). https:\/\/doi.org\/10.48550\/arXiv.2104.00298","DOI":"10.48550\/arXiv.2104.00298"},{"key":"4637_CR26","doi-asserted-by":"publisher","unstructured":"Terven, J., Cordova-Esparza, D.: A comprehensive review of YOLO: from YOLOv1 to YOLOv8 and beyond. ArXiv (Cornell University), pp. 1\u201336. (2023). https:\/\/doi.org\/10.48550\/arxiv.2304.00501","DOI":"10.48550\/arxiv.2304.00501"},{"key":"4637_CR27","doi-asserted-by":"publisher","DOI":"10.1007\/s44196-023-00302-w","author":"S Uddagiri Sirisha","year":"2023","unstructured":"Uddagiri Sirisha, S., Praveen, P.N., Srinivasu, P.B., Bhoi, A.K.: Statistical analysis of design aspects of various YOLO-based deep learning models for object detection. Int. J. Comput. Intell. Syst. (2023). https:\/\/doi.org\/10.1007\/s44196-023-00302-w","journal-title":"Int. J. Comput. Intell. Syst."},{"key":"4637_CR28","doi-asserted-by":"publisher","unstructured":"Wajdi, A.Z., Wibowo, P., Sasaki, S.: YOLOv8 vs. YOLOv9: Evaluating object detection algorithms for marine waste recognition. In: 2024 IEEE International Symposium on Consumer Technology (ISCT), pp. 286\u2013292. (2024). https:\/\/doi.org\/10.1109\/isct62336.2024.10791223","DOI":"10.1109\/isct62336.2024.10791223"},{"key":"4637_CR29","doi-asserted-by":"publisher","first-page":"110227","DOI":"10.1109\/access.2020.3001279","volume":"8","author":"X Wang","year":"2020","unstructured":"Wang, X., Wang, S., Cao, J., Wang, Y.: Data-driven based tiny-YOLOv3 method for front vehicle detection inducing SPP-Net. IEEE Access 8, 110227\u2013110236 (2020). https:\/\/doi.org\/10.1109\/access.2020.3001279","journal-title":"IEEE Access"},{"key":"4637_CR30","doi-asserted-by":"publisher","first-page":"56416","DOI":"10.1109\/access.2021.3072211","volume":"9","author":"Z-Z Wang","year":"2021","unstructured":"Wang, Z.-Z., Xie, K., Zhang, X.-Y., Chen, H.-Q., Wen, C., He, J.-B.: Small-object detection based on YOLO and dense block via image super-resolution. IEEE Access 9, 56416\u201356429 (2021). https:\/\/doi.org\/10.1109\/access.2021.3072211","journal-title":"IEEE Access"},{"key":"4637_CR31","doi-asserted-by":"publisher","first-page":"143448","DOI":"10.1109\/ACCESS.2021.3121152","volume":"9","author":"C Xu","year":"2021","unstructured":"Xu, C., Shi, C., Bi, H., Liu, C., Yuan, Y., Guo, H., Chen, Y.: A page object detection method based on mask R-CNN. IEEE Access 9, 143448\u2013143457 (2021). https:\/\/doi.org\/10.1109\/ACCESS.2021.3121152","journal-title":"IEEE Access"},{"issue":"12","key":"4637_CR32","doi-asserted-by":"publisher","DOI":"10.1016\/j.heliyon.2024.e32678","volume":"10","author":"J Yan","year":"2024","unstructured":"Yan, J., Zeng, Y., Lin, J., Pei, Z., Fan, J., Fang, C., Cai, Y.: Enhanced object detection in pediatric bronchoscopy images using YOLO-based algorithms with CBAM attention mechanism. Heliyon 10(12), e32678 (2024). https:\/\/doi.org\/10.1016\/j.heliyon.2024.e32678","journal-title":"Heliyon"},{"key":"4637_CR33","doi-asserted-by":"publisher","unstructured":"Yonggui, W., Jing, H.: Improved algorithm for tomato disease detection based on YOLOv8. In: 2024 IEEE 4th International Conference on Electronic Technology, Communication and Information (ICETCI), pp. 230\u2013234. (2024). https:\/\/doi.org\/10.1109\/icetci61221.2024.10594250","DOI":"10.1109\/icetci61221.2024.10594250"},{"key":"4637_CR34","doi-asserted-by":"publisher","DOI":"10.1016\/j.compag.2020.105384","volume":"173","author":"J Zhang","year":"2020","unstructured":"Zhang, J., Karkee, M., Zhang, Q., Zhang, X., Yaqoob, M., Fu, L., Wang, S.: Multi-class object detection using faster R-CNN and estimation of shaking locations for automated shake-and-catch apple harvesting. Comput. Electron. Agric. 173, 105384 (2020). https:\/\/doi.org\/10.1016\/j.compag.2020.105384","journal-title":"Comput. Electron. Agric."},{"key":"4637_CR35","doi-asserted-by":"publisher","DOI":"10.1007\/s11760-024-03716-x","volume":"19","author":"X Zhong","year":"2024","unstructured":"Zhong, X.: Cal-ssd: lightweight SSD object detection based on coordinated attention. Signal Image Video Process. 19, 31 (2024). https:\/\/doi.org\/10.1007\/s11760-024-03716-x","journal-title":"Signal Image Video Process."},{"key":"4637_CR36","doi-asserted-by":"publisher","first-page":"8793","DOI":"10.1007\/s11760-024-03507-4","volume":"18","author":"Z Zhao","year":"2024","unstructured":"Zhao, Z., He, P.: YOLO-mamba: object detection method for infrared aerial images. Signal Image Video Process. 18, 8793\u20138803 (2024). https:\/\/doi.org\/10.1007\/s11760-024-03507-4","journal-title":"Signal Image Video Process."},{"issue":"17","key":"4637_CR37","doi-asserted-by":"publisher","first-page":"e36754","DOI":"10.1016\/j.heliyon.2024.e36754","volume":"10","author":"Z Zhao","year":"2024","unstructured":"Zhao, Z., Elmi, A.B., Norizham, A.R., Mohammad, N.A.: Corrosion image classification method based on EfficientNetV2. Heliyon 10(17), e36754\u2013e36754 (2024). https:\/\/doi.org\/10.1016\/j.heliyon.2024.e36754","journal-title":"Heliyon"},{"key":"4637_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.12225","volume":"238","author":"Y Zhou","year":"2024","unstructured":"Zhou, Y.: A yolo-nl object detector for real-time detection. Expert Syst. Appl. 238, 122256 (2024). https:\/\/doi.org\/10.1016\/j.eswa.2023.12225","journal-title":"Expert Syst. Appl."}],"container-title":["Signal, Image and Video Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-025-04637-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11760-025-04637-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-025-04637-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,22]],"date-time":"2025-09-22T13:15:49Z","timestamp":1758546949000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11760-025-04637-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,9]]},"references-count":38,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2025,12]]}},"alternative-id":["4637"],"URL":"https:\/\/doi.org\/10.1007\/s11760-025-04637-z","relation":{},"ISSN":["1863-1703","1863-1711"],"issn-type":[{"value":"1863-1703","type":"print"},{"value":"1863-1711","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,9]]},"assertion":[{"value":"4 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 July 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 August 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 September 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"1057"}}