{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,29]],"date-time":"2025-12-29T11:12:28Z","timestamp":1767006748416,"version":"3.40.5"},"reference-count":21,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2025,4,16]],"date-time":"2025-04-16T00:00:00Z","timestamp":1744761600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,4,16]],"date-time":"2025-04-16T00:00:00Z","timestamp":1744761600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"NSFC Special Fund of Tianyuan Visiting Scholar Fund","award":["11726616"],"award-info":[{"award-number":["11726616"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SIViP"],"published-print":{"date-parts":[[2025,6]]},"DOI":"10.1007\/s11760-025-04084-w","type":"journal-article","created":{"date-parts":[[2025,4,16]],"date-time":"2025-04-16T13:50:48Z","timestamp":1744811448000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Cross-YOLO: an object detection algorithm for UAV based on improved YOLOv8 model"],"prefix":"10.1007","volume":"19","author":[{"given":"Ying","family":"Dong","sequence":"first","affiliation":[]},{"given":"Jiahao","family":"Guo","sequence":"additional","affiliation":[]},{"given":"Fucheng","family":"Xu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,4,16]]},"reference":[{"key":"4084_CR1","doi-asserted-by":"crossref","unstructured":"Redmon, J.: You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"4084_CR2","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.-Y., Berg, A.C.: Ssd: single shot multibox detector. In: Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14. Springer, pp 21\u201337 (2016)","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"4084_CR3","unstructured":"Ross, T.-Y., Doll\u00e1r, G.: Focal loss for dense object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 2980\u20132988 (2017)"},{"key":"4084_CR4","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 580\u2013587 (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"4084_CR5","doi-asserted-by":"publisher","unstructured":"Girshick, R.: Fast r-cnn. In: 2015 IEEE International Conference on Computer Vision (ICCV), pp 1440\u20131448 (2015). https:\/\/doi.org\/10.1109\/ICCV.2015.169","DOI":"10.1109\/ICCV.2015.169"},{"key":"4084_CR6","doi-asserted-by":"crossref","unstructured":"Cai, Z., Vasconcelos, N.: Cascade r-cnn: delving into high quality object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 6154\u20136162 (2018)","DOI":"10.1109\/CVPR.2018.00644"},{"key":"4084_CR7","doi-asserted-by":"crossref","unstructured":"Varghese, R., Sambath, M.: Yolov8: a novel object detection algorithm with enhanced performance and robustness. In: 2024 International Conference on Advances in Data Engineering and Intelligent Computing Systems (ADICS). IEEE, pp 1\u20136 (2024)","DOI":"10.1109\/ADICS58448.2024.10533619"},{"key":"4084_CR8","doi-asserted-by":"crossref","unstructured":"Tan, M., Pang, R., Le, Q.V.: Efficientdet: scalable and efficient object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 10781\u201310790 (2020)","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"4084_CR9","doi-asserted-by":"crossref","unstructured":"Chen, Z., He, Z., Lu, Z.-M.: Dea-net: Single image dehazing based on detail-enhanced convolution and content-guided attention. IEEE Transactions on Image Processing (2024)","DOI":"10.1109\/TIP.2024.3354108"},{"key":"4084_CR10","doi-asserted-by":"crossref","unstructured":"Hou, Q., Zhou, D., Feng, J.: Coordinate attention for efficient mobile network design. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 13713\u201313722 (2021)","DOI":"10.1109\/CVPR46437.2021.01350"},{"key":"4084_CR11","first-page":"1140","volume":"35","author":"M-H Guo","year":"2022","unstructured":"Guo, M.-H., Lu, C.-Z., Hou, Q., Liu, Z., Cheng, M.-M., Hu, S.-M.: Segnext: rethinking convolutional attention design for semantic segmentation. Adv. Neural Inf. Process. Syst. 35, 1140\u20131156 (2022)","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"4084_CR12","unstructured":"Tong, Z., Chen, Y., Xu, Z., Yu, R.: Wise-iou: bounding box regression loss with dynamic focusing mechanism (2023). arXiv preprint arXiv:2301.10051"},{"key":"4084_CR13","doi-asserted-by":"publisher","unstructured":"Tian, Z., Shen, C., Chen, H., He, T.: Fcos: fully convolutional one-stage object detection. In: 2019 IEEE\/CVF International Conference on Computer Vision (ICCV), pp 9626\u20139635 (2019). https:\/\/doi.org\/10.1109\/ICCV.2019.00972","DOI":"10.1109\/ICCV.2019.00972"},{"key":"4084_CR14","unstructured":"Ioffe, S.: Batch normalization: accelerating deep network training by reducing internal covariate shift. arXiv preprint arXiv:1502.03167 (2015)"},{"key":"4084_CR15","doi-asserted-by":"crossref","unstructured":"Wu, Y., He, K.: Group normalization. In: Proceedings of the European Conference on Computer Vision (ECCV), pp 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01261-8_1"},{"key":"4084_CR16","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.-Y., Kweon, I.S.: Cbam: convolutional block attention module. In: Proceedings of the European Conference on Computer Vision (ECCV), pp 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"issue":"8","key":"4084_CR17","doi-asserted-by":"publisher","first-page":"8574","DOI":"10.1109\/TCYB.2021.3095305","volume":"52","author":"Z Zheng","year":"2021","unstructured":"Zheng, Z., Wang, P., Ren, D., Liu, W., Ye, R., Hu, Q., Zuo, W.: Enhancing geometric factors in model learning and inference for object detection and instance segmentation. IEEE Trans. Cybern. 52(8), 8574\u20138586 (2021)","journal-title":"IEEE Trans. Cybern."},{"key":"4084_CR18","doi-asserted-by":"publisher","unstructured":"Du, D., Zhu, P., Wen, L.: Visdrone-sot2019: the vision meets drone single object tracking challenge results. In: 2019 IEEE\/CVF International Conference on Computer Vision Workshop (ICCVW), pp 199\u2013212 (2019). https:\/\/doi.org\/10.1109\/ICCVW.2019.00029","DOI":"10.1109\/ICCVW.2019.00029"},{"key":"4084_CR19","doi-asserted-by":"crossref","unstructured":"Xia, G.-S., Bai, X., Ding, J., Zhu, Z., Belongie, S., Luo, J., Datcu, M., Pelillo, M., Zhang, L.: Dota: a large-scale dataset for object detection in aerial images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 3974\u20133983 (2018)","DOI":"10.1109\/CVPR.2018.00418"},{"key":"4084_CR20","doi-asserted-by":"crossref","unstructured":"Yu, X., Gong, Y., Jiang, N., Ye, Q., Han, Z.: Scale match for tiny person detection. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp 1257\u20131265 (2020)","DOI":"10.1109\/WACV45572.2020.9093394"},{"key":"4084_CR21","unstructured":"Wang, A., Chen, H., Liu, L., Chen, K., Lin, Z., Han, J., Ding, G.: Yolov10: real-time end-to-end object detection (2024). arXiv preprint arXiv:2405.14458"}],"container-title":["Signal, Image and Video Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-025-04084-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11760-025-04084-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-025-04084-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,19]],"date-time":"2025-05-19T10:41:51Z","timestamp":1747651311000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11760-025-04084-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,16]]},"references-count":21,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2025,6]]}},"alternative-id":["4084"],"URL":"https:\/\/doi.org\/10.1007\/s11760-025-04084-w","relation":{},"ISSN":["1863-1703","1863-1711"],"issn-type":[{"type":"print","value":"1863-1703"},{"type":"electronic","value":"1863-1711"}],"subject":[],"published":{"date-parts":[[2025,4,16]]},"assertion":[{"value":"17 November 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 February 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 March 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 April 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no Conflict of interest to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"489"}}