{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T15:59:20Z","timestamp":1780415960336,"version":"3.54.1"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2024,8,18]],"date-time":"2024-08-18T00:00:00Z","timestamp":1723939200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,8,18]],"date-time":"2024-08-18T00:00:00Z","timestamp":1723939200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Research Project on Economic and Social Development of Liaoning Province","award":["2022lsljdybkt-014"],"award-info":[{"award-number":["2022lsljdybkt-014"]}]},{"name":"Science and technology innovation fund program of Dalian","award":["2021JJ13SN81"],"award-info":[{"award-number":["2021JJ13SN81"]}]},{"name":"Scientific and Research Project of Education Department of Liaoning Province","award":["No. L2020006"],"award-info":[{"award-number":["No. L2020006"]}]},{"name":"Research project of China Federation of logistics and procurement","award":["Grant No.:2023CSLKT3-020"],"award-info":[{"award-number":["Grant No.:2023CSLKT3-020"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Pattern Anal Applic"],"published-print":{"date-parts":[[2024,9]]},"DOI":"10.1007\/s10044-024-01323-7","type":"journal-article","created":{"date-parts":[[2024,8,18]],"date-time":"2024-08-18T10:01:48Z","timestamp":1723975308000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":30,"title":["Small object detection based on YOLOv8 in UAV perspective"],"prefix":"10.1007","volume":"27","author":[{"given":"Tao","family":"Ning","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Wantong","family":"Wu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jin","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2024,8,18]]},"reference":[{"issue":"6","key":"1323_CR1","doi-asserted-by":"publisher","first-page":"147","DOI":"10.3390\/drones6060147","volume":"6","author":"SAH Mohsan","year":"2022","unstructured":"Mohsan SAH, Khan MA, Noor F et al (2022) Towards the unmanned aerial vehicles (UAVs): A comprehensive review. Drones 6(6):147","journal-title":"Drones"},{"key":"1323_CR2","doi-asserted-by":"crossref","unstructured":"Cheng N, Wu S, Wang X, Yin Z et al (2023) AI for UAV-assisted IoT applications: a comprehensive review. IEEE Internet Things J","DOI":"10.20944\/preprints202211.0302.v1"},{"key":"1323_CR3","doi-asserted-by":"crossref","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2014) Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 580\u2013587","DOI":"10.1109\/CVPR.2014.81"},{"key":"1323_CR4","doi-asserted-by":"crossref","unstructured":"Girshick R (2015) Fast r-cnn. In: Proceedings of the IEEE international conference on computer vision, pp 1440\u20131448","DOI":"10.1109\/ICCV.2015.169"},{"key":"1323_CR5","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster r-cnn: towards real-time object detection with region proposal networks. In: Advances in neural information processing systems, vol 28"},{"key":"1323_CR6","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D et al (2016) Ssd: single shot multibox detector. In: Computer vision-ECCV 2016: 14th European conference, Amsterdam, The Netherlands, October 11\u201314, 2016, proceedings, part I 14. Springer, pp 21\u201337","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"1323_CR7","doi-asserted-by":"crossref","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: unified, real-time object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 779\u2013788","DOI":"10.1109\/CVPR.2016.91"},{"key":"1323_CR8","unstructured":"Redmon J, Farhadi A (2018) Yolov3: an incremental improvement. arXiv:1804.02767"},{"key":"1323_CR9","unstructured":"Bochkovskiy A, Wang C, Liao HM (2020) Yolov4: optimal speed and accuracy of object detection. arXiv:2004.10934"},{"key":"1323_CR10","unstructured":"Redmon J. Stoken Yolo v5. https:\/\/github.com\/ultralytics\/yolov5\/releases\/tag\/v6.0. Accessed on 12 Oct 2021"},{"key":"1323_CR11","unstructured":"Li C, Li L, Jiang H et al (2022) YOLOv6: a single-stage object detection framework for industrial applications. arXiv:2209.02976"},{"key":"1323_CR12","doi-asserted-by":"crossref","unstructured":"Wang C, Bochkovskiy A, Liao HM (2023) YOLOv7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 7464\u20137475","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"1323_CR13","unstructured":"Glenn-jocher U (2023) Yolo v8. https:\/\/github.com\/ultralytics\/ultralytics.git. Accessed on 9 Jan 2023"},{"key":"1323_CR14","doi-asserted-by":"crossref","unstructured":"Li Y, Chen Y, Wang N, Zhang Z et al (2019) Scale-aware trident networks for object detection. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 6054\u20136063","DOI":"10.1109\/ICCV.2019.00615"},{"key":"1323_CR15","doi-asserted-by":"crossref","unstructured":"Yang C, Huang Z, Wang N (2022) Querydet: cascaded sparse query for accelerating high-resolution small object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 13668\u201313677","DOI":"10.1109\/CVPR52688.2022.01330"},{"key":"1323_CR16","doi-asserted-by":"publisher","first-page":"1968","DOI":"10.1109\/TMM.2021.3074273","volume":"24","author":"C Deng","year":"2021","unstructured":"Deng C, Wang M, Liu L, Liu Y (2021) Extended feature pyramid network for small object detection. IEEE Trans Multimedia 24:1968\u20131979","journal-title":"IEEE Trans Multimedia"},{"issue":"21","key":"1323_CR17","doi-asserted-by":"publisher","first-page":"5488","DOI":"10.3390\/rs14215488","volume":"14","author":"T Shi","year":"2022","unstructured":"Shi T, Gong J, Hu J et al (2022) Feature-enhanced CenterNet for small object detection in remote sensing images. Remote Sens 14(21):5488","journal-title":"Remote Sens"},{"key":"1323_CR18","unstructured":"Howard AG, Zhu M, Chen B, Kalenichenko D (2017) Mobilenets: efficient convolutional neural networks for mobile vision applications. arXiv:1704.04861"},{"key":"1323_CR19","doi-asserted-by":"crossref","unstructured":"Sandler M, Howard A, Zhu M, Zhmoginov A, Chen L (2018) Mobilenetv2: inverted residuals and linear bottlenecks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4510\u20134520","DOI":"10.1109\/CVPR.2018.00474"},{"key":"1323_CR20","doi-asserted-by":"crossref","unstructured":"Howard A, Sandler M, Chu G et al (2019) Searching for mobilenetv3. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 1314\u20131324","DOI":"10.1109\/ICCV.2019.00140"},{"key":"1323_CR21","doi-asserted-by":"crossref","unstructured":"Zhang X, Zhou X, Lin M, Sun J (2018) Shufflenet: an extremely efficient convolutional neural network for mobile devices. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 6848\u20136856","DOI":"10.1109\/CVPR.2018.00716"},{"key":"1323_CR22","doi-asserted-by":"crossref","unstructured":"Ma N, Zhang X, Zheng H, Sun J (2018) Shufflenet v2: practical guidelines for efficient cnn architecture design. In: Proceedings of the European conference on computer vision (ECCV), pp 116\u2013131","DOI":"10.1007\/978-3-030-01264-9_8"},{"key":"1323_CR23","doi-asserted-by":"crossref","unstructured":"Han K, Wang Y, Tian Q et al (2020) Ghostnet: more features from cheap operations. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 1580\u20131589","DOI":"10.1109\/CVPR42600.2020.00165"},{"key":"1323_CR24","first-page":"9969","volume":"35","author":"Y Tang","year":"2022","unstructured":"Tang Y, Han K, Guo J et al (2022) GhostNetv2: enhance cheap operation with long-range attention. Adv Neural Inf Process Syst 35:9969\u20139982","journal-title":"Adv Neural Inf Process Syst"},{"key":"1323_CR25","unstructured":"Wang J, Hu X, Zhang P, Li X, Wang L (2020) Minivlm: a smaller and faster vision-language model. arXiv:2012.06946"},{"key":"1323_CR26","unstructured":"Cui Y, Song T, Wu G, Wang L (2024) Mixformerv2: efficient fully transformer tracking. In: Advances in neural information processing systems, vol 36"},{"key":"1323_CR27","first-page":"13937","volume":"34","author":"Y Rao","year":"2021","unstructured":"Rao Y, Zhao W, Liu B et al (2021) Dynamicvit: efficient vision transformers with dynamic token sparsification. Adv Neural Inf Process Syst 34:13937\u201313949","journal-title":"Adv Neural Inf Process Syst"},{"key":"1323_CR28","doi-asserted-by":"crossref","unstructured":"Zhao Q, Sheng T, Wang Y et al (2019) M2det: a single-shot object detector based on multi-level feature pyramid network. In: Proceedings of the AAAI conference on artificial intelligence, vol 33, No. 01, pp 9259\u20139266","DOI":"10.1609\/aaai.v33i01.33019259"},{"key":"1323_CR29","doi-asserted-by":"crossref","unstructured":"Tan M, Pang R, Le QV (2020) Efficientdet: scalable and efficient object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 10781\u201310790","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"1323_CR30","unstructured":"Liu S, Huang D, Wang Y (2019) Learning spatial fusion for single-shot object detection. arXiv:1911.09516, 1911"},{"key":"1323_CR31","doi-asserted-by":"crossref","unstructured":"Gong Y, Yu X, Ding Y et al (2021) Effective fusion factor in FPN for tiny object detection. In: Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp 1160\u20131168","DOI":"10.1109\/WACV48630.2021.00120"},{"key":"1323_CR32","volume":"125","author":"L Deng","year":"2023","unstructured":"Deng L, Bolin Fu, Yan Wu et al (2023) Comparison of 2D and 3D vegetation species mapping in three natural scenarios using UAV-LiDAR point clouds and improved deep learning methods. Int J Appl Earth Obs Geoinf 125:103588","journal-title":"Int J Appl Earth Obs Geoinf"},{"key":"1323_CR33","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.122073","volume":"238","author":"J Gao","year":"2024","unstructured":"Gao J, Zhang J, Zhang F, Gao J (2024) LACTA: A lightweight and accurate algorithm for cherry tomato detection in unstructured environments. Expert Syst Appl 238:122073","journal-title":"Expert Syst Appl"},{"key":"1323_CR34","doi-asserted-by":"crossref","unstructured":"Sunkara R, Luo T (2022) No more strided convolutions or pooling: A new CNN building block for low-resolution images and small objects. In: Joint European conference on machine learning and knowledge discovery in databases. Springer, Cham, pp 443\u2013459","DOI":"10.1007\/978-3-031-26409-2_27"},{"issue":"5","key":"1323_CR35","doi-asserted-by":"publisher","first-page":"304","DOI":"10.3390\/drones7050304","volume":"7","author":"Y Li","year":"2023","unstructured":"Li Y, Fan Q, Huang H, Han Z, Qiang Gu (2023) A modified YOLOv8 detection network for UAV aerial image recognition. Drones 7(5):304","journal-title":"Drones"},{"issue":"1","key":"1323_CR36","doi-asserted-by":"publisher","first-page":"3510","DOI":"10.1038\/s41598-024-54146-1","volume":"14","author":"Wu Huixin","year":"2024","unstructured":"Huixin Wu, Zhu Y, Li S (2024) CDYL for infrared and visible light image dense small object detection. Sci Rep 14(1):3510","journal-title":"Sci Rep"},{"issue":"3","key":"1323_CR37","doi-asserted-by":"publisher","first-page":"84","DOI":"10.3390\/drones8030084","volume":"8","author":"NUA Tahir","year":"2024","unstructured":"Tahir NUA, Long Z, Zhang Z, Asim M, Elaffendi M (2024) PVswin-YOLOv8s: UAV-based pedestrian and vehicle detection for traffic management in smart cities using improved YOLOv8. Drones 8(3):84","journal-title":"Drones"},{"key":"1323_CR38","doi-asserted-by":"crossref","unstructured":"Tang S, Zhang S, Fang Y (2023) HIC-YOLOv5: improved YOLOv5 for small object detection. arXiv:2309.16393","DOI":"10.1109\/ICRA57147.2024.10610273"},{"issue":"6","key":"1323_CR39","doi-asserted-by":"publisher","first-page":"3061","DOI":"10.3390\/s23063061","volume":"23","author":"Lu Shun","year":"2023","unstructured":"Shun Lu, Hanyu Lu, Dong J, Shuang Wu (2023) Object detection for UAV aerial scenarios based on vectorized IOU. Sensors 23(6):3061","journal-title":"Sensors"},{"key":"1323_CR40","doi-asserted-by":"crossref","unstructured":"Liu S, Zha J, Sun J, Li Z, Wang G (2023) EdgeYOLO: an edge-real-time object detector. In: 2023 42nd Chinese control conference (CCC). IEEE, pp 7507\u20137512","DOI":"10.23919\/CCC58697.2023.10239786"}],"container-title":["Pattern Analysis and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-024-01323-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10044-024-01323-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-024-01323-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,12]],"date-time":"2024-09-12T18:17:16Z","timestamp":1726165036000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10044-024-01323-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,8,18]]},"references-count":40,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,9]]}},"alternative-id":["1323"],"URL":"https:\/\/doi.org\/10.1007\/s10044-024-01323-7","relation":{},"ISSN":["1433-7541","1433-755X"],"issn-type":[{"value":"1433-7541","type":"print"},{"value":"1433-755X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,8,18]]},"assertion":[{"value":"5 June 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 August 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 August 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"103"}}