{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T17:42:19Z","timestamp":1770918139250,"version":"3.50.1"},"reference-count":26,"publisher":"Springer Science and Business Media LLC","issue":"22","license":[{"start":{"date-parts":[[2024,8,24]],"date-time":"2024-08-24T00:00:00Z","timestamp":1724457600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,8,24]],"date-time":"2024-08-24T00:00:00Z","timestamp":1724457600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-024-20076-3","type":"journal-article","created":{"date-parts":[[2024,8,23]],"date-time":"2024-08-23T23:40:31Z","timestamp":1724456431000},"page":"24789-24803","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Improved multi-scale small target detection by UAV"],"prefix":"10.1007","volume":"84","author":[{"given":"Kai","family":"Sun","sequence":"first","affiliation":[]},{"given":"Danjing","family":"Li","sequence":"additional","affiliation":[]},{"given":"Ying","family":"Song","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,8,24]]},"reference":[{"key":"20076_CR1","doi-asserted-by":"publisher","DOI":"10.1201\/9781003138068-4","author":"M Khari","year":"2021","unstructured":"Khari M, Dalal R, Sharma A, Mehta B (2021) Person identification in uav shot videos by using machine learning. Multimodal Biometric Systems. https:\/\/doi.org\/10.1201\/9781003138068-4","journal-title":"Multimodal Biometric Systems"},{"key":"20076_CR2","doi-asserted-by":"publisher","unstructured":"Singh PK, Gupta A, Upadhyay M, Jain A, Khari M, Lamba PS (2023) Multimodal driver drowsiness detection from video frames. Journal of Mobile Multimedia, pp 567\u2013586 https:\/\/doi.org\/10.13052\/jmm1550-4646.19210","DOI":"10.13052\/jmm1550-4646.19210"},{"key":"20076_CR3","doi-asserted-by":"publisher","unstructured":"Saif S, Das P, Biswas S, Khari M, Shanmuganathan V (2022) Hiids: Hybrid intelligent intrusion detection system empowered with machine learning and metaheuristic algorithms for application in iot based healthcare. Microprocessors and Microsystems, p 104622. https:\/\/doi.org\/10.1016\/j.micpro.2022.104622","DOI":"10.1016\/j.micpro.2022.104622"},{"key":"20076_CR4","doi-asserted-by":"publisher","unstructured":"Redmon J, Farhadi A (2018) Yolov3: An incremental improvement. https:\/\/doi.org\/10.48550\/arXiv.1804.02767","DOI":"10.48550\/arXiv.1804.02767"},{"key":"20076_CR5","doi-asserted-by":"publisher","unstructured":"Bochkovskiy A, Wang C-Y, Liao H-YM (2020) Yolov4: Optimal speed and accuracy of object detection.. https:\/\/doi.org\/10.48550\/arXiv.2004.10934","DOI":"10.48550\/arXiv.2004.10934"},{"key":"20076_CR6","doi-asserted-by":"publisher","unstructured":"Ge Z, Liu S, Wang F, Li Z, Sun J (2021) Yolox: Exceeding yolo series in 2021. https:\/\/doi.org\/10.48550\/arXiv.2107.08430","DOI":"10.48550\/arXiv.2107.08430"},{"key":"20076_CR7","doi-asserted-by":"publisher","unstructured":"Li C, Li L, Jiang H, Weng K, Geng Y, Li L, Ke Z, Li Q, Cheng M, Nie W, et al (2022) Yolov6: A single-stage object detection framework for industrial applications. https:\/\/doi.org\/10.48550\/arXiv.2209.02976","DOI":"10.48550\/arXiv.2209.02976"},{"key":"20076_CR8","doi-asserted-by":"publisher","unstructured":"Wang C-Y, Bochkovskiy A, Liao H-YM (2023) Yolov7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 7464\u20137475. https:\/\/doi.org\/10.48550\/arXiv.2207.02696","DOI":"10.48550\/arXiv.2207.02696"},{"key":"20076_CR9","doi-asserted-by":"publisher","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu C-Y, Berg AC (2016) Ssd: Single shot multibox detector. In: Computer vision\u2013ECCV 2016: 14th European conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14, pp 21\u201337. https:\/\/doi.org\/10.48550\/arXiv.1512.02325. Springer","DOI":"10.48550\/arXiv.1512.02325"},{"key":"20076_CR10","doi-asserted-by":"publisher","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2014) Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 580\u2013587. https:\/\/doi.org\/10.48550\/arXiv.1311.2524","DOI":"10.48550\/arXiv.1311.2524"},{"key":"20076_CR11","doi-asserted-by":"publisher","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in neural information processing systems 28. https:\/\/doi.org\/10.48550\/arXiv.1506.01497","DOI":"10.48550\/arXiv.1506.01497"},{"key":"20076_CR12","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2023.103936","volume":"97","author":"S Cao","year":"2023","unstructured":"Cao S, Wang T, Li T, Mao Z (2023) Uav small target detection algorithm based on an improved yolov5s model. J Vis Commun Image Represent 97:103936. https:\/\/doi.org\/10.1016\/j.jvcir.2023.103936","journal-title":"J Vis Commun Image Represent"},{"key":"20076_CR13","doi-asserted-by":"publisher","unstructured":"Zhao C, Song Y, Yang X, Zhou Y, Yang J (2023) Target detection based on multi-scale feature fusion and cross-channel interactive attention mechanism. In: Journal of physics: conference series, vol 2562, p 012046. https:\/\/doi.org\/10.1088\/1742-6596\/2562\/1\/012046. IOP Publishing","DOI":"10.1088\/1742-6596\/2562\/1\/012046"},{"key":"20076_CR14","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2023.3336178","author":"M Wang","year":"2023","unstructured":"Wang M, Zhang B (2023) Contrastive learning and similarity feature fusion for uav image target detection. IEEE Geosci Remote Sens Lett. https:\/\/doi.org\/10.1109\/LGRS.2023.3336178","journal-title":"IEEE Geosci Remote Sens Lett"},{"issue":"4","key":"20076_CR15","doi-asserted-by":"publisher","first-page":"605","DOI":"10.1002\/tee.23758","volume":"18","author":"H Liu","year":"2023","unstructured":"Liu H, Duan X, Chen H, Lou H, Deng L (2023) Dbf-yolo: Uav small targets detection based on shallow feature fusion. IEEJ Trans Electr Electron Eng 18(4):605\u2013612. https:\/\/doi.org\/10.1002\/tee.23758","journal-title":"IEEJ Trans Electr Electron Eng"},{"key":"20076_CR16","doi-asserted-by":"publisher","unstructured":"Feng C, Zhong Y, Gao Y, Scott MR, Huang W (2021) Tood: Task-aligned one-stage object detection. In: 2021 IEEE\/CVF international conference on computer vision (ICCV), pp 3490\u20133499. https:\/\/doi.org\/10.1109\/ICCV48922.2021.00349. IEEE Computer Society","DOI":"10.1109\/ICCV48922.2021.00349"},{"key":"20076_CR17","doi-asserted-by":"publisher","unstructured":"Li X, Wang W, Wu L, Chen S, Hu X, Li J, Tang J, Yang J (2020) Generalized focal loss: Learning qualified and distributed bounding boxes for dense object detection. Advances in Neural Information Processing Systems 33:21002\u201321012. https:\/\/doi.org\/10.48550\/arXiv.2006.04388","DOI":"10.48550\/arXiv.2006.04388"},{"issue":"8","key":"20076_CR18","doi-asserted-by":"publisher","first-page":"8574","DOI":"10.1109\/TCYB.2021.3095305","volume":"52","author":"Z Zheng","year":"2021","unstructured":"Zheng Z, Wang P, Ren D, Liu W, Ye R, Hu Q, Zuo W (2021) Enhancing geometric factors in model learning and inference for object detection and instance segmentation. IEEE transactions on cybernetics 52(8):8574\u20138586. https:\/\/doi.org\/10.1109\/TCYB.2021.3095305","journal-title":"IEEE transactions on cybernetics"},{"key":"20076_CR19","doi-asserted-by":"publisher","unstructured":"Tong Z, Chen Y, Xu Z, Yu R (2023) Wise-iou: Bounding box regression loss with dynamic focusing mechanism. https:\/\/doi.org\/10.48550\/arXiv.2301.10051","DOI":"10.48550\/arXiv.2301.10051"},{"key":"20076_CR20","doi-asserted-by":"publisher","unstructured":"Zhu P, Wen L, Bian X, Ling H, Hu Q (2018) Vision meets drones: A challenge. https:\/\/doi.org\/10.48550\/arXiv.1804.07437","DOI":"10.48550\/arXiv.1804.07437"},{"key":"20076_CR21","doi-asserted-by":"publisher","unstructured":"Du D, Qi Y, Yu H, Yang Y, Duan K, Li G, Zhang W, Huang Q, Tian Q (2018) The unmanned aerial vehicle benchmark: Object detection and tracking. In: Proceedings of the european conference on computer vision (ECCV), pp. 370\u2013386. https:\/\/doi.org\/10.48550\/arXiv.1804.00518","DOI":"10.48550\/arXiv.1804.00518"},{"key":"20076_CR22","doi-asserted-by":"publisher","unstructured":"Zhao Y, Lv W, Xu S, Wei J, Wang G, Dang Q, Liu Y, Chen J (2024) Detrs beat yolos on real-time object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 16965\u201316974. https:\/\/doi.org\/10.48550\/arXiv.2304.08069","DOI":"10.48550\/arXiv.2304.08069"},{"key":"20076_CR23","doi-asserted-by":"publisher","unstructured":"Zhang H, Li F, Liu S, Zhang L, Su H, Zhu J, Ni LM, Shum H-Y (2022) Dino: Detr with improved denoising anchor boxes for end-to-end object detection. https:\/\/doi.org\/10.48550\/arXiv.2203.03605","DOI":"10.48550\/arXiv.2203.03605"},{"key":"20076_CR24","doi-asserted-by":"publisher","unstructured":"Zhu X, Su W, Lu L, Li B, Wang X, Dai J (2020) Deformable detr: Deformable transformers for end-to-end object detection. https:\/\/doi.org\/10.48550\/arXiv.2010.04159","DOI":"10.48550\/arXiv.2010.04159"},{"key":"20076_CR25","doi-asserted-by":"publisher","unstructured":"Wang A, Chen H, Liu L, Chen K, Lin Z, Han J, Ding G (2024) Yolov10: Real-time end-to-end object detection.. https:\/\/doi.org\/10.48550\/arXiv.2405.14458","DOI":"10.48550\/arXiv.2405.14458"},{"key":"20076_CR26","doi-asserted-by":"publisher","unstructured":"Duan K, Bai S, Xie L, Qi H, Huang Q, Tian Q (2019) Centernet: Keypoint triplets for object detection. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 6569\u20136578. https:\/\/doi.org\/10.48550\/arXiv.1904.08189","DOI":"10.48550\/arXiv.1904.08189"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-20076-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-024-20076-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-20076-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,16]],"date-time":"2025-07-16T12:41:04Z","timestamp":1752669664000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-024-20076-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,8,24]]},"references-count":26,"journal-issue":{"issue":"22","published-online":{"date-parts":[[2025,7]]}},"alternative-id":["20076"],"URL":"https:\/\/doi.org\/10.1007\/s11042-024-20076-3","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,8,24]]},"assertion":[{"value":"2 October 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 July 2024","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 August 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 August 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The data in this paper did not have an unethical mandate and the informed consent of all authors for publication of this article has been obtained","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical and informed consent for data used"}},{"value":"The authors have no relevant financial or non-financial interests to disclose.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interests"}}]}}