{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T18:34:35Z","timestamp":1776882875505,"version":"3.51.2"},"reference-count":44,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T00:00:00Z","timestamp":1740096000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T00:00:00Z","timestamp":1740096000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["52275003"],"award-info":[{"award-number":["52275003"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["52275003"],"award-info":[{"award-number":["52275003"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"National Key Research and Development Program of China","award":["2023YFB4704000"],"award-info":[{"award-number":["2023YFB4704000"]}]},{"name":"National Key Research and Development Program of China","award":["2023YFB4704000"],"award-info":[{"award-number":["2023YFB4704000"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Supercomput"],"DOI":"10.1007\/s11227-025-06961-0","type":"journal-article","created":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T15:29:32Z","timestamp":1740151772000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["MLSA-YOLO: a multi-level feature fusion and scale-adaptive framework for small object detection"],"prefix":"10.1007","volume":"81","author":[{"given":"Jiayu","family":"Peng","sequence":"first","affiliation":[]},{"given":"Kai","family":"Lv","sequence":"additional","affiliation":[]},{"given":"Guoliang","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Wendong","family":"Xiao","sequence":"additional","affiliation":[]},{"given":"Teng","family":"Ran","sequence":"additional","affiliation":[]},{"given":"Liang","family":"Yuan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,2,21]]},"reference":[{"issue":"4","key":"6961_CR1","doi-asserted-by":"publisher","first-page":"6551","DOI":"10.3934\/mbe.2023282","volume":"20","author":"Q Feng","year":"2023","unstructured":"Feng Q, Xu X, Wang Z (2023) Deep learning-based small object detection: a survey. Math Biosci Eng 20(4):6551\u20136590","journal-title":"Math Biosci Eng"},{"key":"6961_CR2","first-page":"13467","volume":"45","author":"G Cheng","year":"2023","unstructured":"Cheng G, Yuan X, Yao X, Yan K, Zeng Q, Xie X, Han J (2023) Towards large-scale small object detection: survey and benchmarks. IEEE Trans Pattern Anal Mach Intell 45:13467\u201313488","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"6961_CR3","unstructured":"Rekavandi AM, Rashidi S, Boussaid F, Hoefs S, Akbas E et al (2023) Transformers in small object detection: a benchmark and survey of state-of-the-art. arXiv preprint arXiv:2309.04902"},{"key":"6961_CR4","doi-asserted-by":"crossref","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2014) Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 580\u2013587","DOI":"10.1109\/CVPR.2014.81"},{"key":"6961_CR5","doi-asserted-by":"crossref","unstructured":"Girshick R (2015) Fast r-CNN. arXiv preprint arXiv:1504.08083","DOI":"10.1109\/ICCV.2015.169"},{"key":"6961_CR6","unstructured":"Ren S (2015) Faster r-CNN: towards real-time object detection with region proposal networks. arXiv preprint arXiv:1506.01497"},{"key":"6961_CR7","doi-asserted-by":"crossref","unstructured":"Redmon J (2016) You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition","DOI":"10.1109\/CVPR.2016.91"},{"key":"6961_CR8","doi-asserted-by":"crossref","unstructured":"Redmon J, Farhadi A (2017) Yolo9000: better, faster, stronger. In: Proceedings of the IEEE Conference on Computer Vision And Pattern Recognition, pp 7263\u20137271","DOI":"10.1109\/CVPR.2017.690"},{"key":"6961_CR9","unstructured":"Redmon J (2018) Yolov3: an incremental improvement. arXiv preprint arXiv:1804.02767"},{"key":"6961_CR10","unstructured":"Bochkovskiy A, Wang C-Y, Liao H-YM (2020) Yolov4: optimal speed and accuracy of object detection. arXiv preprint arXiv:2004.10934"},{"key":"6961_CR11","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu C-Y, Berg AC (2016) SSD: single shot multibox detector. In: Computer vision\u2014ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14. Springer, Berlin, pp 21\u201337","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"6961_CR12","doi-asserted-by":"crossref","unstructured":"Lin T (2017) Focal loss for dense object detection. arXiv preprint arXiv:1708.02002","DOI":"10.1109\/ICCV.2017.324"},{"key":"6961_CR13","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2023.103752","volume":"90","author":"M Wang","year":"2023","unstructured":"Wang M, Yang W, Wang L, Chen D, Wei F, KeZiErBieKe H, Liao Y (2023) Fe-yolov5: feature enhancement network based on yolov5 for small object detection. J Vis Commun Image Represent 90:103752","journal-title":"J Vis Commun Image Represent"},{"key":"6961_CR14","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2024.124848","volume":"256","author":"C Xue","year":"2024","unstructured":"Xue C, Xia Y, Wu M, Chen Z, Cheng F, Yun L (2024) EL-YOLO: an efficient and lightweight low-altitude aerial objects detector for onboard applications. Expert Syst Appl 256:124848","journal-title":"Expert Syst Appl"},{"key":"6961_CR15","doi-asserted-by":"crossref","unstructured":"Ghiasi G, Lin T-Y, Le QV (2019) NAS-FPN: learning scalable feature pyramid architecture for object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 7036\u20137045","DOI":"10.1109\/CVPR.2019.00720"},{"key":"6961_CR16","doi-asserted-by":"publisher","DOI":"10.1016\/j.dsp.2024.104554","volume":"151","author":"Y Fu","year":"2024","unstructured":"Fu Y, Ran T, Xiao W, Yuan L, Zhao J, He L, Mei J (2024) GD-YOLO: an improved convolutional neural network architecture for real-time detection of smoking and phone use behaviors. Digit Signal Process 151:104554","journal-title":"Digit Signal Process"},{"key":"6961_CR17","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Doll\u00e1r P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 2117\u20132125","DOI":"10.1109\/CVPR.2017.106"},{"key":"6961_CR18","doi-asserted-by":"crossref","unstructured":"Liu S, Qi L, Qin H, Shi J, Jia J (2018) Path aggregation network for instance segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 8759\u20138768","DOI":"10.1109\/CVPR.2018.00913"},{"key":"6961_CR19","doi-asserted-by":"crossref","unstructured":"Tan M, Pang R, Le QV (2020) EfficientDet: scalable and efficient object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 10781\u201310790","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"6961_CR20","unstructured":"Liu S, Huang D, Wang Y (2019) Learning spatial fusion for single-shot object detection. arXiv preprint arXiv:1911.09516"},{"key":"6961_CR21","doi-asserted-by":"crossref","unstructured":"Yang G, Lei J, Zhu Z, Cheng S, Feng Z, Liang R (2023) AFPN: asymptotic feature pyramid network for object detection. In: 2023 IEEE International Conference on Systems, Man, and Cybernetics (SMC). IEEE, pp 2184\u20132189","DOI":"10.1109\/SMC53992.2023.10394415"},{"key":"6961_CR22","doi-asserted-by":"crossref","unstructured":"Pang Y, Zhao X, Zhang L, Lu H (2020) Multi-scale interactive network for salient object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 9413\u20139422","DOI":"10.1109\/CVPR42600.2020.00943"},{"key":"6961_CR23","doi-asserted-by":"crossref","unstructured":"Zhu X, Lyu S, Wang X, Zhao Q (2021) Tph-yolov5: improved yolov5 based on transformer prediction head for object detection on drone-captured scenarios. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 2778\u20132788","DOI":"10.1109\/ICCVW54120.2021.00312"},{"key":"6961_CR24","unstructured":"Vaswani A (2017) Attention is all you need. Adv neural inf process syst"},{"key":"6961_CR25","doi-asserted-by":"publisher","unstructured":"Jocher G, Stoken A, Chaurasia A et al {2020) Ultralytics YOLOv5. https:\/\/doi.org\/10.5281\/zenodo.3908559. https:\/\/github.com\/ultralytics\/yolov5","DOI":"10.5281\/zenodo.3908559"},{"key":"6961_CR26","doi-asserted-by":"crossref","unstructured":"Woo S, Park J, Lee J-Y, Kweon IS (2018) CBAM: convolutional block attention module. In: Proceedings of the European Conference on Computer Vision (ECCV), pp 3\u201319","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"6961_CR27","doi-asserted-by":"crossref","unstructured":"Yang C, Huang Z, Wang N (2022) QueryDet: cascaded sparse query for accelerating high-resolution small object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 13668\u201313677","DOI":"10.1109\/CVPR52688.2022.01330"},{"issue":"8","key":"6961_CR28","doi-asserted-by":"publisher","first-page":"526","DOI":"10.3390\/drones7080526","volume":"7","author":"Z Zhang","year":"2023","unstructured":"Zhang Z (2023) Drone-YOLO: an efficient neural network method for target detection in drone images. Drones 7(8):526","journal-title":"Drones"},{"key":"6961_CR29","unstructured":"Jocher G, Chaurasia A, Qiu J, Ultralytics YOLOv8. https:\/\/github.com\/ultralytics\/ultralytics"},{"issue":"5","key":"6961_CR30","doi-asserted-by":"publisher","first-page":"304","DOI":"10.3390\/drones7050304","volume":"7","author":"Y Li","year":"2023","unstructured":"Li Y, Fan Q, Huang H, Han Z, Gu Q (2023) A modified yolov8 detection network for UAV aerial image recognition. Drones 7(5):304","journal-title":"Drones"},{"key":"6961_CR31","doi-asserted-by":"crossref","unstructured":"Han K, Wang Y, Tian Q, Guo J, Xu C, Xu C (2020) GhostNet: more features from cheap operations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 1580\u20131589","DOI":"10.1109\/CVPR42600.2020.00165"},{"issue":"18","key":"6961_CR32","doi-asserted-by":"publisher","first-page":"4580","DOI":"10.3390\/rs15184580","volume":"15","author":"Y Wang","year":"2023","unstructured":"Wang Y, Zou H, Yin M, Zhang X (2023) SMFF-YOLO: a scale-adaptive yolo algorithm with multi-level feature fusion for object detection in UAV scenes. Remote Sens 15(18):4580","journal-title":"Remote Sens"},{"issue":"1","key":"6961_CR33","doi-asserted-by":"publisher","first-page":"10697","DOI":"10.1038\/s41598-024-61136-w","volume":"14","author":"Y Shi","year":"2024","unstructured":"Shi Y, Jia Y, Zhang X (2024) FocusDet: an efficient object detector for small object. Sci Rep 14(1):10697","journal-title":"Sci Rep"},{"key":"6961_CR34","doi-asserted-by":"crossref","unstructured":"Sunkara R, Luo T (2022) No more strided convolutions or pooling: a new CNN building block for low-resolution images and small objects. In: Joint European Conference on Machine Learning and Knowledge Discovery in Databases. Springer, Berlin, pp 443\u2013459","DOI":"10.1007\/978-3-031-26409-2_27"},{"key":"6961_CR35","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556"},{"key":"6961_CR36","unstructured":"Peng Y, Sonka M, Chen DZ (2023) U-net v2: rethinking the skip connections of u-net for medical image segmentation. arXiv preprint arXiv:2311.17791"},{"key":"6961_CR37","doi-asserted-by":"crossref","unstructured":"Wang W, Dai J, Chen Z, Huang Z, Li Z, Zhu X, Hu X, Lu T, Lu L, Li H (2023) Internimage: exploring large-scale vision foundation models with deformable convolutions. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 14408\u201314419","DOI":"10.1109\/CVPR52729.2023.01385"},{"issue":"11","key":"6961_CR38","doi-asserted-by":"publisher","first-page":"7380","DOI":"10.1109\/TPAMI.2021.3119563","volume":"44","author":"P Zhu","year":"2021","unstructured":"Zhu P, Wen L, Du D, Bian X, Fan H, Hu Q, Ling H (2021) Detection and tracking meet drones challenge. IEEE Trans Pattern Anal Mach Intell 44(11):7380\u20137399","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"6961_CR39","doi-asserted-by":"crossref","unstructured":"Xia G-S, Bai X, Ding J, Zhu Z, Belongie S, Luo J, Datcu M, Pelillo M, Zhang L (2018) Dota: a large-scale dataset for object detection in aerial images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 3974\u20133983","DOI":"10.1109\/CVPR.2018.00418"},{"key":"6961_CR40","doi-asserted-by":"crossref","unstructured":"Cai Z, Vasconcelos N (2018) Cascade r-CNN: Delving into high quality object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 6154\u20136162","DOI":"10.1109\/CVPR.2018.00644"},{"key":"6961_CR41","unstructured":"Wang A, Chen H, Liu L, Chen K, Lin Z, Han J, Ding G (2024) Yolov10: real-time end-to-end object detection. arXiv preprint arXiv:2405.14458"},{"key":"6961_CR42","unstructured":"Jocher G et al. Ultralytics YOLO11. https:\/\/github.com\/ultralytics\/ultralytics"},{"key":"6961_CR43","unstructured":"Zhou X, Wang D, Kr\u00e4henb\u00fchl P (2019) Objects as points. arXiv preprint arXiv:1904.07850"},{"issue":"12","key":"6961_CR44","volume":"43","author":"G Mao","year":"2022","unstructured":"Mao G, Deng T, Yu N (2022) Object detection in UAV images based on multi-scale split attention. Acta Aeronaut Astronaut Sin 43(12):326738","journal-title":"Acta Aeronaut Astronaut Sin"}],"container-title":["The Journal of Supercomputing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-025-06961-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11227-025-06961-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-025-06961-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T15:29:54Z","timestamp":1740151794000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11227-025-06961-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,2,21]]},"references-count":44,"journal-issue":{"issue":"4","published-online":{"date-parts":[[2025,3]]}},"alternative-id":["6961"],"URL":"https:\/\/doi.org\/10.1007\/s11227-025-06961-0","relation":{},"ISSN":["1573-0484"],"issn-type":[{"value":"1573-0484","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,2,21]]},"assertion":[{"value":"16 January 2025","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 February 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"528"}}