{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T10:16:07Z","timestamp":1765534567130,"version":"3.48.0"},"reference-count":73,"publisher":"Springer Science and Business Media LLC","issue":"18","license":[{"start":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T00:00:00Z","timestamp":1765497600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T00:00:00Z","timestamp":1765497600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Supercomput"],"DOI":"10.1007\/s11227-025-08104-x","type":"journal-article","created":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T10:12:53Z","timestamp":1765534373000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["MD-DRIFPN: dilated multi-directional FPN for small drone object detection"],"prefix":"10.1007","volume":"81","author":[{"given":"Houyu","family":"Luan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shuobo","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dishi","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lele","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mengwei","family":"Guo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shaoqing","family":"Huang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,12,12]]},"reference":[{"key":"8104_CR1","doi-asserted-by":"publisher","DOI":"10.3390\/drones7060398","author":"Z Zhang","year":"2023","unstructured":"Zhang Z, Zhu L (2023) A review on unmanned aerial vehicle remote sensing: platforms, sensors, data processing methods, and applications. Drones. https:\/\/doi.org\/10.3390\/drones7060398","journal-title":"Drones"},{"issue":"3","key":"8104_CR2","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1016\/j.ijtst.2017.01.004","volume":"5","author":"T Jiang","year":"2016","unstructured":"Jiang T, Geller J, Ni D, Collura J (2016) Unmanned aircraft system traffic management: concept of operation and system architecture. Int J Transport Sci Technol 5(3):123\u2013135. https:\/\/doi.org\/10.1016\/j.ijtst.2017.01.004","journal-title":"Int J Transport Sci Technol"},{"key":"8104_CR3","doi-asserted-by":"publisher","DOI":"10.1038\/s41598-025-92344-7","author":"S Zhou","year":"2025","unstructured":"Zhou S, Zhou H, Qian L (2025) A multi-scale small object detection algorithm SMA-yolo for UAV remote sensing images. Sci Reports. https:\/\/doi.org\/10.1038\/s41598-025-92344-7","journal-title":"Sci Reports"},{"issue":"22","key":"8104_CR4","doi-asserted-by":"publisher","first-page":"4265","DOI":"10.3390\/rs16224265","volume":"16","author":"Z Yuan","year":"2024","unstructured":"Yuan Z, Gong J, Guo B, Wang C, Liao N, Song J, Wu Q (2024) Small object detection in UAV remote sensing images based on intra-group multi-scale fusion attention and adaptive weighted feature fusion mechanism. Remote Sensing 16(22):4265. https:\/\/doi.org\/10.3390\/rs16224265","journal-title":"Remote Sensing"},{"key":"8104_CR5","doi-asserted-by":"publisher","DOI":"10.1038\/s41598-025-00239-4","author":"Y Wu","year":"2025","unstructured":"Wu Y, Mu X, Shi H, Hou M (2025) An object detection model AAPW-yolo for UAV remote sensing images based on adaptive convolution and reconstructed feature fusion. Sci Reports. https:\/\/doi.org\/10.1038\/s41598-025-00239-4","journal-title":"Sci Reports"},{"issue":"1","key":"8104_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41598-024-64232-z","volume":"14","author":"W Hua","year":"2024","unstructured":"Hua W, Chen Q, Chen W (2024) A new lightweight network for efficient UAV object detection. Sci Rep 14(1):1\u201315. https:\/\/doi.org\/10.1038\/s41598-024-64232-z","journal-title":"Sci Rep"},{"key":"8104_CR7","doi-asserted-by":"publisher","DOI":"10.1186\/s13638-024-02401-4","author":"AA Baktayan","year":"2024","unstructured":"Baktayan AA, Zahary AT, Sikora A, Welte D (2024) Computational offloading into UAV swarm networks: a systematic literature review. EURASIP J Wirel Commun Netw. https:\/\/doi.org\/10.1186\/s13638-024-02401-4","journal-title":"EURASIP J Wirel Commun Netw"},{"issue":"13","key":"8104_CR8","doi-asserted-by":"publisher","first-page":"24013","DOI":"10.1109\/JIOT.2024.3388045","volume":"11","author":"X Min","year":"2024","unstructured":"Min X, Zhou W, Hu R, Wu Y, Pang Y, Yi J (2024) Lwuavdet: A lightweight UAV object detection network on edge devices. IEEE Internet Things J 11(13):24013\u201324023. https:\/\/doi.org\/10.1109\/JIOT.2024.3388045","journal-title":"IEEE Internet Things J"},{"issue":"14","key":"8104_CR9","doi-asserted-by":"publisher","first-page":"21353","DOI":"10.1007\/s11042-022-13801-3","volume":"82","author":"E Arkin","year":"2022","unstructured":"Arkin E, Yadikar N, Xu X, Aysa A, Ubul K (2022) A survey: object detection methods from CNN to transformer. Multim Tools Appl 82(14):21353\u201321383. https:\/\/doi.org\/10.1007\/s11042-022-13801-3","journal-title":"Multim Tools Appl"},{"key":"8104_CR10","doi-asserted-by":"publisher","unstructured":"Girshick RB, Donahue J, Darrell T, Malik J (2013) Rich feature hierarchies for accurate object detection and semantic segmentation. In: 2014 IEEE Conference on Computer Vision and Pattern Recognition, pp. 580\u2013587 https:\/\/doi.org\/10.1109\/cvpr.2014.81","DOI":"10.1109\/cvpr.2014.81"},{"key":"8104_CR11","doi-asserted-by":"publisher","unstructured":"Girshick R (2015) Fast r-cnn. In: 2015 IEEE International Conference on Computer Vision (ICCV). IEEE, Santiago, Chile. https:\/\/doi.org\/10.1109\/iccv.2015.169. http:\/\/ieeexplore.ieee.org\/document\/7410526\/","DOI":"10.1109\/iccv.2015.169"},{"key":"8104_CR12","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed SE, Fu CY, Berg A (2015) Ssd: Single shot multibox detector. Computer Vision ECCV 2016, pp. 21\u201337 10.1007\/978-3-319-46448-0_2","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"8104_CR13","doi-asserted-by":"publisher","unstructured":"Lin TY, Goyal P, Girshick RB, He K, Doll RP (2017) Focal loss for dense object detection. In: 2017 IEEE International Conference on Computer Vision (ICCV), pp. 2999\u20133007 https:\/\/doi.org\/10.1109\/iccv.2017.324","DOI":"10.1109\/iccv.2017.324"},{"key":"8104_CR14","doi-asserted-by":"publisher","unstructured":"Redmon J, Farhadi A (2018) Yolov3: An incremental improvement. https:\/\/doi.org\/10.48550\/arXiv.1804.02767","DOI":"10.48550\/arXiv.1804.02767"},{"key":"8104_CR15","doi-asserted-by":"publisher","unstructured":"Bochkovskiy A, Wang CY, Liao HYM (2020) Yolov4: optimal speed and accuracy of object detection. https:\/\/doi.org\/10.48550\/arXiv.2004.10934","DOI":"10.48550\/arXiv.2004.10934"},{"key":"8104_CR16","doi-asserted-by":"publisher","unstructured":"Jocher G. YOLOv5 by Ultralytics. https:\/\/doi.org\/10.5281\/zenodo.3908559. https:\/\/github.com\/ultralytics\/yolov5","DOI":"10.5281\/zenodo.3908559"},{"key":"8104_CR17","doi-asserted-by":"publisher","unstructured":"Khanam R, Hussain M (2024) Yolov11: An overview of the key architectural enhancements. https:\/\/doi.org\/10.48550\/arXiv.2410.17725","DOI":"10.48550\/arXiv.2410.17725"},{"issue":"6","key":"8104_CR18","doi-asserted-by":"publisher","first-page":"162","DOI":"10.1007\/s10462-025-11150-9","volume":"58","author":"W Hua","year":"2025","unstructured":"Hua W, Chen Q (2025) A survey of small object detection based on deep learning in aerial images. Artif Intell Rev 58(6):162. https:\/\/doi.org\/10.1007\/s10462-025-11150-9","journal-title":"Artif Intell Rev"},{"issue":"18","key":"8104_CR19","doi-asserted-by":"publisher","first-page":"3608","DOI":"10.3390\/rs13183608","volume":"13","author":"H Zhang","year":"2021","unstructured":"Zhang H, An L, Chu V, Stow D, Liu X, Ding Q (2021) Learning adjustable reduced downsampling network for small object detection in urban environments. Remote Sensing 13(18):3608. https:\/\/doi.org\/10.3390\/rs13183608","journal-title":"Remote Sensing"},{"key":"8104_CR20","doi-asserted-by":"publisher","DOI":"10.3390\/rs17081438","author":"Z Li","year":"2025","unstructured":"Li Z, Hu X, Qian J, Zhao T, Xu D, Wang Y (2025) Self-supervised feature contrastive learning for small weak object detection in remote sensing. Remote Sens. https:\/\/doi.org\/10.3390\/rs17081438","journal-title":"Remote Sens"},{"key":"8104_CR21","doi-asserted-by":"publisher","DOI":"10.3390\/rs16163057","author":"Y Li","year":"2024","unstructured":"Li Y, Li Q, Pan J, Zhou Y, Zhu H, Wei H, Liu C (2024) Sod-yolo: Small-object-detection algorithm based on improved yolov8 for UAV images. Remote Sens. https:\/\/doi.org\/10.3390\/rs16163057","journal-title":"Remote Sens"},{"key":"8104_CR22","doi-asserted-by":"publisher","DOI":"10.3390\/rs15061687","author":"Q Zhao","year":"2023","unstructured":"Zhao Q, Liu B, Lyu S, Wang C, Zhang H (2023) Tph-yolov5++: Boosting object detection on drone-captured scenarios with cross-layer asymmetric transformer. Remote Sens. https:\/\/doi.org\/10.3390\/rs15061687","journal-title":"Remote Sens"},{"issue":"4","key":"8104_CR23","doi-asserted-by":"publisher","first-page":"6551","DOI":"10.3934\/mbe.2023282","volume":"20","author":"Q Feng","year":"2023","unstructured":"Feng Q, Xu X, Wang Z (2023) Deep learning-based small object detection: A survey. Math Biosci Eng 20(4):6551\u20136590. https:\/\/doi.org\/10.3934\/mbe.2023282","journal-title":"Math Biosci Eng"},{"key":"8104_CR24","doi-asserted-by":"publisher","DOI":"10.3390\/electronics13101849","author":"H Wang","year":"2024","unstructured":"Wang H, Sui C, Jiang F, Li S, Liu H, Wang A (2024) Value-guided adaptive data augmentation for imbalanced small object detection. Electronics. https:\/\/doi.org\/10.3390\/electronics13101849","journal-title":"Electronics"},{"key":"8104_CR25","doi-asserted-by":"publisher","first-page":"116675","DOI":"10.1016\/j.image.2022.116675","volume":"104","author":"OC Koyun","year":"2022","unstructured":"Koyun OC, Keser RK, Batuhan Akkaya T, Reyin BU (2022) Focus-and-detect: A small object detection framework for aerial images. Signal Processing: Image Commun 104:116675. https:\/\/doi.org\/10.1016\/j.image.2022.116675","journal-title":"Signal Processing: Image Commun"},{"key":"8104_CR26","doi-asserted-by":"publisher","unstructured":"Kaundanya C, Cesar P, Cronin B, Fleury A, Liu M, Little S (2025) Enhancing small object detection in resource-constrained ARAS using image cropping and slicing techniques. In: Proceedings of the 20th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications, pp. 570\u2013583 https:\/\/doi.org\/10.5220\/0013190400003912","DOI":"10.5220\/0013190400003912"},{"key":"8104_CR27","doi-asserted-by":"publisher","unstructured":"Yang G, Lei J, Zhu Z, Cheng S, Feng Z, Liang R (2023) AFPN: Asymptotic feature pyramid network for object detection. In: 2023 IEEE International Conference on Systems, Man, and Cybernetics (SMC), pp. 2184\u20132189 https:\/\/doi.org\/10.1109\/smc53992.2023.10394415","DOI":"10.1109\/smc53992.2023.10394415"},{"key":"8104_CR28","doi-asserted-by":"publisher","DOI":"10.3390\/rs16224265","author":"Z Yuan","year":"2024","unstructured":"Yuan Z, Gong J, Guo B, Wang C, Liao N, Song J, Wu Q (2024) Small object detection in UAV remote sensing images based on intra-group multi-scale fusion attention and adaptive weighted feature fusion mechanism. Remote Sens. https:\/\/doi.org\/10.3390\/rs16224265","journal-title":"Remote Sens"},{"key":"8104_CR29","doi-asserted-by":"publisher","DOI":"10.3390\/rs15112728","author":"J Qu","year":"2023","unstructured":"Qu J, Tang Z, Zhang L, Zhang Y, Zhang Z (2023) Remote sensing small object detection network based on attention mechanism and multi-scale feature fusion. Remote Sens. https:\/\/doi.org\/10.3390\/rs15112728","journal-title":"Remote Sens"},{"key":"8104_CR30","doi-asserted-by":"publisher","unstructured":"Gil H, Park S, Park Y, Han W, Hong J, Jung J (2020) Balance-oriented focal loss with linear scheduling for anchor free object detection. https:\/\/doi.org\/10.48550\/arXiv.2012.13763","DOI":"10.48550\/arXiv.2012.13763"},{"issue":"19","key":"8104_CR31","doi-asserted-by":"publisher","first-page":"6437","DOI":"10.3390\/s24196437","volume":"24","author":"Z Wang","year":"2024","unstructured":"Wang Z, Men S, Bai Y, Yuan Y, Wang J, Wang K, Zhang L (2024) Improved small object detection algorithm CRL-yolov5. Sensors 24(19):6437. https:\/\/doi.org\/10.3390\/s24196437","journal-title":"Sensors"},{"issue":"4","key":"8104_CR32","doi-asserted-by":"publisher","first-page":"3163","DOI":"10.1609\/aaai.v35i4.16426","volume":"35","author":"X Yang","year":"2021","unstructured":"Yang X, Yan J, Feng Z, He T (2021) R3det: Refined single-stage detector with feature refinement for rotating object. Proceed AAAI Conf Artif Intell 35(4):3163\u20133171. https:\/\/doi.org\/10.1609\/aaai.v35i4.16426","journal-title":"Proceed AAAI Conf Artif Intell"},{"key":"8104_CR33","doi-asserted-by":"publisher","unstructured":"Yang Z, Zhang C, Chen C, Li H (2024) Transparent projection networks for interpretable image recognition. In: 2024 International Joint Conference on Neural Networks (IJCNN), pp. 1\u20138 https:\/\/doi.org\/10.1109\/ijcnn60899.2024.10650509","DOI":"10.1109\/ijcnn60899.2024.10650509"},{"key":"8104_CR34","doi-asserted-by":"publisher","unstructured":"Lin TY, Dollar P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature pyramid networks for object detection. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 936\u2013944. IEEE, Honolulu, HI https:\/\/doi.org\/10.1109\/cvpr.2017.106. http:\/\/ieeexplore.ieee.org\/document\/8099589\/","DOI":"10.1109\/cvpr.2017.106"},{"key":"8104_CR35","doi-asserted-by":"publisher","unstructured":"Tan M, Pang R, Le QV (2019) Efficientdet: Scalable and efficient object detection. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10778\u201310787 https:\/\/doi.org\/10.1109\/cvpr42600.2020.01079","DOI":"10.1109\/cvpr42600.2020.01079"},{"key":"8104_CR36","doi-asserted-by":"publisher","unstructured":"Pang J, Chen K, Shi J, Feng H, Ouyang W, Lin D (2019) Libra r-cnn: towards balanced learning for object detection. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 821\u2013830 https:\/\/doi.org\/10.1109\/cvpr.2019.00091","DOI":"10.1109\/cvpr.2019.00091"},{"key":"8104_CR37","doi-asserted-by":"publisher","unstructured":"Ghiasi G, Lin TY, Pang R, Le QV (2019) Nas-fpn: learning scalable feature pyramid architecture for object detection. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 7029\u20137038 https:\/\/doi.org\/10.1109\/cvpr.2019.00720","DOI":"10.1109\/cvpr.2019.00720"},{"key":"8104_CR38","doi-asserted-by":"publisher","unstructured":"Yang Z, Guan Q, Zhao K, Yang J., Xu, X., Long, H., Tang, Y (2024) Multi-branch auxiliary fusion yolo with re-parameterization heterogeneous convolutional for accurate object detection. https:\/\/doi.org\/10.48550\/arXiv.2407.04381","DOI":"10.48550\/arXiv.2407.04381"},{"key":"8104_CR39","doi-asserted-by":"publisher","unstructured":"Wang X, Zhang S, Yu Z, Feng L, Zhang W (2020) Scale-equalizing pyramid convolution for object detection. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 13356\u201313365 https:\/\/doi.org\/10.1109\/cvpr42600.2020.01337","DOI":"10.1109\/cvpr42600.2020.01337"},{"key":"8104_CR40","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/tgrs.2023.3258666","volume":"61","author":"J Zhang","year":"2022","unstructured":"Zhang J, Lei J, Xie W, Fang Z, Li Y, Du Q (2022) Superyolo: super resolution assisted object detection in multimodal remote sensing imagery. IEEE Trans Geosci Remote Sens 61:1\u201315. https:\/\/doi.org\/10.1109\/tgrs.2023.3258666","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"8104_CR41","doi-asserted-by":"publisher","unstructured":"Rahman MM, Munir M, Marculescu R (2024) Emcad: efficient multi-scale convolutional attention decoding for medical image segmentation https:\/\/doi.org\/10.48550\/arXiv.2405.06880","DOI":"10.48550\/arXiv.2405.06880"},{"key":"8104_CR42","doi-asserted-by":"publisher","unstructured":"Zhang J, Li X, Li J, Liu L, Xue Z, Zhang B, Jiang Z, Huang T, Wang Y, Wang C (2023) Rethinking mobile block for efficient attention-based models. https:\/\/doi.org\/10.48550\/arXiv.2301.01146","DOI":"10.48550\/arXiv.2301.01146"},{"key":"8104_CR43","doi-asserted-by":"publisher","unstructured":"Ding X, Zhang Y, Ge Y, Zhao S, Song L, Yue X, Shan Y (2023) Unireplknet: A universal perception large-kernel convnet for audio, video, point cloud, time-series and image recognition. https:\/\/doi.org\/10.48550\/arXiv.2311.15599","DOI":"10.48550\/arXiv.2311.15599"},{"key":"8104_CR44","doi-asserted-by":"publisher","unstructured":"Li X, Wang W, Hu X, Li J, Tang J, Yang J (2020) Generalized focal loss v2: Learning reliable localization quality estimation for dense object detection. https:\/\/doi.org\/10.48550\/arXiv.2011.12885","DOI":"10.48550\/arXiv.2011.12885"},{"key":"8104_CR45","doi-asserted-by":"publisher","unstructured":"Zhang H, Zhang S (2024) Focaler-iou: more focused intersection over union loss. https:\/\/doi.org\/10.48550\/arXiv.2401.10525","DOI":"10.48550\/arXiv.2401.10525"},{"key":"8104_CR46","doi-asserted-by":"publisher","unstructured":"Zhu PF, Wen L, Du D, Bian X, Ling H, Hu Q, Nie Q, Cheng H, Liu C, Liu X, Ma W, Wu H, Wang L, Schumann A, Brown C, Chen Q, Li C, Li D, Michail E, Zhang F, Ni F, Zhu F, Wang G, Zhang H, Deng H, Liu H, Wang H, Qiu H, Qi H, Shi H, Li H, Xu H, Lin H, Kompatsiaris Y, Cheng J, Wang J, Yang J, Zhou J, Zhao J, Joseph K.J, Duan K, Suresh K, Ke B, Wang K, Avgerinakis K, Sommer L, Zhang L, Yang L, Cheng L, Ma L, Lu L, Ding L, Huang M, Vedurupaka N.K, Mamgain N, Bansal N, Acatay O, Giannakeris P, Wang Q, Zhao Q, Liu K, Huang Q, Liu Q, Cheng Q, Sun Q, Lagani re R, Jiang S, Wang S, Wei S, Wang S, Vrochidis S, Wang S, Lee T, Sajid U, Balasubramanian V, Li W, Zhang W, Wu W, Ma W, He W, Yang W.-z, Chen X, Sun X, Luo X, Lian X, Li X, Kuai Y, Li Y, Luo Y, Zhang Y, Liu Y, Li Y, Wang Y, Wang Y, Wu Y, Fan Y, Wei Y, Zhang Y, Wang Z, Wang Z, Xia Z, Cui Z, He Z, Deng Z, Guo Z, Song Z (2019) Visdrone-det2019: The vision meets drone object detection in image challenge results. 2019 IEEE\/CVF International Conference on Computer Vision Workshop (ICCVW), 213\u2013226 https:\/\/doi.org\/10.1109\/iccvw.2019.00030","DOI":"10.1109\/iccvw.2019.00030"},{"key":"8104_CR47","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2019.11.023","author":"K Li","year":"2019","unstructured":"Li K, Wan G, Cheng G, Meng L, Han J (2019) Object detection in optical remote sensing images: A survey and a new benchmark. ISPRS J Photogram Remote Sens. https:\/\/doi.org\/10.1016\/j.isprsjprs.2019.11.023","journal-title":"ISPRS J Photogram Remote Sens"},{"key":"8104_CR48","doi-asserted-by":"publisher","unstructured":"Wang J, Yang W, Guo H, Zhang R, Xia GS (2021) Tiny object detection in aerial images. In: 2020 25th International Conference on Pattern Recognition (ICPR), pp. 3791\u20133798 https:\/\/doi.org\/10.1109\/icpr48806.2021.9413340","DOI":"10.1109\/icpr48806.2021.9413340"},{"key":"8104_CR49","doi-asserted-by":"publisher","unstructured":"Li C, Li L, Jiang H, Weng K, Geng Y, Li L, Ke Z, Li Q, Cheng M, Nie W, Li Y, Zhang B, Liang Y, Zhou L, Xu X, Chu X, Wei X, Wei X (2022) Yolov6: A single-stage object detection framework for industrial applications. https:\/\/doi.org\/10.48550\/arXiv.2209.02976","DOI":"10.48550\/arXiv.2209.02976"},{"key":"8104_CR50","doi-asserted-by":"publisher","unstructured":"Xu X, Jiang Y, Chen W, Huang Y, Zhang Y, Sun X (2022) Damo-yolo : A report on real-time object detection design. https:\/\/doi.org\/10.48550\/arXiv.2211.15444","DOI":"10.48550\/arXiv.2211.15444"},{"key":"8104_CR51","first-page":"51094","volume":"36","author":"C Wang","year":"2023","unstructured":"Wang C, He W, Nie Y, Guo J, Liu C, Wang Y, Han K (2023) Gold-yolo: efficient object detector via gather-and-distribute mechanism. Adv Neural Inf Process Syst 36:51094\u201351112","journal-title":"Adv Neural Inf Process Syst"},{"key":"8104_CR52","doi-asserted-by":"publisher","unstructured":"Liu J, Hou Q, Cheng MM, Wang C, Feng J (2020) Improving convolutional networks with self-calibrated convolutions. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10093\u201310102 https:\/\/doi.org\/10.1109\/cvpr42600.2020.01011","DOI":"10.1109\/cvpr42600.2020.01011"},{"key":"8104_CR53","doi-asserted-by":"publisher","unstructured":"Hu M, Feng J, Hua J, Lai B, Huang J, Gong X, Hua X (2022) Online convolutional re-parameterization. https:\/\/doi.org\/10.48550\/arXiv.2204.00826","DOI":"10.48550\/arXiv.2204.00826"},{"key":"8104_CR54","doi-asserted-by":"publisher","unstructured":"Xia Z, Pan X, Song S, Li LE, Huang G (2022) Vision transformer with deformable attention. https:\/\/doi.org\/10.48550\/arXiv.2201.00520","DOI":"10.48550\/arXiv.2201.00520"},{"key":"8104_CR55","doi-asserted-by":"crossref","unstructured":"He H, Zhang J, Cai Y, Chen H, Hu X, Gan Z, Wang Y, Wang C, Wu Y, Xie L (2024) Mobilemamba: Lightweight multi-receptive visual mamba network. arXiv:2411.15941","DOI":"10.1109\/CVPR52734.2025.00424"},{"key":"8104_CR56","doi-asserted-by":"publisher","unstructured":"Yu W, Wang X (2024) Mambaout: Do we really need mamba for vision? https:\/\/doi.org\/10.48550\/arXiv.2405.07992","DOI":"10.48550\/arXiv.2405.07992"},{"key":"8104_CR57","doi-asserted-by":"publisher","unstructured":"Li J, Zhang Z, Zuo W (2024) Rethinking transformer-based blind-spot network for self-supervised image denoising. https:\/\/doi.org\/10.48550\/arXiv.2404.07846","DOI":"10.48550\/arXiv.2404.07846"},{"issue":"6","key":"8104_CR58","doi-asserted-by":"publisher","first-page":"110714","DOI":"10.1016\/j.patcog.2024.110714","volume":"45","author":"Z Yu","year":"2024","unstructured":"Yu Z, Huang H, Chen W, Su Y, Liu Y, Wang X (2024) Yolo-facev2: a scale and occlusion aware face detector. Patt Recognit 45(6):110714","journal-title":"Patt Recognit"},{"key":"8104_CR59","doi-asserted-by":"publisher","unstructured":"Cai Z, Vasconcelos N (2017) Cascade r-cnn: delving into high quality object detection. https:\/\/doi.org\/10.48550\/arXiv.1712.00726","DOI":"10.48550\/arXiv.1712.00726"},{"key":"8104_CR60","doi-asserted-by":"publisher","unstructured":"Zhang S, Chi C, Yao Y, Lei Z, Li SZ (2019) Bridging the gap between anchor-based and anchor-free detection via adaptive training sample selection. https:\/\/doi.org\/10.48550\/arXiv.1912.02424","DOI":"10.48550\/arXiv.1912.02424"},{"key":"8104_CR61","doi-asserted-by":"publisher","unstructured":"Feng C, Zhong Y, Gao Y, Scott MR, Huang W (2021) Tood: task-aligned one-stage object detection. https:\/\/doi.org\/10.48550\/arXiv.2108.07755","DOI":"10.48550\/arXiv.2108.07755"},{"key":"8104_CR62","doi-asserted-by":"publisher","unstructured":"Zhang H, Li F, Liu S, Zhang L, Su H, Zhu J, Ni LM, Shum HY (2022) Dino: Detr with improved denoising anchor boxes for end-to-end object detection. https:\/\/doi.org\/10.48550\/arXiv.2203.03605","DOI":"10.48550\/arXiv.2203.03605"},{"key":"8104_CR63","doi-asserted-by":"publisher","unstructured":"Ge Z, Liu S, Wang F, Li Z, Sun J (2021) Yolox: Exceeding yolo series in 2021 https:\/\/doi.org\/10.48550\/arXiv.2107.08430","DOI":"10.48550\/arXiv.2107.08430"},{"key":"8104_CR64","doi-asserted-by":"publisher","unstructured":"Li X, Wang W, Wu L, Chen S, Hu X, Li J, Tang J, Yang J (2020) Generalized focal loss: learning qualified and distributed bounding boxes for dense object detection. https:\/\/doi.org\/10.48550\/arXiv.2006.04388","DOI":"10.48550\/arXiv.2006.04388"},{"key":"8104_CR65","doi-asserted-by":"publisher","unstructured":"Lyu C, Zhang W, Huang H, Zhou Y, Wang Y, Liu Y, Zhang S, Chen K (2022) Rtmdet: An empirical study of designing real-time object detectors. https:\/\/doi.org\/10.48550\/arXiv.2212.07784","DOI":"10.48550\/arXiv.2212.07784"},{"key":"8104_CR66","doi-asserted-by":"publisher","unstructured":"Zhao Y, Lv W, Xu S, Wei J, Wang G, Dang Q, Liu Y, Chen J (2023) Detrs beat yolos on real-time object detection. https:\/\/doi.org\/10.48550\/arXiv.2304.08069","DOI":"10.48550\/arXiv.2304.08069"},{"key":"8104_CR67","unstructured":"Peng Y, Li H, Wu P, Zhang Y, Sun X, Wu F (2024) D-FINE: redefine regression task in DETRs as fine-grained distribution refinement"},{"key":"8104_CR68","doi-asserted-by":"crossref","unstructured":"Huang S, Lu Z, Cun X, Yu Y, Zhou X, Shen X (2024) DEIM: DETR with improved matching for fast convergence","DOI":"10.1109\/CVPR52734.2025.01412"},{"key":"8104_CR69","doi-asserted-by":"publisher","unstructured":"Lv W, Zhao Y, Chang Q, Huang K, Wang G, Liu Y (2024) Rt-detrv2: improved baseline with bag-of-freebies for real-time detection transformer. https:\/\/doi.org\/10.48550\/arXiv.2407.17140","DOI":"10.48550\/arXiv.2407.17140"},{"key":"8104_CR70","unstructured":"Jocher G, Chaurasia A, Qiu J. Ultralytics YOLOv8. https:\/\/github.com\/ultralytics\/ultralytics"},{"key":"8104_CR71","unstructured":"Jocher G, Qiu J Ultralytics YOLO11. https:\/\/github.com\/ultralytics\/ultralytics"},{"key":"8104_CR72","doi-asserted-by":"publisher","unstructured":"Zhang S, Xinjiang W, Wang J, Pang J, Lyu C, Zhang W, Luo P, Chen K (2023) Dense distinct query for end-to-end object detection. https:\/\/doi.org\/10.48550\/arXiv.2303.12776","DOI":"10.48550\/arXiv.2303.12776"},{"key":"8104_CR73","doi-asserted-by":"publisher","unstructured":"Tian Z, Shen C, Chen H, He T (2019) Fcos: Fully convolutional one-stage object detection. In: 2019 IEEE\/CVF International Conference on Computer Vision (ICCV). IEEE, pp. 9626\u20139635, Seoul, Korea (South) https:\/\/doi.org\/10.1109\/iccv.2019.00972. https:\/\/ieeexplore.ieee.org\/document\/9010746\/","DOI":"10.1109\/iccv.2019.00972"}],"container-title":["The Journal of Supercomputing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-025-08104-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11227-025-08104-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-025-08104-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T10:13:10Z","timestamp":1765534390000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11227-025-08104-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,12]]},"references-count":73,"journal-issue":{"issue":"18","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["8104"],"URL":"https:\/\/doi.org\/10.1007\/s11227-025-08104-x","relation":{},"ISSN":["1573-0484"],"issn-type":[{"value":"1573-0484","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12,12]]},"assertion":[{"value":"23 May 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 November 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 December 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}},{"value":"The work described has not been published before, and its publication has been approved by the responsible authorities at the institution where the work is carried out.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}}],"article-number":"1646"}}