{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,5]],"date-time":"2026-03-05T02:06:50Z","timestamp":1772676410939,"version":"3.50.1"},"reference-count":34,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T00:00:00Z","timestamp":1748563200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T00:00:00Z","timestamp":1748563200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100009110","name":"Natural Science Foundation of Xinjiang Uygur Autonomous Region","doi-asserted-by":"publisher","award":["2022D01C83"],"award-info":[{"award-number":["2022D01C83"]}],"id":[{"id":"10.13039\/100009110","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100009110","name":"Natural Science Foundation of Xinjiang Uygur Autonomous Region","doi-asserted-by":"publisher","award":["2022D01C83"],"award-info":[{"award-number":["2022D01C83"]}],"id":[{"id":"10.13039\/100009110","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100009110","name":"Natural Science Foundation of Xinjiang Uygur Autonomous Region","doi-asserted-by":"publisher","award":["2022D01C83"],"award-info":[{"award-number":["2022D01C83"]}],"id":[{"id":"10.13039\/100009110","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100009110","name":"Natural Science Foundation of Xinjiang Uygur Autonomous Region","doi-asserted-by":"publisher","award":["2022D01C83"],"award-info":[{"award-number":["2022D01C83"]}],"id":[{"id":"10.13039\/100009110","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100009110","name":"Natural Science Foundation of Xinjiang Uygur Autonomous Region","doi-asserted-by":"publisher","award":["2022D01C83"],"award-info":[{"award-number":["2022D01C83"]}],"id":[{"id":"10.13039\/100009110","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Supercomput"],"DOI":"10.1007\/s11227-025-07362-z","type":"journal-article","created":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T07:48:58Z","timestamp":1748591338000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Stff-rtdetr: a small object detection algorithm based on drone aerial photography"],"prefix":"10.1007","volume":"81","author":[{"given":"Xiaoxi","family":"Teng","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wendong","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tao","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jingdong","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mengnan","family":"Ma","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,5,30]]},"reference":[{"issue":"1","key":"7362_CR1","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1109\/MGRS.2021.3115137","volume":"10","author":"X Wu","year":"2021","unstructured":"Wu X, Li W, Hong D, Tao R, Du Q (2021) Deep learning for unmanned aerial vehicle-based object detection and tracking: a survey. IEEE Geosci Remote Sens Mag 10(1):91\u2013124","journal-title":"IEEE Geosci Remote Sens Mag"},{"key":"7362_CR2","doi-asserted-by":"crossref","unstructured":"Jiao L, Wang M, Liu X, Li L, Liu F, Feng Z, Yang S, Hou B (2024) Multiscale deep learning for detection and recognition: a comprehensive survey. IEEE Trans Neural Netw Learn Syst","DOI":"10.1109\/TNNLS.2024.3389454"},{"key":"7362_CR3","doi-asserted-by":"publisher","first-page":"68324","DOI":"10.1109\/ACCESS.2023.3292302","volume":"11","author":"M Alhafnawi","year":"2023","unstructured":"Alhafnawi M, Salameh HAB, Masadeh A, Al-Obiedollah H, Ayyash M, El-Khazali R, Elgala H (2023) A survey of indoor and outdoor uav-based target tracking systems: current status, challenges, technologies, and future directions. IEEE Access 11:68324\u201368339","journal-title":"IEEE Access"},{"key":"7362_CR4","doi-asserted-by":"crossref","unstructured":"Zhang M, Zhang R, Yang Y, Bai H, Zhang J, Guo J (2022) Isnet: shape matters for infrared small target detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 877\u2013886","DOI":"10.1109\/CVPR52688.2022.00095"},{"key":"7362_CR5","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2022.104471","volume":"123","author":"K Tong","year":"2022","unstructured":"Tong K, Wu Y (2022) Deep learning-based detection from the perspective of small or tiny objects: a survey. Image Vis Comput 123:104471","journal-title":"Image Vis Comput"},{"key":"7362_CR6","doi-asserted-by":"crossref","unstructured":"Baykara HC, B\u0131y\u0131k E, G\u00fcl G, Onural D, \u00d6zt\u00fcrk AS, Y\u0131ld\u0131z I (2017) Real-time detection, tracking and classification of multiple moving objects in uav videos. In: 2017 IEEE 29th International Conference on Tools with Artificial Intelligence (ICTAI), pp 945\u2013950. IEEE","DOI":"10.1109\/ICTAI.2017.00145"},{"issue":"6","key":"7362_CR7","doi-asserted-by":"publisher","first-page":"3107","DOI":"10.1109\/TGRS.2018.2790926","volume":"56","author":"Y Bazi","year":"2018","unstructured":"Bazi Y, Melgani F (2018) Convolutional SVM networks for object detection in UAV imagery. IEEE Trans Geosci Remote Sens 56(6):3107\u20133118","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"7362_CR8","doi-asserted-by":"crossref","unstructured":"Carion N, Massa F, Synnaeve G, Usunier N, Kirillov A, Zagoruyko S (2020) End-to-end object detection with transformers. In: European Conference On Computer Vision. Springer, pp 213\u2013229","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"7362_CR9","doi-asserted-by":"crossref","unstructured":"Xie X, Cheng G, Wang J, Li K, Yao X, Han J (2024) Oriented R-CNN and beyond. Int J Comput Vis, pp 1\u201323","DOI":"10.1007\/s11263-024-01989-w"},{"key":"7362_CR10","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Goyal P, Girshick R, He K, Doll\u00e1r P (2017) Focal loss for dense object detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp 2980\u20132988","DOI":"10.1109\/ICCV.2017.324"},{"key":"7362_CR11","doi-asserted-by":"crossref","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 779\u2013788","DOI":"10.1109\/CVPR.2016.91"},{"issue":"4","key":"7362_CR12","doi-asserted-by":"publisher","first-page":"1680","DOI":"10.3390\/make5040083","volume":"5","author":"J Terven","year":"2023","unstructured":"Terven J, C\u00f3rdova-Esparza D-M, Romero-Gonz\u00e1lez J-A (2023) A comprehensive review of yolo architectures in computer vision: from yolov1 to yolov8 and yolo-nas. Mach Learn Knowl Extr 5(4):1680\u20131716","journal-title":"Mach Learn Knowl Extr"},{"key":"7362_CR13","doi-asserted-by":"crossref","unstructured":"Zhao Y, Lv W, Xu S, Wei J, Wang G, Dang Q, Liu Y, Chen J (2024) Detrs beat yolos on real-time object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 16965\u201316974","DOI":"10.1109\/CVPR52733.2024.01605"},{"key":"7362_CR14","doi-asserted-by":"crossref","unstructured":"Yang X, Yang J, Yan J, Zhang Y, Zhang T, Guo Z, Sun X, Fu K (2019) Scrdet: towards more robust detection for small, cluttered and rotated objects. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 8232\u20138241","DOI":"10.1109\/ICCV.2019.00832"},{"issue":"1","key":"7362_CR15","doi-asserted-by":"publisher","first-page":"2609","DOI":"10.1038\/s41598-024-53181-2","volume":"14","author":"Q Cheng","year":"2024","unstructured":"Cheng Q, Wang Y, He W, Bai Y (2024) Lightweight air-to-air unmanned aerial vehicle target detection model. Sci Rep 14(1):2609","journal-title":"Sci Rep"},{"issue":"3","key":"7362_CR16","doi-asserted-by":"publisher","first-page":"251","DOI":"10.2478\/jaiscr-2024-0014","volume":"14","author":"W Zhang","year":"2024","unstructured":"Zhang W, Hong Z, Xiong L, Zeng Z, Cai Z, Tan K (2024) Sinextnet: a new small object detection model for aerial images based on pp-yoloe. J Artif Intell Soft Comput Res 14(3):251\u2013265","journal-title":"J Artif Intell Soft Comput Res"},{"key":"7362_CR17","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1016\/j.patrec.2024.08.006","volume":"185","author":"A Jung","year":"2024","unstructured":"Jung A, Hong S, Hyun Y (2024) Scale-aware token-matching for transformer-based object detector. Pattern Recognit Lett 185:197\u2013202","journal-title":"Pattern Recognit Lett"},{"issue":"6","key":"7362_CR18","doi-asserted-by":"publisher","first-page":"240","DOI":"10.3390\/drones8060240","volume":"8","author":"S Wang","year":"2024","unstructured":"Wang S, Jiang H, Li Z, Yang J, Ma X, Chen J, Tang X (2024) Phsi-rtdetr: a lightweight infrared small target detection algorithm based on UAV aerial photography. Drones 8(6):240","journal-title":"Drones"},{"issue":"6","key":"7362_CR19","doi-asserted-by":"publisher","first-page":"3329","DOI":"10.1007\/s00530-023-01182-y","volume":"29","author":"X Wang","year":"2023","unstructured":"Wang X, He N, Hong C, Sun F, Han W, Wang Q (2023) Yolo-erf: lightweight object detector for UAV aerial images. Multimed Syst 29(6):3329\u20133339","journal-title":"Multimed Syst"},{"key":"7362_CR20","doi-asserted-by":"crossref","unstructured":"Ding X, Zhang Y, Ge Y, Zhao S, Song L, Yue X, Shan Y (2024) Unireplknet: a universal perception large-kernel convnet for audio video point cloud time-series and image recognition. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 5513\u20135524","DOI":"10.1109\/CVPR52733.2024.00527"},{"key":"7362_CR21","doi-asserted-by":"crossref","unstructured":"Sunkara R, Luo T (2022) No more strided convolutions or pooling: a new CNN building block for low-resolution images and small objects. In: Joint European Conference on Machine Learning and Knowledge Discovery in Databases. Springer, pp 443\u2013459","DOI":"10.1007\/978-3-031-26409-2_27"},{"key":"7362_CR22","doi-asserted-by":"crossref","unstructured":"Cui Y, Ren W, Knoll A (2024) Omni-kernel network for image restoration. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol 38, pp 1426\u20131434","DOI":"10.1609\/aaai.v38i2.27907"},{"key":"7362_CR23","doi-asserted-by":"crossref","unstructured":"Du D, Zhu P, Wen L, Bian X, Lin H, Hu Q, Peng T, Zheng J, Wang X, Zhang Y et al (2019) Visdrone-det2019: the vision meets drone object detection in image challenge results. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision Workshops","DOI":"10.1109\/ICCVW.2019.00031"},{"issue":"1","key":"7362_CR24","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1038\/s41597-023-02066-6","volume":"10","author":"J Suo","year":"2023","unstructured":"Suo J, Wang T, Zhang X, Chen H, Zhou W, Shi W (2023) Hit-UAV: a high-altitude infrared thermal dataset for unmanned aerial vehicle-based object detection. Sci Data 10(1):227","journal-title":"Sci Data"},{"key":"7362_CR25","doi-asserted-by":"crossref","unstructured":"Feng C, Zhong Y, Gao Y, Scott MR, Huang W (2021) Tood: task-aligned one-stage object detection. In: 2021 IEEE\/CVF International Conference on Computer Vision (ICCV). IEEE Computer Society, pp 3490\u20133499","DOI":"10.1109\/ICCV48922.2021.00349"},{"key":"7362_CR26","unstructured":"Ge Z, Liu S, Wang F, Li Z, Sun J (2021) Yolox: exceeding yolo series in 2021. arXiv preprint arXiv:2107.08430"},{"key":"7362_CR27","doi-asserted-by":"publisher","first-page":"361","DOI":"10.1007\/s00500-021-06407-8","volume":"26","author":"W Zhan","year":"2022","unstructured":"Zhan W, Sun C, Wang M, She J, Zhang Y, Zhang Z, Sun Y (2022) An improved yolov5 real-time detection method for small objects captured by UAV. Soft Comput 26:361\u2013373","journal-title":"Soft Comput"},{"key":"7362_CR28","unstructured":"Li C, Li L, Jiang H, Weng K, Geng Y, Li L, Ke Z, Li Q, Cheng M, Nie W, et al (2022) Yolov6: a single-stage object detection framework for industrial applications. arXiv preprint arXiv:2209.02976"},{"key":"7362_CR29","unstructured":"Lyu C, Zhang W, Huang H, Zhou Y, Wang Y, Liu Y, Zhang S, Chen K (2022) Rtmdet: an empirical study of designing real-time object detectors. arXiv preprint arXiv:2212.07784"},{"key":"7362_CR30","doi-asserted-by":"crossref","unstructured":"Wang C-Y, Bochkovskiy A, Liao H-YM (2023) Yolov7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 7464\u20137475","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"7362_CR31","unstructured":"Jocher G, Qiu J, Chaurasia A. Ultralytics YOLO. https:\/\/github.com\/ultralytics\/ultralytics"},{"key":"7362_CR32","doi-asserted-by":"crossref","unstructured":"Wang C-Y, Yeh I-H, Mark\u00a0Liao H-Y (2024) Yolov9: learning what you want to learn using programmable gradient information. In: European Conference on Computer Vision. Springer, pp 1\u201321","DOI":"10.1007\/978-3-031-72751-1_1"},{"key":"7362_CR33","first-page":"107984","volume":"37","author":"A Wang","year":"2024","unstructured":"Wang A, Chen H, Liu L, Chen K, Lin Z, Han J et al (2024) Yolov10: real-time end-to-end object detection. Adv Neural Inf Process Syst 37:107984\u2013108011","journal-title":"Adv Neural Inf Process Syst"},{"key":"7362_CR34","unstructured":"Khanam R, Hussain M (2024) Yolov11: an overview of the key architectural enhancements. arXiv preprint arXiv:2410.17725"}],"container-title":["The Journal of Supercomputing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-025-07362-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11227-025-07362-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-025-07362-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T07:49:10Z","timestamp":1748591350000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11227-025-07362-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,30]]},"references-count":34,"journal-issue":{"issue":"8","published-online":{"date-parts":[[2025,6]]}},"alternative-id":["7362"],"URL":"https:\/\/doi.org\/10.1007\/s11227-025-07362-z","relation":{},"ISSN":["1573-0484"],"issn-type":[{"value":"1573-0484","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,5,30]]},"assertion":[{"value":"30 April 2025","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 May 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"928"}}