{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,4]],"date-time":"2026-02-04T18:29:01Z","timestamp":1770229741081,"version":"3.49.0"},"reference-count":57,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2024,7,26]],"date-time":"2024-07-26T00:00:00Z","timestamp":1721952000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,7,26]],"date-time":"2024-07-26T00:00:00Z","timestamp":1721952000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int. J. Mach. Learn. &amp; Cyber."],"published-print":{"date-parts":[[2024,12]]},"DOI":"10.1007\/s13042-024-02278-1","type":"journal-article","created":{"date-parts":[[2024,7,27]],"date-time":"2024-07-27T00:02:52Z","timestamp":1722038572000},"page":"5781-5805","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":13,"title":["Doublem-net: multi-scale spatial pyramid pooling-fast and multi-path adaptive feature pyramid network for UAV detection"],"prefix":"10.1007","volume":"15","author":[{"given":"Zhongxu","family":"Li","sequence":"first","affiliation":[]},{"given":"Qihan","family":"He","sequence":"additional","affiliation":[]},{"given":"Hong","family":"Zhao","sequence":"additional","affiliation":[]},{"given":"Wenyuan","family":"Yang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,7,26]]},"reference":[{"issue":"3","key":"2278_CR1","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1109\/JPROC.2023.3238524","volume":"111","author":"Z Zou","year":"2023","unstructured":"Zou Z, Chen K, Shi Z, Guo Y, Ye J (2023) Object detection in 20 years: a survey. Proc IEEE 111(3):257\u2013276","journal-title":"Proc IEEE"},{"key":"2278_CR2","doi-asserted-by":"publisher","first-page":"747","DOI":"10.1007\/s13042-020-01096-5","volume":"11","author":"X Wang","year":"2020","unstructured":"Wang X, Zhao Y, Pourpanah F (2020) Recent advances in deep learning. Int J Mach Learn Cybern 11:747\u2013750","journal-title":"Int J Mach Learn Cybern"},{"issue":"11","key":"2278_CR3","doi-asserted-by":"publisher","first-page":"12180","DOI":"10.1109\/TITS.2023.3292934","volume":"24","author":"J Cui","year":"2023","unstructured":"Cui J, Qin Y, Wu Y, Shao C, Yang H (2023) Skip connection yolo architecture for noise barrier defect detection using uav-based images in high-speed railway. IEEE Trans Intell Transp Syst 24(11):12180\u201312195","journal-title":"IEEE Trans Intell Transp Syst"},{"issue":"11","key":"2278_CR4","doi-asserted-by":"publisher","first-page":"12272","DOI":"10.1109\/TITS.2023.3290827","volume":"24","author":"X Li","year":"2023","unstructured":"Li X, Wu J (2023) Developing a more reliable framework for extracting traffic data from a uav video. IEEE Trans Intell Transp Syst 24(11):12272\u201312283","journal-title":"IEEE Trans Intell Transp Syst"},{"key":"2278_CR5","doi-asserted-by":"crossref","unstructured":"Huang J, Jiang X, Jin G (2022) Detection of river floating debris in uav images based on improved yolov5. In: 2022 International Joint Conference on Neural Networks, pp 1\u20138","DOI":"10.1109\/IJCNN55064.2022.9892392"},{"key":"2278_CR6","doi-asserted-by":"publisher","first-page":"128914","DOI":"10.1016\/j.optcom.2022.128914","volume":"527","author":"L Sun","year":"2023","unstructured":"Sun L, Zhang Y, Ouyang C, Yin S, Ren X, Fu S (2023) A portable uav-based laser-induced fluorescence lidar system for oil pollution and aquatic environment monitoring. Opt Commun 527:128914\u2013128928","journal-title":"Opt Commun"},{"key":"2278_CR7","doi-asserted-by":"crossref","unstructured":"Furusawa T, Premachandra C (2023) Innovative colormap for emphatic imaging of human voice for uav-based disaster victim search. In: 2023 IEEE Region 10 Symposium, pp. 1\u20135","DOI":"10.1109\/TENSYMP55890.2023.10223627"},{"key":"2278_CR8","doi-asserted-by":"crossref","unstructured":"Dorn C, Depold A, Lurz F, Erhardt S, Hagelauer A (2022) Uav-based localization of mobile phones for search and rescue applications. In: 2022 IEEE 22nd Annual Wireless and Microwave Technology Conference, pp. 1\u20134","DOI":"10.1109\/WAMICON53991.2022.9786189"},{"key":"2278_CR9","doi-asserted-by":"crossref","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2014) Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 580\u2013587","DOI":"10.1109\/CVPR.2014.81"},{"issue":"9","key":"2278_CR10","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He K, Zhang X, Ren S, Sun J (2015) Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE Trans Pattern Anal Mach Intell 37(9):1904\u20131916","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"2278_CR11","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2017","unstructured":"Ren S, He K, Girshick R, Sun J (2017) Faster r-cnn: towards real-time object detection with region proposal networks. IEEE Trans Pattern Anal Mach Intell 39:1\u201314","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"2278_CR12","doi-asserted-by":"crossref","unstructured":"Lin TY, Dollar P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2117\u20132125","DOI":"10.1109\/CVPR.2017.106"},{"key":"2278_CR13","doi-asserted-by":"crossref","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: unified, real-time object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 779\u2013788","DOI":"10.1109\/CVPR.2016.91"},{"key":"2278_CR14","doi-asserted-by":"crossref","unstructured":"Redmon J, Farhadi A (2017) Yolo9000: better, faster, stronger. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7263\u20137271","DOI":"10.1109\/CVPR.2017.690"},{"key":"2278_CR15","unstructured":"Redmon J, Farhadi A (2018) Yolov3: an incremental improvement arXiv:1804.02767"},{"key":"2278_CR16","unstructured":"Bochkovskiy A, Wang CY, Liao HYM (2020) Yolov4: optimal speed and accuracy of object detection arXiv:2004.10934"},{"key":"2278_CR17","unstructured":"Jocher G (2020) YOLOv5 by Ultralytics"},{"key":"2278_CR18","unstructured":"Li C, Li L, Geng Y, Jiang H, Cheng M, Zhang B, Ke Z, Xu X, Chu X (2023) Yolov6 v3.0: a full-scale reloading arXiv:2301.05586"},{"key":"2278_CR19","doi-asserted-by":"crossref","unstructured":"Wang CY, Bochkovskiy A, Liao HYM (2022) Yolov7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors arXiv:2207.02696","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"2278_CR20","unstructured":"Jocher G, Chaurasia A, Qiu J (2023) YOLO by Ultralytics"},{"key":"2278_CR21","doi-asserted-by":"crossref","unstructured":"Wang CY, Yeh IH, Liao HYM (2024) Yolov9: learning what you want to learn using programmable gradient information arXiv:2402.13616","DOI":"10.1007\/978-3-031-72751-1_1"},{"key":"2278_CR22","doi-asserted-by":"publisher","first-page":"1018","DOI":"10.3390\/rs14041018","volume":"14","author":"X Xu","year":"2022","unstructured":"Xu X, Zhang X, Zhang T (2022) Lite-yolov5: a lightweight deep learning detector for on-board ship detection in large-scene sentinel-1 sar images. Remote Sens 14:1018\u20131030","journal-title":"Remote Sens"},{"key":"2278_CR23","unstructured":"Xu X, Jiang Y, Chen W, Huang Y, Zhang Y, Sun X (2023) Damo-yolo: a report on real-time object detection design arXiv:2211.15444"},{"issue":"9","key":"2278_CR24","doi-asserted-by":"publisher","first-page":"1904","DOI":"10.1109\/TPAMI.2015.2389824","volume":"37","author":"K He","year":"2015","unstructured":"He K, Zhang X, Ren S, Sun J (2015) Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE Trans Pattern Anal Mach Intell 37(9):1904\u20131916","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"4","key":"2278_CR25","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"LC Chen","year":"2018","unstructured":"Chen LC, Papandreou G, Kokkinos I, Murphy K, Yuille AL (2018) Deeplab: semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected crfs. IEEE Trans Pattern Anal Mach Intell 40(4):834\u2013848","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"2278_CR26","doi-asserted-by":"crossref","unstructured":"Liu S, Huang D, Wang a (2018) Receptive field block net for accurate and fast object detection. In: Proceedings of the European Conference on Computer Vision, pp. 385\u2013400","DOI":"10.1007\/978-3-030-01252-6_24"},{"key":"2278_CR27","first-page":"11231","volume":"31","author":"C Szegedy","year":"2016","unstructured":"Szegedy C, Ioffe S, Vanhoucke V, Alemi A (2016) Inception-v4, inception-resnet and the impact of residual connections on learning. Proc AAAI Conf Artif Intell 31:11231\u201311245","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"2278_CR28","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu CY, Berg AC (2016) Ssd: single shot multibox detector. In: Computer Vision\u2014ECCV 2016: 14th European Conference, pp. 21\u201337","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"2278_CR29","doi-asserted-by":"crossref","unstructured":"Liu S, Qi L, Qin H, Shi J, Jia J (2018) Path aggregation network for instance segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8759\u20138768","DOI":"10.1109\/CVPR.2018.00913"},{"key":"2278_CR30","doi-asserted-by":"crossref","unstructured":"Tan M, Pang R, Le QV (2020) Efficientdet: scalable and efficient object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10781\u201310790","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"2278_CR31","doi-asserted-by":"publisher","first-page":"2771","DOI":"10.3390\/rs13142771","volume":"13","author":"T Zhang","year":"2021","unstructured":"Zhang T, Zhang X, Ke X (2021) Quad-fpn: a novel quad feature pyramid network for sar ship detection. Remote Sens 13:2771\u20132785","journal-title":"Remote Sens"},{"key":"2278_CR32","unstructured":"Jiang Y, Tan Z, Wang J, Sun X, Lin M, Li H (2022) Giraffedet: a heavy-neck paradigm for object detection arXiv:2202.04256"},{"key":"2278_CR33","doi-asserted-by":"publisher","first-page":"5276","DOI":"10.3390\/rs14205276","volume":"14","author":"X Xu","year":"2022","unstructured":"Xu X, Zhang X, Shao Z, Shi J, Wei S, Zhang T, Zeng T (2022) A group-wise feature enhancement-and-fusion network with dual-polarization feature enrichment for sar ship detection. Remote Sens 14:5276\u20135291","journal-title":"Remote Sens"},{"key":"2278_CR34","doi-asserted-by":"crossref","unstructured":"Yang G, Lei J, Zhu Z, Cheng S, Feng Z, Liang R (2023) Afpn: asymptotic feature pyramid network for object detection arXiv:2306.15988","DOI":"10.1109\/SMC53992.2023.10394415"},{"key":"2278_CR35","doi-asserted-by":"crossref","unstructured":"Saqib M, Khan SD, Sharma N, Blumenstein M (2017) A study on detecting drones using deep convolutional neural networks. In: 2017 14th IEEE International Conference on Advanced Video and Signal Based Surveillance, pp. 1\u20135","DOI":"10.1109\/AVSS.2017.8078541"},{"key":"2278_CR36","doi-asserted-by":"crossref","unstructured":"Chen C, Zhang Y, Lv Q, Wei S, Wang X, Sun X, Dong J (2019) Rrnet: a hybrid detector for object detection in drone-captured images. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision Workshops, pp. 100\u2013108","DOI":"10.1109\/ICCVW.2019.00018"},{"issue":"8","key":"2278_CR37","doi-asserted-by":"publisher","first-page":"9489","DOI":"10.1007\/s13369-021-06288-x","volume":"47","author":"SD Khan","year":"2022","unstructured":"Khan SD, Alarabi L, Basalamah S (2022) A unified deep learning framework of multi-scale detectors for geo-spatial object detection in high-resolution satellite images. Arab J Sci Eng 47(8):9489\u20139504","journal-title":"Arab J Sci Eng"},{"issue":"19","key":"2278_CR38","doi-asserted-by":"publisher","first-page":"3140","DOI":"10.3390\/rs12193140","volume":"12","author":"R Zhang","year":"2020","unstructured":"Zhang R, Shao Z, Huang X, Wang J, Li D (2020) Object detection in uav images via global density fused convolutional network. Remote Sens 12(19):3140\u20133143","journal-title":"Remote Sens"},{"key":"2278_CR39","doi-asserted-by":"publisher","first-page":"292","DOI":"10.1016\/j.neucom.2021.03.016","volume":"443","author":"G Tian","year":"2021","unstructured":"Tian G, Liu J, Yang W (2021) A dual neural network for object detection in uav images. Neurocomputing 443:292\u2013301","journal-title":"Neurocomputing"},{"issue":"10","key":"2278_CR40","doi-asserted-by":"publisher","first-page":"18855","DOI":"10.1109\/TITS.2022.3161977","volume":"23","author":"J Chen","year":"2022","unstructured":"Chen J, Wang Q, Peng W, Xu H, Li X, Xu W (2022) Disparity-based multiscale fusion network for transportation detection. IEEE Trans Intell Transp Syst 23(10):18855\u201318863","journal-title":"IEEE Trans Intell Transp Syst"},{"issue":"13","key":"2278_CR41","doi-asserted-by":"publisher","first-page":"19643","DOI":"10.1007\/s11042-023-14360-x","volume":"82","author":"S Li","year":"2023","unstructured":"Li S, Chen J, Peng W, Shi X, Bu W (2023) A vehicle detection method based on disparity segmentation. Multimed Tools Appl 82(13):19643\u201319655","journal-title":"Multimed Tools Appl"},{"issue":"5","key":"2278_CR42","first-page":"1","volume":"72","author":"B Ma","year":"2023","unstructured":"Ma B, Liu Z, Dang Q, Zhao W, Wang J, Cheng Y, Yuan Z (2023) Deep reinforcement learning of uav tracking control under wind disturbances environments. IEEE Trans Instrum Meas 72(5):1\u201313","journal-title":"IEEE Trans Instrum Meas"},{"key":"2278_CR43","doi-asserted-by":"publisher","first-page":"377","DOI":"10.1016\/j.neucom.2022.03.033","volume":"489","author":"R Zhang","year":"2022","unstructured":"Zhang R, Shao Z, Huang X, Wang J, Wang Y, Li D (2022) Adaptive dense pyramid network for object detection in uav imagery. Neurocomputing 489:377\u2013389","journal-title":"Neurocomputing"},{"key":"2278_CR44","doi-asserted-by":"publisher","first-page":"126384","DOI":"10.1016\/j.neucom.2023.126384","volume":"547","author":"T Wang","year":"2023","unstructured":"Wang T, Ma Z, Yang T, Zou S (2023) Petnet: a yolo-based prior enhanced transformer network for aerial image detection. Neurocomputing 547:126384\u2013126399","journal-title":"Neurocomputing"},{"key":"2278_CR45","unstructured":"Liu S, Huang D, Wang Y (2019) Learning spatial fusion for single-shot object detection arXiv:1911.09516"},{"issue":"11","key":"2278_CR46","doi-asserted-by":"publisher","first-page":"7380","DOI":"10.1109\/TPAMI.2021.3119563","volume":"44","author":"P Zhu","year":"2022","unstructured":"Zhu P, Wen L, Du D, Bian X, Fan H, Hu Q, Ling H (2022) Detection and tracking meet drones challenge. IEEE Trans Pattern Anal Mach Intell 44(11):7380\u20137399","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"10","key":"2278_CR47","doi-asserted-by":"publisher","first-page":"6700","DOI":"10.1109\/TCSVT.2022.3168279","volume":"32","author":"Y Sun","year":"2022","unstructured":"Sun Y, Cao B, Zhu P, Hu Q (2022) Drone-based rgb-infrared cross-modality vehicle detection via uncertainty-aware learning. IEEE Trans Circuits Syst Video Technol 32(10):6700\u20136713","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"2278_CR48","doi-asserted-by":"crossref","unstructured":"Zhu C, He Y, Savvides M (2019) Feature selective anchor-free module for single-shot object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 840\u2013849","DOI":"10.1109\/CVPR.2019.00093"},{"key":"2278_CR49","doi-asserted-by":"crossref","unstructured":"Zhang S, Chi C, Yao Y, Lei Z, Li SZ (2019) Bridging the gap between anchor-based and anchor-free detection via adaptive training sample selection arXiv:1912.02424","DOI":"10.1109\/CVPR42600.2020.00978"},{"key":"2278_CR50","doi-asserted-by":"crossref","unstructured":"Li Y, Chen Y, Wang N, Zhang Z (2019) Scale-aware trident networks for object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6054\u20136063","DOI":"10.1109\/ICCV.2019.00615"},{"key":"2278_CR51","unstructured":"Zhou X, Wang D, Kr\u00e4henb\u00fchl P (2019) Objects as points"},{"key":"2278_CR52","doi-asserted-by":"crossref","unstructured":"Tian Z, Shen C, Chen H, He T (2019) Fcos: fully convolutional one-stage object detection arXiv:1904.01355","DOI":"10.1109\/ICCV.2019.00972"},{"key":"2278_CR53","doi-asserted-by":"crossref","unstructured":"Chen Z, Yang C, Li Q, Zhao F, Zha ZJ, Wu F (2021) Disentangle your dense object detector. In: Proceedings of the 29th ACM International Conference on Multimedia, pp. 4939\u20134948","DOI":"10.1145\/3474085.3475351"},{"key":"2278_CR54","doi-asserted-by":"crossref","unstructured":"Feng C, Zhong Y, Gao Y, Scott MR, Huang W (2021) Tood: task-aligned one-stage object detection. In: 2021 IEEE\/CVF International Conference on Computer Vision, pp. 3490\u20133499","DOI":"10.1109\/ICCV48922.2021.00349"},{"key":"2278_CR55","doi-asserted-by":"crossref","unstructured":"Zhang H, Wang Y, Dayoub F, S\u00fcnderhauf N (2020) Varifocalnet: an iou-aware dense object detector arXiv:1200.81336","DOI":"10.1109\/CVPR46437.2021.00841"},{"key":"2278_CR56","first-page":"1","volume":"43","author":"Z Cai","year":"2019","unstructured":"Cai Z, Vasconcelos N (2019) Cascade r-cnn: high quality object detection and instance segmentation. IEEE Trans Pattern Anal Mach Intell 43:1\u201315","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"2278_CR57","unstructured":"Ge Z, Liu S, Wang F, Li Z, Sun J (2021) Yolox: exceeding yolo series in 2021 arXiv:2107.08430"}],"container-title":["International Journal of Machine Learning and Cybernetics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13042-024-02278-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s13042-024-02278-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13042-024-02278-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T10:27:11Z","timestamp":1730197631000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s13042-024-02278-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,26]]},"references-count":57,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2024,12]]}},"alternative-id":["2278"],"URL":"https:\/\/doi.org\/10.1007\/s13042-024-02278-1","relation":{},"ISSN":["1868-8071","1868-808X"],"issn-type":[{"value":"1868-8071","type":"print"},{"value":"1868-808X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,7,26]]},"assertion":[{"value":"21 October 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 July 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 July 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This article does not contain any research conducted by any author on human participants or animals and informed consent is obtained from all individual participants included in the study.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical and informed consent for data used"}}]}}