{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T21:22:49Z","timestamp":1774992169160,"version":"3.50.1"},"reference-count":55,"publisher":"MDPI AG","issue":"14","license":[{"start":{"date-parts":[[2023,7,9]],"date-time":"2023-07-09T00:00:00Z","timestamp":1688860800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["2019YFE0126600"],"award-info":[{"award-number":["2019YFE0126600"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["201400210300"],"award-info":[{"award-number":["201400210300"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["212102210496"],"award-info":[{"award-number":["212102210496"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["212102210393"],"award-info":[{"award-number":["212102210393"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["202102110121"],"award-info":[{"award-number":["202102110121"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["2002001"],"award-info":[{"award-number":["2002001"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["62176087"],"award-info":[{"award-number":["62176087"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["2021Szvup032"],"award-info":[{"award-number":["2021Szvup032"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Major Project of Science and Technology of Henan Province","award":["2019YFE0126600"],"award-info":[{"award-number":["2019YFE0126600"]}]},{"name":"Major Project of Science and Technology of Henan Province","award":["201400210300"],"award-info":[{"award-number":["201400210300"]}]},{"name":"Major Project of Science and Technology of Henan Province","award":["212102210496"],"award-info":[{"award-number":["212102210496"]}]},{"name":"Major Project of Science and Technology of Henan Province","award":["212102210393"],"award-info":[{"award-number":["212102210393"]}]},{"name":"Major Project of Science and Technology of Henan Province","award":["202102110121"],"award-info":[{"award-number":["202102110121"]}]},{"name":"Major Project of Science and Technology of Henan Province","award":["2002001"],"award-info":[{"award-number":["2002001"]}]},{"name":"Major Project of Science and Technology of Henan Province","award":["62176087"],"award-info":[{"award-number":["62176087"]}]},{"name":"Major Project of Science and Technology of Henan Province","award":["2021Szvup032"],"award-info":[{"award-number":["2021Szvup032"]}]},{"name":"Key Scientific and Technological Project of Henan Province","award":["2019YFE0126600"],"award-info":[{"award-number":["2019YFE0126600"]}]},{"name":"Key Scientific and Technological Project of Henan Province","award":["201400210300"],"award-info":[{"award-number":["201400210300"]}]},{"name":"Key Scientific and Technological Project of Henan Province","award":["212102210496"],"award-info":[{"award-number":["212102210496"]}]},{"name":"Key Scientific and Technological Project of Henan Province","award":["212102210393"],"award-info":[{"award-number":["212102210393"]}]},{"name":"Key Scientific and Technological Project of Henan Province","award":["202102110121"],"award-info":[{"award-number":["202102110121"]}]},{"name":"Key Scientific and Technological Project of Henan Province","award":["2002001"],"award-info":[{"award-number":["2002001"]}]},{"name":"Key Scientific and Technological Project of Henan Province","award":["62176087"],"award-info":[{"award-number":["62176087"]}]},{"name":"Key Scientific and Technological Project of Henan Province","award":["2021Szvup032"],"award-info":[{"award-number":["2021Szvup032"]}]},{"name":"Key Research and Promotion Projects of Henan Province","award":["2019YFE0126600"],"award-info":[{"award-number":["2019YFE0126600"]}]},{"name":"Key Research and Promotion Projects of Henan Province","award":["201400210300"],"award-info":[{"award-number":["201400210300"]}]},{"name":"Key Research and Promotion Projects of Henan Province","award":["212102210496"],"award-info":[{"award-number":["212102210496"]}]},{"name":"Key Research and Promotion Projects of Henan Province","award":["212102210393"],"award-info":[{"award-number":["212102210393"]}]},{"name":"Key Research and Promotion Projects of Henan Province","award":["202102110121"],"award-info":[{"award-number":["202102110121"]}]},{"name":"Key Research and Promotion Projects of Henan Province","award":["2002001"],"award-info":[{"award-number":["2002001"]}]},{"name":"Key Research and Promotion Projects of Henan Province","award":["62176087"],"award-info":[{"award-number":["62176087"]}]},{"name":"Key Research and Promotion Projects of Henan Province","award":["2021Szvup032"],"award-info":[{"award-number":["2021Szvup032"]}]},{"name":"Kaifeng Science and Technology Development Plan","award":["2019YFE0126600"],"award-info":[{"award-number":["2019YFE0126600"]}]},{"name":"Kaifeng Science and Technology Development Plan","award":["201400210300"],"award-info":[{"award-number":["201400210300"]}]},{"name":"Kaifeng Science and Technology Development Plan","award":["212102210496"],"award-info":[{"award-number":["212102210496"]}]},{"name":"Kaifeng Science and Technology Development Plan","award":["212102210393"],"award-info":[{"award-number":["212102210393"]}]},{"name":"Kaifeng Science and Technology Development Plan","award":["202102110121"],"award-info":[{"award-number":["202102110121"]}]},{"name":"Kaifeng Science and Technology Development Plan","award":["2002001"],"award-info":[{"award-number":["2002001"]}]},{"name":"Kaifeng Science and Technology Development Plan","award":["62176087"],"award-info":[{"award-number":["62176087"]}]},{"name":"Kaifeng Science and Technology Development Plan","award":["2021Szvup032"],"award-info":[{"award-number":["2021Szvup032"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["2019YFE0126600"],"award-info":[{"award-number":["2019YFE0126600"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["201400210300"],"award-info":[{"award-number":["201400210300"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["212102210496"],"award-info":[{"award-number":["212102210496"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["212102210393"],"award-info":[{"award-number":["212102210393"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["202102110121"],"award-info":[{"award-number":["202102110121"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["2002001"],"award-info":[{"award-number":["2002001"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62176087"],"award-info":[{"award-number":["62176087"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["2021Szvup032"],"award-info":[{"award-number":["2021Szvup032"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Shenzhen Science and Technology Innovation Commission (SZSTI), Shenzhen Virtual University Park (SZVUP) Special Fund Project","award":["2019YFE0126600"],"award-info":[{"award-number":["2019YFE0126600"]}]},{"name":"Shenzhen Science and Technology Innovation Commission (SZSTI), Shenzhen Virtual University Park (SZVUP) Special Fund Project","award":["201400210300"],"award-info":[{"award-number":["201400210300"]}]},{"name":"Shenzhen Science and Technology Innovation Commission (SZSTI), Shenzhen Virtual University Park (SZVUP) Special Fund Project","award":["212102210496"],"award-info":[{"award-number":["212102210496"]}]},{"name":"Shenzhen Science and Technology Innovation Commission (SZSTI), Shenzhen Virtual University Park (SZVUP) Special Fund Project","award":["212102210393"],"award-info":[{"award-number":["212102210393"]}]},{"name":"Shenzhen Science and Technology Innovation Commission (SZSTI), Shenzhen Virtual University Park (SZVUP) Special Fund Project","award":["202102110121"],"award-info":[{"award-number":["202102110121"]}]},{"name":"Shenzhen Science and Technology Innovation Commission (SZSTI), Shenzhen Virtual University Park (SZVUP) Special Fund Project","award":["2002001"],"award-info":[{"award-number":["2002001"]}]},{"name":"Shenzhen Science and Technology Innovation Commission (SZSTI), Shenzhen Virtual University Park (SZVUP) Special Fund Project","award":["62176087"],"award-info":[{"award-number":["62176087"]}]},{"name":"Shenzhen Science and Technology Innovation Commission (SZSTI), Shenzhen Virtual University Park (SZVUP) Special Fund Project","award":["2021Szvup032"],"award-info":[{"award-number":["2021Szvup032"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Remote Sensing"],"abstract":"<jats:p>Unmanned aerial vehicle (UAV) image object detection has great application value in the military and civilian fields. However, the objects in the captured images from UAVs have problems of large-scale variation, complex backgrounds, and a large proportion of small objects. To resolve these problems, a multi-scale object detector based on coordinate and global information aggregation is proposed, named CGMDet. Firstly, a Coordinate and Global Information Aggregation Module (CGAM) is designed by aggregating local, coordinate, and global information, which can obtain features with richer context information. Secondly, a Feature Fusion Module (FFM) is proposed, which can better fuse features by learning the importance of different scale features and improve the representation ability of multi-scale features by reusing feature maps to help models better detect multi-scale objects. Moreover, more location information of low-level feature maps is integrated to improve the detection results of small targets. Furthermore, we modified the bounding box regression loss of the model to make the model more accurately regress the bounding box and faster convergence. Finally, we tested the CGMDet on VisDrone and UAVDT datasets. The proposed CGMDet improves mAP0.5 by 1.9% on the VisDrone dataset and 3.0% on the UAVDT dataset.<\/jats:p>","DOI":"10.3390\/rs15143468","type":"journal-article","created":{"date-parts":[[2023,7,10]],"date-time":"2023-07-10T00:47:35Z","timestamp":1688950055000},"page":"3468","update-policy":"https:\/\/doi.org\/10.3390\/mdpi_crossmark_policy","source":"Crossref","is-referenced-by-count":20,"title":["A Multi-Scale Object Detector Based on Coordinate and Global Information Aggregation for UAV Aerial Images"],"prefix":"10.3390","volume":"15","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8741-0827","authenticated-orcid":false,"given":"Liming","family":"Zhou","sequence":"first","affiliation":[{"name":"Henan Key Laboratory of Big Data Analysis and Processing, Henan University, Kaifeng 475004, China"},{"name":"School of Computer and Information Engineering, Henan University, Kaifeng 475004, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-6800-4645","authenticated-orcid":false,"given":"Zhehao","family":"Liu","sequence":"additional","affiliation":[{"name":"Henan Key Laboratory of Big Data Analysis and Processing, Henan University, Kaifeng 475004, China"},{"name":"School of Computer and Information Engineering, Henan University, Kaifeng 475004, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-8690-415X","authenticated-orcid":false,"given":"Hang","family":"Zhao","sequence":"additional","affiliation":[{"name":"Henan Key Laboratory of Big Data Analysis and Processing, Henan University, Kaifeng 475004, China"},{"name":"School of Computer and Information Engineering, Henan University, Kaifeng 475004, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4836-0406","authenticated-orcid":false,"given":"Yan-e","family":"Hou","sequence":"additional","affiliation":[{"name":"Henan Key Laboratory of Big Data Analysis and Processing, Henan University, Kaifeng 475004, China"},{"name":"School of Computer and Information Engineering, Henan University, Kaifeng 475004, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7018-646X","authenticated-orcid":false,"given":"Yang","family":"Liu","sequence":"additional","affiliation":[{"name":"Henan Key Laboratory of Big Data Analysis and Processing, Henan University, Kaifeng 475004, China"},{"name":"School of Computer and Information Engineering, Henan University, Kaifeng 475004, China"},{"name":"Henan Province Engineering Research Center of Spatial Information Processing and Shenzhen Research Institute, Henan University, Kaifeng 475004, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5675-2362","authenticated-orcid":false,"given":"Xianyu","family":"Zuo","sequence":"additional","affiliation":[{"name":"Henan Key Laboratory of Big Data Analysis and Processing, Henan University, Kaifeng 475004, China"},{"name":"School of Computer and Information Engineering, Henan University, Kaifeng 475004, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1053-6741","authenticated-orcid":false,"given":"Lanxue","family":"Dang","sequence":"additional","affiliation":[{"name":"Henan Key Laboratory of Big Data Analysis and Processing, Henan University, Kaifeng 475004, China"},{"name":"School of Computer and Information Engineering, Henan University, Kaifeng 475004, China"}]}],"member":"1968","published-online":{"date-parts":[[2023,7,9]]},"reference":[{"key":"ref_1","doi-asserted-by":"crossref","first-page":"8851","DOI":"10.1109\/TII.2022.3153031","article-title":"Multiperiod unmanned aerial vehicles path planning with dynamic emergency priorities for geohazards monitoring","volume":"18","author":"Wei","year":"2022","journal-title":"IEEE Trans. Ind. Inform."},{"key":"ref_2","first-page":"100292","article-title":"Workflow for capturing information and characterizing difficult-to-access geological outcrops using unmanned aerial vehicle-based digital photogrammetric data","volume":"26","author":"Villarreal","year":"2022","journal-title":"J. Ind. Inf. Integr."},{"key":"ref_3","doi-asserted-by":"crossref","first-page":"2558","DOI":"10.1109\/TAES.2021.3053115","article-title":"Decentralized autonomous navigation of a uav network for road traffic monitoring","volume":"57","author":"Hailong","year":"2021","journal-title":"IEEE Trans. Aerosp. Electron. Syst."},{"key":"ref_4","doi-asserted-by":"crossref","first-page":"3411","DOI":"10.1109\/JSAC.2021.3088662","article-title":"Joint optimisation of real-time deployment and resource allocation for uav-aided disaster emergency communications","volume":"39","author":"Nguyen","year":"2021","journal-title":"IEEE J. Sel. Areas Commun."},{"key":"ref_5","unstructured":"Dalal, N., and Triggs, B. (2005, January 20\u201325). Histograms of oriented gradients for human detection. Proceedings of the 2005 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR\u201905), San Diego, CA, USA."},{"key":"ref_6","doi-asserted-by":"crossref","first-page":"1150","DOI":"10.1109\/ICCV.1999.790410","article-title":"Object recognition from local scale-invariant features","volume":"2","author":"Lowe","year":"1999","journal-title":"Proc. Seventh IEEE Int. Conf. Comput. Vis."},{"key":"ref_7","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., and Malik, J. (2014, January 28). Rich feature hierarchies for accurate object detection and semantic segmentation. Proceedings of the 2014 IEEE Conference on Computer Vision and Pattern Recognition, Columbus, OH, USA.","DOI":"10.1109\/CVPR.2014.81"},{"key":"ref_8","doi-asserted-by":"crossref","unstructured":"Girshick, R. (2015, January 7\u201313). Fast r-cnn. Proceedings of the 2015 IEEE International Conference on Computer Vision (ICCV), Santiago, Chile.","DOI":"10.1109\/ICCV.2015.169"},{"key":"ref_9","doi-asserted-by":"crossref","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","article-title":"Faster r-cnn: Towards real-time object detection with region proposal networks","volume":"39","author":"Ren","year":"2017","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"ref_10","doi-asserted-by":"crossref","first-page":"1907","DOI":"10.1109\/TPAMI.2015.2389824","article-title":"Spatial pyramid pooling in deep convolutional networks for visual recognition","volume":"37","author":"He","year":"2015","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"ref_11","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.Y., and Berg, A.C. (2016, January 11\u201314). Ssd: Single shot multibox detector. Proceedings of the European Conference on Computer Vision, Amsterdam, The Netherlands.","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"ref_12","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Goyal, P., Girshick, R., He, K., and Doll\u00e1r, P. (2017, January 22\u201329). Focal loss for dense object detection. Proceedings of the 2017 IEEE International Conference on Computer Vision (ICCV), Venice, Italy.","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref_13","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., and Farhadi, A. (2016, January 27\u201330). You only look once: Unified, real-time object detection. Proceedings of the 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), Las Vegas, NV, USA.","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref_14","doi-asserted-by":"crossref","unstructured":"Redmon, J., and Farhadi, A. (2017, January 21\u201326). Yolo9000: Better, faster, stronger. Proceedings of the 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), Honolulu, HI, USA.","DOI":"10.1109\/CVPR.2017.690"},{"key":"ref_15","unstructured":"Redmon, J., and Farhadi, A. (2018). Yolov3: An incremental improvement. arXiv."},{"key":"ref_16","unstructured":"Bochkovskiy, A., Wang, C.Y., and Liao, H.Y.M. (2020). Yolov4: Optimal speed and accuracy of object detection. arXiv."},{"key":"ref_17","unstructured":"Ultralytics (2022, June 18). Yolov5. Available online: https:\/\/github.com\/ultralytics\/yolov5."},{"key":"ref_18","unstructured":"Wang, C.Y., Bochkovskiy, A., and Liao, H.Y.M. (2022). YOLOv7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. arXiv."},{"key":"ref_19","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Chen, H., and He, T. (November, January 27). Fcos: Fully convolutional one-stage object detection. Proceedings of the 2019 IEEE\/CVF International Conference on Computer Vision (ICCV), Seoul, Republic of Korea.","DOI":"10.1109\/ICCV.2019.00972"},{"key":"ref_20","unstructured":"Zhou, X., Wang, D., and Kr\u00e4henb\u00fchl, P. (2019). Objects as points. arXiv."},{"key":"ref_21","doi-asserted-by":"crossref","unstructured":"Liu, S., Zha, J., Sun, J., Li, Z., and Wang, G. (2023). EdgeYOLO: An Edge-Real-Time Object Detector. arXiv.","DOI":"10.23919\/CCC58697.2023.10239786"},{"key":"ref_22","first-page":"102912","article-title":"Object detection from UAV thermal infrared images and videos using YOLO models","volume":"112","author":"Jiang","year":"2022","journal-title":"Int. J. Appl. Earth Obs. Geoinf."},{"key":"ref_23","unstructured":"Yang, F., Fan, H., Chu, P., Blasch, E., and Ling, H. (November, January 27). Clustered object detection in aerial images. Proceedings of the IEEE\/CVF International Conference on Computer Vision, Seoul, Republic of Korea."},{"key":"ref_24","doi-asserted-by":"crossref","unstructured":"Li, C., Yang, T., Zhu, S., Chen, C., and Guan, S. (2020, January 13\u201319). Density map guided object detection in aerial images. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, Seattle, WA, USA.","DOI":"10.1109\/CVPRW50498.2020.00103"},{"key":"ref_25","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., and Sun, G. (2018, January 18\u201323). Squeeze-and-excitation networks. Proceedings of the 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, Salt Lake City, UT, USA.","DOI":"10.1109\/CVPR.2018.00745"},{"key":"ref_26","doi-asserted-by":"crossref","unstructured":"Wang, Q., Wu, B., Zhu, P., Li, P., Zuo, W., and Hu, Q. (2020, January 13\u201319). ECA-Net: Efficient Channel Attention for Deep Convolutional Neural Networks. Proceedings of the 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), Seattle, WA, USA.","DOI":"10.1109\/CVPR42600.2020.01155"},{"key":"ref_27","doi-asserted-by":"crossref","unstructured":"Lee, Y., and Park, J. (2020, January 13\u201319). CenterMask: Real-Time Anchor-Free Instance Segmentation. Proceedings of the 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), Seattle, WA, USA.","DOI":"10.1109\/CVPR42600.2020.01392"},{"key":"ref_28","doi-asserted-by":"crossref","unstructured":"Hou, Q., Zhou, D., and Feng, J. (2021, January 20\u201325). Coordinate Attention for Efficient Mobile Network Design. Proceedings of the 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), Nashville, TN, USA.","DOI":"10.1109\/CVPR46437.2021.01350"},{"key":"ref_29","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.Y., and Kweon, I.S. (2018, January 8\u201314). Cbam: Convolutional block attention module. Proceedings of the European Conference on Computer Vision (ECCV), Munich, Germany.","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"ref_30","doi-asserted-by":"crossref","unstructured":"Ye, Y., Ren, X., Zhu, B., Tang, T., Tan, X., Gui, Y., and Yao, Q. (2022). An Adaptive Attention Fusion Mechanism Convolutional Network for Object Detection in Remote Sensing Images. Remote Sens., 14.","DOI":"10.3390\/rs14030516"},{"key":"ref_31","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., and Belongie, S. (2017, January 21\u201326). Feature pyramid networks for object detection. Proceedings of the 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), Honolulu, HI, USA.","DOI":"10.1109\/CVPR.2017.106"},{"key":"ref_32","doi-asserted-by":"crossref","unstructured":"Liu, S., Qi, L., Qin, H., Shi, J., and Jia, J. (2018, January 18\u201323). Path aggregation network for instance segmentation. Proceedings of the 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, Salt Lake City, UT, USA.","DOI":"10.1109\/CVPR.2018.00913"},{"key":"ref_33","unstructured":"Zhao, Q., Sheng, T., Wang, Y., Tang, Z., Chen, Y., Cai, L., and Ling, H. (February, January 27). M2Det: A Single-Shot Object Detector Based on Multi-Level Feature Pyramid Network. Proceedings of the Thirty-Third AAAI Conference on Artificial Intelligence, Honolulu, HI, USA."},{"key":"ref_34","doi-asserted-by":"crossref","unstructured":"Tan, M., Pang, R., and Le, Q.V. (2020, January 13\u201319). Efficientdet: Scalable and efficient object detection. Proceedings of the 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), Seattle, WA, USA.","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"ref_35","unstructured":"Ioffe, S., and Szegedy, C. (2015, January 6\u201311). Batch normalization: Accelerating deep network training by reducing internal covariate shift. Proceedings of the ICML\u201915: 32nd International Conference on International Conference on Machine Learning, Lille, France."},{"key":"ref_36","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1016\/j.neunet.2017.12.012","article-title":"Sigmoid-weighted linear units for neural network function approximation in reinforcement learning","volume":"107","author":"Elfwing","year":"2018","journal-title":"Neural Netw."},{"key":"ref_37","unstructured":"Wang, C.Y., Liao, H.Y.M., and Yeh, I.H. (2022). Designing network design strategies through gradient path analysis. arXiv."},{"key":"ref_38","doi-asserted-by":"crossref","unstructured":"Zheng, Z., Wang, P., Liu, W., Li, J., Ye, R., and Ren, D. (2020, January 7\u201312). Distance-iou loss: Faster and better learning for bounding box regression. Proceedings of the AAAI Conference on Artificial Intelligence, New York, NY, USA.","DOI":"10.1609\/aaai.v34i07.6999"},{"key":"ref_39","doi-asserted-by":"crossref","first-page":"146","DOI":"10.1016\/j.neucom.2022.07.042","article-title":"Focal and efficient iou loss for accurate bounding box regression","volume":"506","author":"Zhang","year":"2022","journal-title":"Neurocomputing"},{"key":"ref_40","doi-asserted-by":"crossref","unstructured":"Sun, Z., Leng, X., Lei, Y., Xiong, B., Ji, K., and Kuang, G. (2021). BiFA-YOLO: A Novel YOLO-Based Method for Arbitrary-Oriented Ship Detection in High-Resolution SAR Images. Remote Sens., 13.","DOI":"10.3390\/rs13214209"},{"key":"ref_41","doi-asserted-by":"crossref","first-page":"7380","DOI":"10.1109\/TPAMI.2021.3119563","article-title":"Detection and tracking meet drones challenge","volume":"44","author":"Zhu","year":"2022","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"ref_42","doi-asserted-by":"crossref","unstructured":"Du, D., Qi, Y., Yu, H., Yang, Y., Duan, K., Li, G., Zhang, W., Huang, Q., and Tian, Q. (2018, January 8\u201314). The unmanned aerial vehicle benchmark: Object detection and tracking. Proceedings of the European Conference on Computer Vision (ECCV), Munich, Germany.","DOI":"10.1007\/978-3-030-01249-6_23"},{"key":"ref_43","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Maire, M., Belongie, S., Hays, J., Perona, P., Ramanan, D., Doll\u00e1r, P., and Zitnick, C.L. (2014, January 6\u201312). Microsoft coco: Common objects in context. Proceedings of the European Conference on Computer Vision, Zurich, Switzerland.","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref_44","doi-asserted-by":"crossref","unstructured":"Cai, Z., and Vasconcelos, N. (2018, January 18\u201323). Cascade R-CNN: Delving Into High Quality Object Detection. Proceedings of the 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, Salt Lake City, UT, USA.","DOI":"10.1109\/CVPR.2018.00644"},{"key":"ref_45","unstructured":"Ge, Z., Liu, S., Wang, F., Li, Z., and Sun, J. (2021). Yolox: Exceeding yolo series in 2021. arXiv."},{"key":"ref_46","doi-asserted-by":"crossref","first-page":"364","DOI":"10.1016\/j.neucom.2020.06.011","article-title":"Novel up-scale feature aggregation for object detection in aerial images","volume":"411","author":"Lin","year":"2020","journal-title":"Neurocomputing"},{"key":"ref_47","doi-asserted-by":"crossref","unstructured":"Yang, C., Huang, Z., and Wang, N. (2022, January 18\u201324). Querydet: Cascaded sparse query for accelerating high-resolution small object detection. Proceedings of the 2022 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), New Orleans, LA, USA.","DOI":"10.1109\/CVPR52688.2022.01330"},{"key":"ref_48","unstructured":"Wang, J., Xu, C., Yang, W., and Yu, L. (2021). A normalized Gaussian Wasserstein distance for tiny object detection. arXiv."},{"key":"ref_49","doi-asserted-by":"crossref","unstructured":"Du, B., Huang, Y., Chen, J., and Huang, D. (2023, January 18\u201322). Adaptive Sparse Convolutional Networks with Global Context Enhancement for Faster Object Detection on Drone Images. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, Vancouver, BC, Canada.","DOI":"10.1109\/CVPR52729.2023.01291"},{"key":"ref_50","doi-asserted-by":"crossref","unstructured":"Duan, C., Wei, Z., Zhang, C., Qu, S., and Wang, H. (2021, January 11\u201317). Coarse-grained density map guided object detection in aerial images. Proceedings of the IEEE\/CVF International Conference on Computer Vision, Montreal, BC, Canada.","DOI":"10.1109\/ICCVW54120.2021.00313"},{"key":"ref_51","doi-asserted-by":"crossref","unstructured":"Liu, C., Yang, D., Tang, L., Zhou, X., and Deng, Y. (2023). A Lightweight Object Detector Based on Spatial-Coordinate Self-Attention for UAV Aerial Images. Remote Sens., 15.","DOI":"10.3390\/rs15010083"},{"key":"ref_52","unstructured":"Xu, S., Wang, X., Lv, W., Chang, Q., Cui, C., Deng, K., Wang, G., Dang, Q., Wei, S., and Du, Y. (2022). PP-YOLOE: An evolved version of YOLO. arXiv."},{"key":"ref_53","unstructured":"Ultralytics (2023, January 01). YOLOv8. Available online: https:\/\/github.com\/ultralytics\/ultralytics."},{"key":"ref_54","doi-asserted-by":"crossref","unstructured":"Selvaraju, R.R., Cogswell, M., Das, A., Vedantam, R., Parikh, D., and Batra, D. (2017, January 22\u201329). Grad-CAM: Visual Explanations from Deep Networks via Gradient-Based Localization. Proceedings of the 2017 IEEE International Conference on Computer Vision (ICCV), Venice, Italy.","DOI":"10.1109\/ICCV.2017.74"},{"key":"ref_55","doi-asserted-by":"crossref","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","article-title":"The pascal visual object classes (voc) challenge","volume":"88","author":"Everingham","year":"2010","journal-title":"Int. J. Comput. Vis."}],"container-title":["Remote Sensing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.mdpi.com\/2072-4292\/15\/14\/3468\/pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,10]],"date-time":"2025-10-10T20:09:30Z","timestamp":1760126970000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.mdpi.com\/2072-4292\/15\/14\/3468"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,7,9]]},"references-count":55,"journal-issue":{"issue":"14","published-online":{"date-parts":[[2023,7]]}},"alternative-id":["rs15143468"],"URL":"https:\/\/doi.org\/10.3390\/rs15143468","relation":{},"ISSN":["2072-4292"],"issn-type":[{"value":"2072-4292","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,7,9]]}}}