{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,18]],"date-time":"2026-03-18T17:42:22Z","timestamp":1773855742279,"version":"3.50.1"},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,11,15]],"date-time":"2024-11-15T00:00:00Z","timestamp":1731628800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2024,11,15]],"date-time":"2024-11-15T00:00:00Z","timestamp":1731628800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100001809","name":"the National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["61971078"],"award-info":[{"award-number":["61971078"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Chongqing University of Technology Graduate Education Quality Development Action Plan Funding Results","award":["KJZD-M202301901"],"award-info":[{"award-number":["KJZD-M202301901"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Complex Intell. Syst."],"published-print":{"date-parts":[[2025,1]]},"DOI":"10.1007\/s40747-024-01652-4","type":"journal-article","created":{"date-parts":[[2024,11,15]],"date-time":"2024-11-15T04:11:37Z","timestamp":1731643897000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":17,"title":["ATBHC-YOLO: aggregate transformer and bidirectional hybrid convolution for small object detection"],"prefix":"10.1007","volume":"11","author":[{"given":"Dandan","family":"Liao","sequence":"first","affiliation":[]},{"given":"Jianxun","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Ye","family":"Tao","sequence":"additional","affiliation":[]},{"given":"Xie","family":"Jin","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,15]]},"reference":[{"key":"1652_CR1","doi-asserted-by":"crossref","unstructured":"Lin T-Y et al (2017) Feature pyramid networks for object detection. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp\u00a02117\u20132125","DOI":"10.1109\/CVPR.2017.106"},{"key":"1652_CR2","doi-asserted-by":"publisher","first-page":"114602","DOI":"10.1016\/j.eswa.2021.114602","volume":"172","author":"Y Liu","year":"2021","unstructured":"Liu Y et al (2021) A survey and performance evaluation of deep learning methods for small object detection. Expert Syst Appl 172:114602","journal-title":"Expert Syst Appl"},{"key":"1652_CR3","doi-asserted-by":"publisher","first-page":"104197","DOI":"10.1016\/j.imavis.2021.104197","volume":"111","author":"G Liu","year":"2021","unstructured":"Liu G, Han J, Rong W (2021) Feedback-driven loss function for small object detection. Image Vis Comput 111:104197","journal-title":"Image Vis Comput"},{"key":"1652_CR4","doi-asserted-by":"crossref","unstructured":"Liu S et al (2018) Path aggregation network for instance segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 8759\u20138768","DOI":"10.1109\/CVPR.2018.00913"},{"key":"1652_CR5","doi-asserted-by":"crossref","unstructured":"Zhu X et al (2021) TPH-YOLOv5: improved YOLOv5 based on transformer prediction head for object detection on drone-captured scenarios. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 2778\u20132788","DOI":"10.1109\/ICCVW54120.2021.00312"},{"key":"1652_CR6","doi-asserted-by":"crossref","unstructured":"Lee Y et al (2022) Mpvit: multi-path vision transformer for dense prediction. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp\u00a07287\u20137296","DOI":"10.1109\/CVPR52688.2022.00714"},{"issue":"11","key":"1652_CR7","doi-asserted-by":"publisher","first-page":"7380","DOI":"10.1109\/TPAMI.2021.3119563","volume":"44","author":"P Zhu","year":"2021","unstructured":"Zhu P et al (2021) Detection and tracking meet drones challenge. IEEE Trans Pattern Anal Mach Intell 44(11):7380\u20137399","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1652_CR8","doi-asserted-by":"crossref","unstructured":"Touvron H et al (2021) Training data-efficient image transformers & distillation through attention. In: International conference on machine learning. PMLR, pp 10347\u201310357","DOI":"10.1109\/ICCV48922.2021.00010"},{"key":"1652_CR9","doi-asserted-by":"crossref","unstructured":"Yang C, Huang Z, Wang N (2022) QueryDet: cascaded sparse query for accelerating high-resolution small object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp\u00a013668\u201313677","DOI":"10.1109\/CVPR52688.2022.01330"},{"key":"1652_CR10","doi-asserted-by":"crossref","unstructured":"Xia B et al (2022) Efficient non-local contrastive attention for image super-resolution. In: Proceedings of the AAAI conference on artificial intelligence, vol 36, no 3, pp\u00a02759\u20132767","DOI":"10.1609\/aaai.v36i3.20179"},{"key":"1652_CR11","doi-asserted-by":"crossref","unstructured":"Akyon FC, Altinuc SO, Temizel A (2022) Slicing aided hyper inference and fine-tuning for small object detection. In: 2022 IEEE International Conference on Image Processing (ICIP). IEEE, pp\u00a0966\u2013970","DOI":"10.1109\/ICIP46576.2022.9897990"},{"key":"1652_CR12","doi-asserted-by":"publisher","first-page":"1968","DOI":"10.1109\/TMM.2021.3074273","volume":"24","author":"C Deng","year":"2022","unstructured":"Deng C et al (2022) Extended feature pyramid network for small object detection. IEEE Trans Multimed 24:1968\u20131979","journal-title":"IEEE Trans Multimed"},{"key":"1652_CR13","unstructured":"Gevorgyan Z (2022) SIoU loss: more powerful learning for bounding box regression. arXiv preprint arXiv:2205.12740"},{"key":"1652_CR14","first-page":"1","volume":"61","author":"J Zhang","year":"2023","unstructured":"Zhang J et al (2023) SuperYOLO: super resolution assisted object detection in multimodal remote sensing imagery. IEEE Trans Geosci Remote Sens 61:1\u201315","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"1652_CR15","doi-asserted-by":"publisher","first-page":"103752","DOI":"10.1016\/j.jvcir.2023.103752","volume":"90","author":"M Wang","year":"2023","unstructured":"Wang M et al (2023) FE-YOLOv5: feature enhancement network based on YOLOv5 for small object detection. J Visual Commun Image Represent 90:103752","journal-title":"J Visual Commun Image Represent"},{"issue":"13","key":"1652_CR16","doi-asserted-by":"publisher","first-page":"10719","DOI":"10.1007\/s00521-022-07007-9","volume":"34","author":"Z-D Zhang","year":"2022","unstructured":"Zhang Z-D et al (2022) CDNet: a real-time and robust crosswalk detection network on Jetson nano based on YOLOv5. Neural Comput Appl 34(13):10719\u201310730","journal-title":"Neural Comput Appl"},{"key":"1652_CR17","doi-asserted-by":"publisher","first-page":"104697","DOI":"10.1016\/j.imavis.2023.104697","volume":"135","author":"X Wang","year":"2023","unstructured":"Wang X et al (2023) Improved YOLOX-X based UAV aerial photography object detection algorithm. Image Vis Comput 135:104697","journal-title":"Image Vis Comput"},{"key":"1652_CR18","unstructured":"Wang J et al (2021) A normalized Gaussian Wasserstein distance for tiny object detection. arXiv preprint arXiv:2110.13389"},{"key":"1652_CR19","doi-asserted-by":"publisher","first-page":"296","DOI":"10.1016\/j.isprsjprs.2019.11.023","volume":"159","author":"K Li","year":"2020","unstructured":"Li K et al (2020) Object detection in optical remote sensing images: a survey and a new benchmark. ISPRS J Photogramm Remote Sens 159:296\u2013307","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"1652_CR20","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1016\/j.jvcir.2015.11.002","volume":"34","author":"S Razakarivony","year":"2016","unstructured":"Razakarivony S, Jurie F (2016) Vehicle detection in aerial imagery: a small target detection benchmark. J Vis Commun Image Represent 34:187\u2013203","journal-title":"J Vis Commun Image Represent"},{"key":"1652_CR21","doi-asserted-by":"crossref","unstructured":"Wang C-Y, Bochkovskiy A, Liao H-YM (2023) YOLOv7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp\u00a07464\u20137475","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"1652_CR22","doi-asserted-by":"publisher","first-page":"116919","DOI":"10.1016\/j.image.2023.116919","volume":"113","author":"Y Chen","year":"2023","unstructured":"Chen Y et al (2023) Enhanced semantic feature pyramid network for small object detection. Signal Process Image Commun 113:116919","journal-title":"Signal Process Image Commun"},{"key":"1652_CR23","doi-asserted-by":"crossref","unstructured":"Zhang J et al (2023) ETAM: ensemble transformer with attention modules for detection of small objects. Expert Syst Appl 224:119997","DOI":"10.1016\/j.eswa.2023.119997"},{"key":"1652_CR24","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109801","volume":"143","author":"H Zhang","year":"2023","unstructured":"Zhang H et al (2023) Construction of a feature enhancement network for small object detection. Pattern Recognit 143:109801","journal-title":"Pattern Recognit"},{"key":"1652_CR25","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1016\/j.isprsjprs.2022.06.002","volume":"190","author":"X Chang","year":"2022","unstructured":"Chang X et al (2022) Detecting tiny objects in aerial images: a normalized Wasserstein distance and a new benchmark. ISPRS J Photogramm Remote Sens 190:79\u201393","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"1652_CR26","doi-asserted-by":"publisher","first-page":"126285","DOI":"10.1016\/j.neucom.2023.126285","volume":"543","author":"R Fu","year":"2023","unstructured":"Fu R et al (2023) Gaussian similarity-based adaptive dynamic label assignment for tiny object detection. Neurocomputing 543:126285","journal-title":"Neurocomputing"},{"key":"1652_CR27","doi-asserted-by":"crossref","unstructured":"Du Y et al (2021) Giaotracker: a comprehensive framework for mcmot with global information and optimizing strategies in visdrone 2021. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp\u00a02809\u20132819","DOI":"10.1109\/ICCVW54120.2021.00315"},{"issue":"22","key":"1652_CR28","doi-asserted-by":"publisher","first-page":"34679","DOI":"10.1007\/s11042-023-14800-8","volume":"82","author":"K Li","year":"2023","unstructured":"Li K, Liu ZD (2023) MCANet: multi-scale contextual feature fusion network based on Atrous convolution. Multimed Tools Appl 82(22):34679\u201334702","journal-title":"Multimed Tools Appl"},{"key":"1652_CR29","unstructured":"Ren S et al (2015) Faster r-cnn: towards real-time object detection with region proposal networks. In: Advances in neural information processing systems, vol 28"},{"key":"1652_CR30","doi-asserted-by":"crossref","unstructured":"Albaba BM, Ozer S (2021) SyNet: an ensemble network for object detection in UAV images. In: 2020 25th International Conference on Pattern Recognition (ICPR). IEEE, pp\u00a010227\u201310234","DOI":"10.1109\/ICPR48806.2021.9412847"},{"key":"1652_CR31","doi-asserted-by":"crossref","unstructured":"Huang Y, Chen J, Huang D (2022) UFPMP-Det: toward accurate and efficient object detection on drone imagery. In: Proceedings of the AAAI conference on artificial intelligence, vol 36, no 1, pp 1026\u20131033","DOI":"10.1609\/aaai.v36i1.19986"},{"key":"1652_CR32","doi-asserted-by":"publisher","first-page":"117106","DOI":"10.1016\/j.eswa.2022.117106","volume":"199","author":"P Mittal","year":"2022","unstructured":"Mittal P et al (2022) Dilated convolution based RCNN using feature fusion for low-altitude aerial objects. Expert Syst Appl 199:117106","journal-title":"Expert Syst Appl"},{"key":"1652_CR33","doi-asserted-by":"crossref","unstructured":"Lin T-Y et al (2017) Focal loss for dense object detection. In: Proceedings of the IEEE international conference on computer vision, pp\u00a02980\u20132988","DOI":"10.1109\/ICCV.2017.324"},{"key":"1652_CR34","doi-asserted-by":"crossref","unstructured":"Pang J et al (2019) Libra r-cnn: towards balanced learning for object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp\u00a0821\u2013830","DOI":"10.1109\/CVPR.2019.00091"},{"key":"1652_CR35","doi-asserted-by":"crossref","unstructured":"Liu W et al (2016) Ssd: single shot multibox detector. In: Computer Vision\u2014ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14. Springer, pp\u00a021\u201337","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"1652_CR36","unstructured":"Redmon J, Farhadi A (2018) Yolov3: an incremental improvement. arXiv preprint arXiv:1804.02767"},{"key":"1652_CR37","doi-asserted-by":"publisher","first-page":"296","DOI":"10.1016\/j.isprsjprs.2019.11.023","volume":"159","author":"K Li","year":"2020","unstructured":"Li K et al (2020) Object detection in optical remote sensing images: a survey and a new benchmark. ISPRS J Photogramm Remote Sens 159:296\u2013307","journal-title":"ISPRS J Photogramm Remote Sens"},{"key":"1652_CR38","doi-asserted-by":"crossref","unstructured":"Liu Y et al (2021) Catnet: context aggregation network for instance segmentation in remote sensing images","DOI":"10.1109\/LGRS.2020.3023124"}],"container-title":["Complex &amp; Intelligent Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s40747-024-01652-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s40747-024-01652-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s40747-024-01652-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,30]],"date-time":"2025-01-30T20:16:42Z","timestamp":1738268202000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s40747-024-01652-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,15]]},"references-count":38,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2025,1]]}},"alternative-id":["1652"],"URL":"https:\/\/doi.org\/10.1007\/s40747-024-01652-4","relation":{},"ISSN":["2199-4536","2198-6053"],"issn-type":[{"value":"2199-4536","type":"print"},{"value":"2198-6053","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,15]]},"assertion":[{"value":"18 March 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 October 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 November 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could be perceived to have influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"38"}}