{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,25]],"date-time":"2025-10-25T21:26:01Z","timestamp":1761427561777,"version":"3.41.0"},"reference-count":39,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T00:00:00Z","timestamp":1747008000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T00:00:00Z","timestamp":1747008000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["No. 2020YFC1523301"],"award-info":[{"award-number":["No. 2020YFC1523301"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SIViP"],"published-print":{"date-parts":[[2025,7]]},"DOI":"10.1007\/s11760-025-04013-x","type":"journal-article","created":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T06:08:45Z","timestamp":1747030125000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Rethinking the structural similarity in small object detection"],"prefix":"10.1007","volume":"19","author":[{"given":"Enhui","family":"Chai","sequence":"first","affiliation":[]},{"given":"Li","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Umara","family":"Khalid","sequence":"additional","affiliation":[]},{"given":"Bowei","family":"Chen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,5,12]]},"reference":[{"key":"4013_CR1","doi-asserted-by":"publisher","DOI":"10.1016\/j.comcom.2024.107986","volume":"229","author":"N Dong","year":"2024","unstructured":"Dong, N., Liu, S., Mai, X.: Communication-efficient heterogeneous multi-uav task allocation based on clustering. Comput. Commun. 229, 107986 (2024)","journal-title":"Comput. Commun."},{"issue":"3","key":"4013_CR2","doi-asserted-by":"publisher","first-page":"4039","DOI":"10.1109\/TII.2023.3313635","volume":"20","author":"J Ma","year":"2024","unstructured":"Ma, J., Xiong, G., Xu, J., Chen, X.: Cvtnet: A cross-view transformer network for lidar-based place recognition in autonomous driving environments. IEEE Trans. Ind. Inf. 20(3), 4039\u20134048 (2024)","journal-title":"IEEE Trans. Ind. Inf."},{"issue":"6","key":"4013_CR3","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2016","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: Towards real-time object detection with region proposal networks. IEEE Trans. pattern Anal. Mach. Intell. 39(6), 1137\u20131149 (2016)","journal-title":"IEEE Trans. pattern Anal. Mach. Intell."},{"key":"4013_CR4","unstructured":"Ross, T.-Y., Doll\u00e1r, G.: Focal loss for dense object detection, in proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2980\u20132988, (2017)"},{"issue":"4","key":"4013_CR5","first-page":"1922","volume":"44","author":"Z Tian","year":"2020","unstructured":"Tian, Z., Shen, C., Chen, H., He, T.: Fcos: a simple and strong anchor-free object detector. IEEE Trans. Pattern Anal. Mach. Intell. 44(4), 1922\u20131933 (2020)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"4013_CR6","doi-asserted-by":"crossref","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers, in European conference on computer vision, pp. 213\u2013229, Springer, (2020)","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"4013_CR7","doi-asserted-by":"crossref","unstructured":"Dai, X., Chen, Y., Xiao, B., Chen, D., Liu, M., Yuan, L., Zhang, L.: Dynamic head: Unifying object detection heads with attentions, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 7373\u20137382, (2021)","DOI":"10.1109\/CVPR46437.2021.00729"},{"key":"4013_CR8","unstructured":"Wang, A., Chen, H., Liu, L., Chen, K., Lin, Z., Han, J., Ding, G.: Yolov10: Real-time end-to-end object detection, arXiv preprint arXiv:2405.14458, (2024)"},{"key":"4013_CR9","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Maire, M., Belongie, S., Hays, J., Perona, P., Ramanan, D., Doll\u00e1r, P., Zitnick, C.L.: Microsoft coco: Common objects in context, in Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part V 13, pp. 740\u2013755, Springer, (2014)","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"4013_CR10","doi-asserted-by":"crossref","unstructured":"Yang, C., Huang, Z., Wang, N.: Querydet: Cascaded sparse query for accelerating high-resolution small object detection, in Proceedings of the IEEE\/CVF Conference on computer vision and pattern recognition, pp. 13668\u201313677, 2022","DOI":"10.1109\/CVPR52688.2022.01330"},{"key":"4013_CR11","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.-Y., Kweon, I.S.: Cbam: Convolutional block attention module, in Proceedings of the European conference on computer vision (ECCV), pp. 3\u201319, (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"4013_CR12","doi-asserted-by":"publisher","first-page":"2148","DOI":"10.1109\/JSTARS.2020.3046482","volume":"14","author":"Y Li","year":"2021","unstructured":"Li, Y., Huang, Q., Pei, X., Chen, Y., Jiao, L., Shang, R.: Cross-layer attention network for small object detection in remote sensing imagery. IEEE J Sel. Top. Appl. Earth Obs. Remote Sens. 14, 2148\u20132161 (2021)","journal-title":"IEEE J Sel. Top. Appl. Earth Obs. Remote Sens."},{"issue":"2","key":"4013_CR13","doi-asserted-by":"publisher","first-page":"936","DOI":"10.1109\/TSMC.2020.3005231","volume":"52","author":"G Chen","year":"2020","unstructured":"Chen, G., Wang, H., Chen, K., Li, Z., Song, Z., Liu, Y., Chen, W., Knoll, A.: A survey of the four pillars for small object detection: Multiscale representation, contextual information, super-resolution, and region proposal. IEEE Trans. Syst. Man Cybern.: Syst. 52(2), 936\u2013953 (2020)","journal-title":"IEEE Trans. Syst. Man Cybern.: Syst."},{"key":"4013_CR14","unstructured":"Du, D., Zhu, P., Wen, L., Bian, X., Liu, Z.M.: Visdrone-det2019: The vision meets drone object detection in image challenge results, in ICCV visdrone workshop, (2019)"},{"key":"4013_CR15","doi-asserted-by":"crossref","unstructured":"Law, H., Deng, J.: Cornernet: Detecting objects as paired keypoints, in Proceedings of the European conference on computer vision (ECCV), pp. 734\u2013750, (2018)","DOI":"10.1007\/978-3-030-01264-9_45"},{"key":"4013_CR16","doi-asserted-by":"crossref","unstructured":"Zand, M., Etemad, A., Greenspan, M.: Objectbox: From centers to boxes for anchor-free object detection, in European Conference on Computer Vision, pp. 390\u2013406, Springer, (2022)","DOI":"10.1007\/978-3-031-20080-9_23"},{"key":"4013_CR17","doi-asserted-by":"crossref","unstructured":"Shen, L., Dong, Y., Pei, Y., Yang, H., Zheng, L., Ma, J.: One-dimensional feature supervision network for object detection, in International Conference on Intelligent Computing, pp. 147\u2013156, Springer, (2023)","DOI":"10.1007\/978-981-99-4761-4_13"},{"key":"4013_CR18","doi-asserted-by":"publisher","first-page":"1066","DOI":"10.1016\/j.procs.2022.01.135","volume":"199","author":"P Jiang","year":"2022","unstructured":"Jiang, P., Ergu, D., Liu, F., Cai, Y., Ma, B.: A review of yolo algorithm developments. Procedia Comput. Sci. 199, 1066\u20131073 (2022)","journal-title":"Procedia Comput. Sci."},{"key":"4013_CR19","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation, in Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3431\u20133440, (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"4013_CR20","unstructured":"Jocher, G., Chaurasia, A., Stoken, A., Borovec, J., Kwon, Y., Fang, J. Michael, K., Montes, D., Nadar, J., Skalski, P., et\u00a0al.: ultralytics\/yolov5: v6. 1-tensorrt, tensorflow edge tpu and openvino export and inference, Zenodo, (2022)"},{"issue":"16","key":"4013_CR21","doi-asserted-by":"publisher","first-page":"7190","DOI":"10.3390\/s23167190","volume":"23","author":"G Wang","year":"2023","unstructured":"Wang, G., Chen, Y., An, P., Hong, H., Hu, J., Huang, T.: Uav-yolov8: A small-object-detection model based on improved yolov8 for uav aerial photography scenarios. Sensors 23(16), 7190 (2023)","journal-title":"Sensors"},{"issue":"4","key":"4013_CR22","doi-asserted-by":"publisher","first-page":"2239","DOI":"10.1109\/TPAMI.2023.3335410","volume":"46","author":"F Li","year":"2024","unstructured":"Li, F., Zhang, H., Zhang, N.L.: Dn-detr: Accelerate detr training by introducing query denoising. IEEE Trans. Pattern Anal. Mach. Intell. 46(4), 2239\u20132251 (2024)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"4013_CR23","doi-asserted-by":"crossref","unstructured":"Chen, Q., Chen, X., Wang, J., Zhang, S., Yao, K., Feng, H., Han, J., Ding, E., Zeng, G., Wang, J.: Group detr: Fast detr training with group-wise one-to-many assignment, in Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6633\u20136642, (2023)","DOI":"10.1109\/ICCV51070.2023.00610"},{"key":"4013_CR24","doi-asserted-by":"crossref","unstructured":"Rezatofighi, H., Tsoi, N., Gwak, J., Sadeghian, A., Reid, I., Savarese, S.: Generalized intersection over union: A metric and a loss for bounding box regression, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 658\u2013666, (2019)","DOI":"10.1109\/CVPR.2019.00075"},{"key":"4013_CR25","first-page":"12993","volume":"34","author":"Z Zheng","year":"2020","unstructured":"Zheng, Z., Wang, P., Liu, W., Li, J., Ye, R., Ren, D.: Distance-iou loss: Faster and better learning for bounding box regression. Proc. AAAI Conf. Artif. Intell. 34, 12993\u201313000 (2020)","journal-title":"Proc. AAAI Conf. Artif. Intell."},{"key":"4013_CR26","doi-asserted-by":"crossref","unstructured":"Zhang, Y.-F., Ren, W., Zhang, Z., Jia, Z., Wang, L., Tan, T.: Focal and efficient iou loss for accurate bounding box regression. Neurocomputing 506, 146\u2013157 (2022)","DOI":"10.1016\/j.neucom.2022.07.042"},{"key":"4013_CR27","unstructured":"Gevorgyan, Z.: Siou loss: More powerful learning for bounding box regression, arXiv preprint arXiv:2205.12740, (2022)"},{"key":"4013_CR28","doi-asserted-by":"publisher","first-page":"276","DOI":"10.1016\/j.neunet.2023.11.041","volume":"170","author":"C Liu","year":"2024","unstructured":"Liu, C., Wang, K., Li, Q., Zhao, F., Zhao, K., Ma, H.: Powerful-iou: More straightforward and faster bounding box regression loss with a nonmonotonic focusing mechanism. Neural Netw. 170, 276\u2013284 (2024)","journal-title":"Neural Netw."},{"key":"4013_CR29","unstructured":"Tong, Z., Chen, Y., Xu, Z., Yu, R.: Wise-iou: bounding box regression loss with dynamic focusing mechanism, arXiv preprint arXiv:2301.10051, (2023)"},{"key":"4013_CR30","doi-asserted-by":"crossref","unstructured":"Xu, C., Wang, J., Yang, W., Yu, L.: Dot distance for tiny object detection in aerial images, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 1192\u20131201, (2021)","DOI":"10.1109\/CVPRW53098.2021.00130"},{"key":"4013_CR31","doi-asserted-by":"crossref","unstructured":"Xu, C., Wang, J., Yang, W., Yu, H., Yu, L., Xia, G.-S.: Rfla: Gaussian receptive field based label assignment for tiny object detection, in European conference on computer vision, pp. 526\u2013543, Springer, (2022)","DOI":"10.1007\/978-3-031-20077-9_31"},{"key":"4013_CR32","doi-asserted-by":"crossref","unstructured":"Wu, Y., He, K.: Group normalization, in Proceedings of the European conference on computer vision (ECCV), pp. 3\u201319, (2018)","DOI":"10.1007\/978-3-030-01261-8_1"},{"key":"4013_CR33","doi-asserted-by":"crossref","unstructured":"Li, X., Wang, W., Hu, X., Yang, J.: Selective kernel networks, in Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 510\u2013519, (2019)","DOI":"10.1109\/CVPR.2019.00060"},{"key":"4013_CR34","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.-Y., Berg, A. C.: Ssd: Single shot multibox detector, in Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14, pp. 21\u201337, Springer, (2016)","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"4013_CR35","first-page":"1","volume":"61","author":"Y Zhang","year":"2023","unstructured":"Zhang, Y., Wu, C., Guo, W., Zhang, T., Li, W.: Cfanet: Efficient detection of uav image based on cross-layer feature aggregation. IEEE Trans. Geosci. Remote Sens. 61, 1\u201311 (2023)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"4013_CR36","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2024.3392794","author":"Y Zhang","year":"2024","unstructured":"Zhang, Y., Wu, C., Zhang, T., Zheng, Y.: Full-scale feature aggregation and grouping feature reconstruction based uav image target detection. IEEE Trans. Geosci. Remote Sens. (2024). https:\/\/doi.org\/10.1109\/TGRS.2024.3392794","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"4013_CR37","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TGRS.2024.3510781","volume":"62","author":"Y Zhang","year":"2024","unstructured":"Zhang, Y., Ye, M., Zhu, G., Liu, Y., Guo, P., Yan, J.: Ffca-yolo for small object detection in remote sensing images. IEEE Trans. Geosci. Remote Sens. 62, 1\u201315 (2024)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"4013_CR38","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Lv, W., Xu, S., Wei, J., Wang, G., Dang, Q., Liu, Y., Chen, J.: Detrs beat yolos on real-time object detection, in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16965\u201316974, (2024)","DOI":"10.1109\/CVPR52733.2024.01605"},{"key":"4013_CR39","doi-asserted-by":"publisher","first-page":"12994","DOI":"10.1109\/TII.2024.3431044","volume":"20","author":"S Cheng","year":"2024","unstructured":"Cheng, S., Song, J., Zhou, M., Wei, X., Pu, H., Luo, J., Jia, W.: Ef-detr: A lightweight transformer-based object detector with an encoder-free neck. IEEE Trans. Indus. Inf. 20, 12994\u201313002 (2024)","journal-title":"IEEE Trans. Indus. Inf."}],"container-title":["Signal, Image and Video Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-025-04013-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11760-025-04013-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11760-025-04013-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,30]],"date-time":"2025-05-30T06:39:41Z","timestamp":1748587181000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11760-025-04013-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,12]]},"references-count":39,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2025,7]]}},"alternative-id":["4013"],"URL":"https:\/\/doi.org\/10.1007\/s11760-025-04013-x","relation":{},"ISSN":["1863-1703","1863-1711"],"issn-type":[{"type":"print","value":"1863-1703"},{"type":"electronic","value":"1863-1711"}],"subject":[],"published":{"date-parts":[[2025,5,12]]},"assertion":[{"value":"12 December 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 February 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 March 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 May 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"554"}}