{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,7]],"date-time":"2026-02-07T10:25:11Z","timestamp":1770459911800,"version":"3.49.0"},"reference-count":53,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,12,7]],"date-time":"2025-12-07T00:00:00Z","timestamp":1765065600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,12,7]],"date-time":"2025-12-07T00:00:00Z","timestamp":1765065600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Sichuan Science and Technology Program","award":["2024NSFSC2050"],"award-info":[{"award-number":["2024NSFSC2050"]}]},{"name":"Sichuan Science and Technology Innovation Sowers Project Funding Program","award":["MZGC20240147"],"award-info":[{"award-number":["MZGC20240147"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["62441610"],"award-info":[{"award-number":["62441610"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Natural Science Starting Project of SWPU","award":["2022QHZ023"],"award-info":[{"award-number":["2022QHZ023"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Real-Time Image Proc"],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1007\/s11554-025-01816-6","type":"journal-article","created":{"date-parts":[[2025,12,7]],"date-time":"2025-12-07T15:38:17Z","timestamp":1765121897000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["PRepDETR: a real-time detection transformer with partial convolutions and efficient cross-scale feature fusion"],"prefix":"10.1007","volume":"23","author":[{"given":"Bin","family":"Xiao","sequence":"first","affiliation":[]},{"given":"Junchao","family":"Wen","sequence":"additional","affiliation":[]},{"given":"Xianjie","family":"He","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4222-9271","authenticated-orcid":false,"given":"Yanxue","family":"Wu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6547-6374","authenticated-orcid":false,"given":"Xingpeng","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Shengtong","family":"Hu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,12,7]]},"reference":[{"key":"1816_CR1","doi-asserted-by":"crossref","unstructured":"Dalal, N., Triggs, B.: Histograms of oriented gradients for human detection. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 886\u2013893 (2005)","DOI":"10.1109\/CVPR.2005.177"},{"issue":"9","key":"1816_CR2","doi-asserted-by":"publisher","first-page":"1627","DOI":"10.1109\/TPAMI.2009.167","volume":"32","author":"PF Felzenszwalb","year":"2009","unstructured":"Felzenszwalb, P.F., Girshick, R.B., McAllester, D., Ramanan, D.: Object detection with discriminatively trained part-based models. IEEE Trans. Pattern Anal. Mach. Intell. 32(9), 1627\u20131645 (2009)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1816_CR3","doi-asserted-by":"crossref","unstructured":"Wang, B., Ye, H., Zhang, X., He, D., Wang, X., Wang, Q., Zhao, C.: Object correlation matrix for two-stage object detection network. In: IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 9846\u20139850 (2024)","DOI":"10.1109\/ICASSP48485.2024.10448162"},{"issue":"6","key":"1816_CR4","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2016","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: towards real-time object detection with region proposal networks. IEEE Trans. Pattern Anal. Mach. Intell. 39(6), 1137\u20131149 (2016)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1816_CR5","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: unified, real-time object detection. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"1816_CR6","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Goyal, P., Girshick, R., He, K., Doll\u00e1r, P.: Focal loss for dense object detection. In: IEEE International Conference on Computer Vision, pp. 2980\u20132988 (2017)","DOI":"10.1109\/ICCV.2017.324"},{"key":"1816_CR7","doi-asserted-by":"crossref","unstructured":"Zeng, F., Dong, B., Zhang, Y., Wang, T., Zhang, X., Wei, Y.: Motr: End-to-end multiple-object tracking with transformer. In: European Conference on Computer Vision, pp. 659\u2013675 (2022)","DOI":"10.1007\/978-3-031-19812-0_38"},{"key":"1816_CR8","unstructured":"Bochkovskiy, A., Wang, C.-Y., Liao, H.-Y.M.: Yolov4: Optimal speed and accuracy of object detection. arXiv preprint arXiv:2004.10934 (2020)"},{"key":"1816_CR9","unstructured":"Jocher, G., Chaurasia, A., Stoken, A., Borovec, J., Kwon, Y., Michael, K., Fang, J., Wong, C., Yifu, Z., Montes, D., et al.: ultralytics\/yolov5: v6. 2-yolov5 classification models, apple m1, reproducibility, clearml and deci. ai integrations. Zenodo (2022)"},{"key":"1816_CR10","unstructured":"Li, C., Li, L., Jiang, H., Weng, K., Geng, Y., Li, L., Ke, Z., Li, Q., Cheng, M., Nie, W., et al.: Yolov6: A single-stage object detection framework for industrial applications. arXiv preprint arXiv:2209.02976 (2022)"},{"key":"1816_CR11","doi-asserted-by":"crossref","unstructured":"Wang, C.-Y., Bochkovskiy, A., Liao, H.-Y.M.: Yolov7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7464\u20137475 (2023)","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"1816_CR12","doi-asserted-by":"crossref","unstructured":"Sohan, M., Sai\u00a0Ram, T., Rami\u00a0Reddy, C.V.: A review on yolov8 and its advancements. In: International Conference on Data Intelligence and Cognitive Informatics, pp. 529\u2013545 (2024)","DOI":"10.1007\/978-981-99-7962-2_39"},{"issue":"2","key":"1816_CR13","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11554-025-01645-7","volume":"22","author":"P Ding","year":"2025","unstructured":"Ding, P., Li, T., Qian, H., Ma, L., Chen, Z.: A lightweight real-time object detection method for complex scenes based on yolov4. J. Real-Time Image Proc. 22(2), 1\u201313 (2025)","journal-title":"J. Real-Time Image Proc."},{"issue":"4","key":"1816_CR14","doi-asserted-by":"publisher","first-page":"138","DOI":"10.1007\/s11554-025-01716-9","volume":"22","author":"Y Zhang","year":"2025","unstructured":"Zhang, Y., Wu, C., Fan, Y.: Mlf-yolo: a novel multiscale feature fusion network for remote sensing small target detection. J. Real-Time Image Proc. 22(4), 138 (2025)","journal-title":"J. Real-Time Image Proc."},{"key":"1816_CR15","unstructured":"Khanam, R., Hussain, M.: Yolov11: An overview of the key architectural enhancements. arXiv preprint arXiv:2410.17725 (2024)"},{"key":"1816_CR16","unstructured":"Tian, Y., Ye, Q., Doermann, D.: Yolov12: attention-centric real-time object detectors. arXiv preprint arXiv:2502.12524 (2025)"},{"key":"1816_CR17","doi-asserted-by":"crossref","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers. In: European Conference on Computer Vision, pp. 213\u2013229 (2020)","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"1816_CR18","unstructured":"Zhang, H., Li, F., Liu, S., Zhang, L., Su, H., Zhu, J., Ni, L.M., Shum, H.-Y.: Dino: Detr with improved denoising anchor boxes for end-to-end object detection. In: International Conference on Learning Representations (2023)"},{"key":"1816_CR19","unstructured":"Zhu, X., Su, W., Lu, L., Li, B., Wang, X., Dai, J.: Deformable detr: Deformable transformers for end-to-end object detection. In: International Conference on Learning Representations (2021)"},{"key":"1816_CR20","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Lv, W., Xu, S., Wei, J., Wang, G., Dang, Q., Liu, Y., Chen, J.: Detrs beat yolos on real-time object detection. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16965\u201316974 (2024)","DOI":"10.1109\/CVPR52733.2024.01605"},{"key":"1816_CR21","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"1816_CR22","doi-asserted-by":"crossref","unstructured":"Rezatofighi, H., Tsoi, N., Gwak, J., Sadeghian, A., Reid, I., Savarese, S.: Generalized intersection over union: A metric and a loss for bounding box regression. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 658\u2013666 (2019)","DOI":"10.1109\/CVPR.2019.00075"},{"key":"1816_CR23","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham, M., Van Gool, L., Williams, C.K., Winn, J., Zisserman, A.: The pascal visual object classes (voc) challenge. Int. J. Comput. Vis. 88, 303\u2013338 (2010)","journal-title":"Int. J. Comput. Vis."},{"issue":"5","key":"1816_CR24","first-page":"2","volume":"8","author":"M Everingham","year":"2011","unstructured":"Everingham, M., Winn, J.: The pascal visual object classes challenge 2012 (voc2012) development kit. Pattern Anal. Stat. Model. Comput. Learn. Tech. Rep 8(5), 2\u20135 (2011)","journal-title":"Pattern Anal. Stat. Model. Comput. Learn. Tech. Rep"},{"key":"1816_CR25","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Maire, M., Belongie, S., Hays, J., Perona, P., Ramanan, D., Doll\u00e1r, P., Zitnick, C.L.: Microsoft coco: common objects in context. In: European Conference on Computer Vision, pp. 740\u2013755. Springer (2014)","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"1816_CR26","unstructured":"Arani, E., Gowda, S., Mukherjee, R., Magdy, O., Kathiresan, S., Zonooz, B.: A comprehensive study of real-time object detection networks across multiple domains: a survey. Trans. Mach. Learn. Res. 2022 (2022)"},{"key":"1816_CR27","doi-asserted-by":"crossref","unstructured":"Wang, C.-Y., Liao, H.-Y.M., Wu, Y.-H., Chen, P.-Y., Hsieh, J.-W., Yeh, I.-H.: Cspnet: a new backbone that can enhance learning capability of cnn. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, pp. 390\u2013391 (2020)","DOI":"10.1109\/CVPRW50498.2020.00203"},{"key":"1816_CR28","doi-asserted-by":"crossref","unstructured":"Liu, S., Qi, L., Qin, H., Shi, J., Jia, J.: Path aggregation network for instance segmentation. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 8759\u20138768 (2018)","DOI":"10.1109\/CVPR.2018.00913"},{"issue":"1","key":"1816_CR29","doi-asserted-by":"publisher","first-page":"23542","DOI":"10.1038\/s41598-024-75243-1","volume":"14","author":"L Xiao","year":"2024","unstructured":"Xiao, L., Li, W., Yao, S., Liu, H., Ren, D.: High-precision and lightweight small-target detection algorithm for low-cost edge intelligence. Sci. Rep. 14(1), 23542 (2024)","journal-title":"Sci. Rep."},{"key":"1816_CR30","doi-asserted-by":"crossref","unstructured":"Li, H., Xiao, L., Cao, L., Wu, D., Liu, Y., Li, Y., Zhang, Y., Bao, H.: Crossmodalnet: A dual-modal object detection network based on cross-modal fusion and channel interaction. Expert Syst. Appl. 129677 (2025)","DOI":"10.1016\/j.eswa.2025.129677"},{"issue":"5","key":"1816_CR31","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11554-025-01753-4","volume":"22","author":"L Xiao","year":"2025","unstructured":"Xiao, L., Li, W., Tang, R., Li, H., Wan, B., Ren, D.: Edet-yolo: an efficient small object detection algorithm for aerial images. J. Real-Time Image Proc. 22(5), 1\u201312 (2025)","journal-title":"J. Real-Time Image Proc."},{"key":"1816_CR32","doi-asserted-by":"crossref","unstructured":"Li, W., Xiao, L., Li, H., Yao, S., Wan, B., Ren, D.: Dacg-net: a dual-backbone and context-guided fusion network for aerial uav detection. IEEE Trans. Aerosp. Electron. Syst. (2025)","DOI":"10.1109\/TAES.2025.3601109"},{"key":"1816_CR33","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X., Unterthiner, T., Dehghani, M., Minderer, M., Heigold, G., Gelly, S., Uszkoreit, J., Houlsby, N.: An image is worth 16x16 words: transformers for image recognition at scale. In: International Conference on Learning Representations (2021)"},{"key":"1816_CR34","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2025.113539","volume":"318","author":"P Shi","year":"2025","unstructured":"Shi, P., Dong, X., Ge, R., Liu, Z., Yang, A.: Dp-m3d: Monocular 3d object detection algorithm with depth perception capability. Knowl.-Based Syst. 318, 113539 (2025)","journal-title":"Knowl.-Based Syst."},{"issue":"1","key":"1816_CR35","doi-asserted-by":"publisher","first-page":"1947","DOI":"10.1177\/03611981241258753","volume":"2679","author":"X Dong","year":"2025","unstructured":"Dong, X., Shi, P., Liang, T., Yang, A.: Ctaffnet: Cnn-transformer adaptive feature fusion object detection algorithm for complex traffic scenarios. Transp. Res. Rec. 2679(1), 1947\u20131965 (2025)","journal-title":"Transp. Res. Rec."},{"key":"1816_CR36","doi-asserted-by":"publisher","DOI":"10.1016\/j.displa.2024.102814","volume":"84","author":"X Dong","year":"2024","unstructured":"Dong, X., Shi, P., Qi, H., Yang, A., Liang, T.: Ts-bev: Bev object detection algorithm based on temporal-spatial feature fusion. Displays 84, 102814 (2024)","journal-title":"Displays"},{"key":"1816_CR37","unstructured":"Shufang, Y.: Rt-detr++ for uav object detection. arXiv preprint arXiv:2509.09157 (2025)"},{"key":"1816_CR38","doi-asserted-by":"crossref","unstructured":"Yang, Y., Dai, J., Wang, Y., Chen, Y.: Fm-rtdetr: small object detection algorithm based on enhanced feature fusion with mamba. IEEE Signal Process. Lett. (2025)","DOI":"10.1109\/LSP.2025.3553426"},{"key":"1816_CR39","doi-asserted-by":"publisher","DOI":"10.1016\/j.bspc.2024.107378","volume":"103","author":"C Zhou","year":"2025","unstructured":"Zhou, C., He, H., Zhou, H., Ge, F., Yu, P.: Msrt-detr: A novel rt-detr model with multi-scale feature sequence for cell detection. Biomed. Signal Process. Control 103, 107378 (2025)","journal-title":"Biomed. Signal Process. Control"},{"key":"1816_CR40","doi-asserted-by":"crossref","unstructured":"Yu, J., Jiang, Y., Wang, Z., Cao, Z., Huang, T.: Unitbox: an advanced object detection network. In: ACM International Conference on Multimedia, pp. 516\u2013520 (2016)","DOI":"10.1145\/2964284.2967274"},{"key":"1816_CR41","doi-asserted-by":"crossref","unstructured":"Zheng, Z., Wang, P., Liu, W., Li, J., Ye, R., Ren, D.: Distance-iou loss: Faster and better learning for bounding box regression. In: AAAI Conference on Artificial Intelligence, pp. 12993\u201313000 (2020)","DOI":"10.1609\/aaai.v34i07.6999"},{"key":"1816_CR42","doi-asserted-by":"publisher","first-page":"146","DOI":"10.1016\/j.neucom.2022.07.042","volume":"506","author":"Y-F Zhang","year":"2022","unstructured":"Zhang, Y.-F., Ren, W., Zhang, Z., Jia, Z., Wang, L., Tan, T.: Focal and efficient iou loss for accurate bounding box regression. Neurocomputing 506, 146\u2013157 (2022)","journal-title":"Neurocomputing"},{"key":"1816_CR43","unstructured":"Zeng, Y.: Hmpe: Heatmap embedding for efficient transformer-based small object detection. arXiv preprint arXiv:2504.13469 (2025)"},{"key":"1816_CR44","doi-asserted-by":"crossref","unstructured":"Nascimento, M.G.d., Fawcett, R., Prisacariu, V.A.: Dsconv: efficient convolution operator. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 5148\u20135157 (2019)","DOI":"10.1109\/ICCV.2019.00525"},{"key":"1816_CR45","doi-asserted-by":"crossref","unstructured":"Chen, J., Kao, S.-h., He, H., Zhuo, W., Wen, S., Lee, C.-H., Chan, S.-H.G.: Run, don\u2019t walk: chasing higher flops for faster neural networks. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12021\u201312031 (2023)","DOI":"10.1109\/CVPR52729.2023.01157"},{"key":"1816_CR46","doi-asserted-by":"crossref","unstructured":"Ghiasi, G., Lin, T.-Y., Le, Q.V.: Nas-fpn: learning scalable feature pyramid architecture for object detection. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7036\u20137045 (2019)","DOI":"10.1109\/CVPR.2019.00720"},{"key":"1816_CR47","unstructured":"Jiang, Y., Tan, Z., Wang, J., Sun, X., Lin, M., Li, H.: Giraffedet: a heavy-neck paradigm for object detection. In: International Conference on Learning Representations (2022)"},{"key":"1816_CR48","unstructured":"Xu, X., Jiang, Y., Chen, W., Huang, Y., Zhang, Y., Sun, X.: Damo-yolo: a report on real-time object detection design. arXiv preprint arXiv:2211.15444 (2022)"},{"key":"1816_CR49","doi-asserted-by":"crossref","unstructured":"Ding, X., Zhang, X., Ma, N., Han, J., Ding, G., Sun, J.: Repvgg: making vgg-style convnets great again. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13733\u201313742 (2021)","DOI":"10.1109\/CVPR46437.2021.01352"},{"key":"1816_CR50","unstructured":"Zhang, H., Zhang, S.: Focaler-iou: More focused intersection over union loss. arXiv preprint arXiv:2401.10525 (2024)"},{"key":"1816_CR51","doi-asserted-by":"crossref","unstructured":"Yang, J., Liu, S., Wu, J., Su, X., Hai, N., Huang, X.: Pinwheel-shaped convolution and scale-based dynamic loss for infrared small target detection. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 39, pp. 9202\u20139210 (2025)","DOI":"10.1609\/aaai.v39i9.32996"},{"key":"1816_CR52","unstructured":"Tan, M., Le, Q.: Efficientnetv2: smaller models and faster training. In: International Conference on Machine Learning, pp. 10096\u201310106. PMLR (2021)."},{"key":"1816_CR53","doi-asserted-by":"crossref","unstructured":"Sandler, M., Howard, A., Zhu, M., Zhmoginov, A., Chen, L.-C.: Mobilenetv2: inverted residuals and linear bottlenecks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4510\u20134520 (2018)","DOI":"10.1109\/CVPR.2018.00474"}],"container-title":["Journal of Real-Time Image Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-025-01816-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11554-025-01816-6","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-025-01816-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,6]],"date-time":"2026-02-06T16:52:00Z","timestamp":1770396720000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11554-025-01816-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,7]]},"references-count":53,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,2]]}},"alternative-id":["1816"],"URL":"https:\/\/doi.org\/10.1007\/s11554-025-01816-6","relation":{},"ISSN":["1861-8200","1861-8219"],"issn-type":[{"value":"1861-8200","type":"print"},{"value":"1861-8219","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12,7]]},"assertion":[{"value":"30 August 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 November 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 December 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"21"}}