{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T21:54:12Z","timestamp":1768946052029,"version":"3.49.0"},"reference-count":55,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T00:00:00Z","timestamp":1768867200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T00:00:00Z","timestamp":1768867200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"the National Key Research and Development Program of China","award":["2100041"],"award-info":[{"award-number":["2100041"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Supercomput"],"DOI":"10.1007\/s11227-026-08235-9","type":"journal-article","created":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T09:10:06Z","timestamp":1768900206000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["MD-YOLO: research on the innovation and performance optimization of vehicle detection technology"],"prefix":"10.1007","volume":"82","author":[{"given":"Keyou","family":"Guo","sequence":"first","affiliation":[]},{"given":"Jiangnan","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Haibing","family":"Jiang","sequence":"additional","affiliation":[]},{"given":"Pei","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Huangcheng","family":"Qin","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,1,20]]},"reference":[{"key":"8235_CR1","doi-asserted-by":"publisher","DOI":"10.1016\/j.treng.2024.100252","volume":"16","author":"M Elassy","year":"2024","unstructured":"Elassy M, Al-Hattab M, Takruri M, Badawi S (2024) Intelligent transportation systems for sustainable smart cities. Transp Eng 16:100252. https:\/\/doi.org\/10.1016\/j.treng.2024.100252","journal-title":"Transp Eng"},{"key":"8235_CR2","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2408.09332","author":"C-Y Wang","year":"2024","unstructured":"Wang C-Y, Liao H-YM (2024) YOLOv1 to YOLOv10: the fastest and most accurate real-time object detection systems. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2408.09332","journal-title":"arXiv"},{"key":"8235_CR3","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1804.02767","author":"J Redmon","year":"2018","unstructured":"Redmon J, Farhadi A (2018) YOLOv3: an incremental improvement. arXiv. https:\/\/doi.org\/10.48550\/arXiv.1804.02767","journal-title":"arXiv"},{"key":"8235_CR4","doi-asserted-by":"publisher","unstructured":"Jocher G, et al (2020) Ultralytics\/yolov5: v3.0. Zenodo. https:\/\/doi.org\/10.5281\/zenodo.3983579","DOI":"10.5281\/zenodo.3983579"},{"key":"8235_CR5","doi-asserted-by":"publisher","DOI":"10.14569\/IJACSA.2025.01601113","author":"NS Albalawi","year":"2025","unstructured":"Albalawi NS (2025) High-precision multi-class object detection using fine-tuned YOLOv11 architecture: a case study on airborne vehicles. Int J Adv Comput Sci Appl. https:\/\/doi.org\/10.14569\/IJACSA.2025.01601113","journal-title":"Int J Adv Comput Sci Appl"},{"key":"8235_CR6","doi-asserted-by":"publisher","first-page":"740","DOI":"10.1007\/978-3-319-10602-1_48","volume":"8693","author":"T-Y Lin","year":"2014","unstructured":"Lin T-Y, Maire M, Belongie S, Hays J, Perona P, Ramanan D, Doll\u00e1r P, Zitnick CL (2014) Microsoft COCO: common objects in context. Lect Notes Comput Sci 8693:740\u2013755. https:\/\/doi.org\/10.1007\/978-3-319-10602-1_48","journal-title":"Lect Notes Comput Sci"},{"key":"8235_CR7","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2501.18835","author":"S Vidhanaarachchi","year":"2025","unstructured":"Vidhanaarachchi S, Wijekoon JL, Abeysiriwardhana WAPS (2025) Early diagnosis and severity assessment of Weligama coconut leaf wilt disease and coconut caterpillar infestation using deep learning-based image processing techniques. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2501.18835","journal-title":"arXiv"},{"issue":"11","key":"8235_CR8","doi-asserted-by":"publisher","DOI":"10.1061\/JCEMD4.COENG-13686","volume":"149","author":"S Wang","year":"2023","unstructured":"Wang S, Kim M, Hae H, Cao M, Kim J (2023) The development of a rebar-counting model for reinforced concrete columns: using an unmanned aerial vehicle and deep-learning approach. J Constr Eng Manag 149(11):04023122. https:\/\/doi.org\/10.1061\/JCEMD4.COENG-13686","journal-title":"J Constr Eng Manag"},{"key":"8235_CR9","unstructured":"Jocher G, Chaurasia A, Qiu J (2023) Ultralytics YOLO (Version 8.0.0) [Computer software]. https:\/\/github.com\/ultralytics\/ultralytics"},{"issue":"5","key":"8235_CR10","doi-asserted-by":"publisher","DOI":"10.3390\/app15052631","volume":"15","author":"S Park","year":"2025","unstructured":"Park S, Kim J, Wang S, Kim J (2025) Effectiveness of image augmentation techniques on non-protective personal equipment detection using yolov8. Appl Sci 15(5):2631. https:\/\/doi.org\/10.3390\/app15052631","journal-title":"Appl Sci"},{"key":"8235_CR11","doi-asserted-by":"crossref","unstructured":"Wang A, Chen H, Liu LH, Chen K, Lin ZJ, Han JG, Ding GG (2024, October 30) YOLOv10: real-time end-to-end object detection. arXiv. https:\/\/arxiv.org\/pdf\/2405.14458v2","DOI":"10.52202\/079017-3429"},{"key":"8235_CR12","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2503.04139","author":"J Feng","year":"2025","unstructured":"Feng J, Hamilton-Fletcher G, Ballem N, Batavia M, Wang Y, Zhong J, Porfiri M, Rizzo J (2025) Robust computer-vision based construction site detection for assistive-technology applications. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2503.04139","journal-title":"arXiv"},{"key":"8235_CR13","doi-asserted-by":"publisher","first-page":"1242","DOI":"10.1007\/s11227-025-07732-7","volume":"81","author":"DA Amer","year":"2025","unstructured":"Amer DA, Ibrahim NY, Ibrahim IK, Mohamed AM, Soliman SA (2025) Intelligent eyes on water: yolov11-based real-time drowning detection system. J Supercomput 81:1242. https:\/\/doi.org\/10.1007\/s11227-025-07732-7","journal-title":"J Supercomput"},{"issue":"6","key":"8235_CR14","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2016","unstructured":"Ren S, He K, Girshick R, Sun J (2016) Faster R-CNN: towards real-time object detection with region proposal networks. IEEE Trans Pattern Anal Mach Intell 39(6):1137\u20131149. https:\/\/doi.org\/10.1109\/TPAMI.2016.2577031","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"8","key":"8235_CR15","doi-asserted-by":"publisher","first-page":"10453","DOI":"10.1007\/s13369-022-06825-2","volume":"47","author":"MA Rahman","year":"2022","unstructured":"Rahman MA, Allaham SS, Masad AA, Al-Rawabdeh AM (2022) Window detection in facade imagery: a deep learning approach using mask R-CNN. Arab J Sci Eng 47(8):10453\u201310467. https:\/\/doi.org\/10.1007\/s13369-022-06825-2","journal-title":"Arab J Sci Eng"},{"key":"8235_CR16","doi-asserted-by":"crossref","unstructured":"He K, Gkioxari G, Doll\u00e1r P, Girshick R (2017) Mask r-cnn. In: Proceedings of the IEEE international conference on computer vision, pp 2961\u20132969. IEEE. https:\/\/arxiv.org\/pdf\/1703.06870","DOI":"10.1109\/ICCV.2017.322"},{"key":"8235_CR17","doi-asserted-by":"publisher","unstructured":"Dai J, Li Y, He K, Sun J (2016) R-FCN: object detection via region-based fully convolutional networks. In: Advances in neural information processing systems 29\u00a0(NIPS 2016).\u00a0https:\/\/doi.org\/10.48550\/arXiv.1605.06409","DOI":"10.48550\/arXiv.1605.06409"},{"key":"8235_CR18","doi-asserted-by":"publisher","DOI":"10.1016\/j.rineng.2024.103571","volume":"24","author":"S Wang","year":"2024","unstructured":"Wang S (2024) Evaluation of impact of image augmentation techniques on two tasks: window detection and window states detection. Results Eng 24:103571. https:\/\/doi.org\/10.1016\/j.rineng.2024.103571","journal-title":"Results Eng"},{"key":"8235_CR19","doi-asserted-by":"publisher","unstructured":"Carion N, Massa F, Synnaeve G, Usunier N, Kirchhof A, Doll\u00e1r P (2020) End-to-end object detection with transformers. In: European conference on computer vision, Springer, pp 213\u2013229. https:\/\/doi.org\/10.1007\/978-3-030-58586-4_13","DOI":"10.1007\/978-3-030-58586-4_13"},{"key":"8235_CR20","doi-asserted-by":"publisher","unstructured":"Zhao Y et al (2024) DETRs beat YOLOs on real-time object detection. In: 2024 IEEE\/CVF conference on computer vision and pattern recognition, IEEE, pp 16965\u201316974. https:\/\/doi.org\/10.1109\/CVPR52733.2024.01605","DOI":"10.1109\/CVPR52733.2024.01605"},{"key":"8235_CR21","doi-asserted-by":"publisher","first-page":"1226","DOI":"10.1007\/s11227-025-07709-6","volume":"81","author":"Q Shen","year":"2025","unstructured":"Shen Q, Zhang L, Zhang Y, Zhang Y, Liu S (2025) LEDDR-YOLO: a lightweight and efficient distracted driving recognition algorithm with a particular pruning method. J Supercomput 81:1226. https:\/\/doi.org\/10.1007\/s11227-025-07709-6","journal-title":"J Supercomput"},{"key":"8235_CR22","doi-asserted-by":"publisher","first-page":"984","DOI":"10.1007\/s11227-025-07485-3","volume":"81","author":"X Chen","year":"2025","unstructured":"Chen X, Wang G (2025) FP-RTDETR: enhancing infrared ship detection with multi-scale feature fusion and lightweight design. J Supercomput 81:984. https:\/\/doi.org\/10.1007\/s11227-025-07485-3","journal-title":"J Supercomput"},{"key":"8235_CR23","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2024.105276","volume":"151","author":"H Pan","year":"2024","unstructured":"Pan H, Guan S, Zhao X (2024) LVD-yolo: an efficient lightweight vehicle detection model for intelligent transportation systems. Image Vis Comput 151:105276. https:\/\/doi.org\/10.1016\/j.imavis.2024.105276","journal-title":"Image Vis Comput"},{"key":"8235_CR24","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2502.04656","author":"Z Yang","year":"2025","unstructured":"Yang Z, Guan Q, Yu Z, Xu X, Long H, Lian S, Hu H, Tang Y (2025) MHAF-YOLO: multi-branch heterogeneous auxiliary fusion YOLO for accurate object detection. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2502.04656","journal-title":"arXiv"},{"key":"8235_CR25","doi-asserted-by":"publisher","unstructured":"Cai X, Lai Q, Wang Y, Wang W, Sun Z, Yao Y (2024).Poly kernel inception network for remote sensing detection. In: 2024 IEEE\/CVF conference on computer vision and pattern recognition, IEEE, pp 27706\u201327716. https:\/\/doi.org\/10.1109\/CVPR52733.2024.02617","DOI":"10.1109\/CVPR52733.2024.02617"},{"key":"8235_CR26","doi-asserted-by":"publisher","unstructured":"Xia G-S, Bai X, Ding J, Zhu Z, Belongie S, Luo J, Datcu M, Pelillo M, Zhang L (2018) DOTA: a large-scale dataset for object detection in aerial images. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3974\u20133983. https:\/\/doi.org\/10.1109\/CVPR.2018.00418","DOI":"10.1109\/CVPR.2018.00418"},{"issue":"4","key":"8235_CR27","doi-asserted-by":"publisher","first-page":"2388","DOI":"10.1109\/TPAMI.2024.3524377","volume":"47","author":"Y Feng","year":"2025","unstructured":"Feng Y et al (2025) Hyper-yolo: when visual object detection meets hypergraph computation. IEEE Trans Pattern Anal Mach Intell 47(4):2388\u20132401. https:\/\/doi.org\/10.1109\/TPAMI.2024.3524377","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"8235_CR28","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2403.19967","author":"X Ma","year":"2024","unstructured":"Ma X, Dai X, Bai Y, Wang Y, Fu Y (2024) Rewrite the stars. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2403.19967","journal-title":"arXiv"},{"key":"8235_CR29","doi-asserted-by":"publisher","unstructured":"Geiger A, Lenz P, Urtasun R (2012) Are we ready for autonomous driving? The KITTI vision benchmark suite. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3354\u20133361. https:\/\/doi.org\/10.1109\/CVPR.2012.6248074","DOI":"10.1109\/CVPR.2012.6248074"},{"key":"8235_CR30","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2205.12740","author":"Z Gevorgyan","year":"2022","unstructured":"Gevorgyan Z (2022) SIoU loss: more powerful learning for bounding box regression. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2205.12740","journal-title":"arXiv"},{"key":"8235_CR31","doi-asserted-by":"publisher","unstructured":"Tong Z, Chen Y, Xu Z, et al (2023). Wise-IoU: bounding box regression loss with dynamic focusing mechanism. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2301.10051","DOI":"10.48550\/arXiv.2301.10051"},{"key":"8235_CR32","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2502.14740","author":"MAR Alif","year":"2025","unstructured":"Alif MAR, Hussain M (2025) YOLOv12: a breakdown of the key architectural features. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2502.14740","journal-title":"arXiv"},{"key":"8235_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TIM.2024.3497132","volume":"74","author":"M Zhang","year":"2025","unstructured":"Zhang M, Rong Q, Jing H (2025) TTSDA-YOLO: a two training stage domain adaptation framework for object detection in adverse weather. IEEE Trans Instrum Meas 74:1\u201313. https:\/\/doi.org\/10.1109\/TIM.2024.3497132","journal-title":"IEEE Trans Instrum Meas"},{"key":"8235_CR34","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2407.21640","author":"SG Kolahii","year":"2024","unstructured":"Kolahii SG, Chaharsooghi SK, Khatibi T, Bozorgpour A, Azad R, Heidari M, Hacihaliloglu I, Merhof D (2024) MSA2Net: multi-scale adaptive attention-guided network for medical image segmentation. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2407.21640","journal-title":"arXiv"},{"key":"8235_CR35","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2311.02877","author":"H Zhang","year":"2023","unstructured":"Zhang H, Xu C, Zhang S (2023) Inner-iou: more effective intersection over union loss with auxiliary bounding box. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2311.02877","journal-title":"arXiv"},{"key":"8235_CR36","doi-asserted-by":"publisher","first-page":"276","DOI":"10.1016\/j.neunet.2023.11.041","volume":"170","author":"C Liu","year":"2024","unstructured":"Liu C, Wang K, Li Q, Zhao F, Zhao K, Ma H (2024) Powerful-iou: more straightforward and faster bounding box regression loss with a nonmonotonic focusing mechanism. Neural Netw 170:276\u2013284. https:\/\/doi.org\/10.1016\/j.neunet.2023.11.041","journal-title":"Neural Netw"},{"key":"8235_CR37","doi-asserted-by":"crossref","unstructured":"Huang S et al (2025) DEIM: DETR with improved matching for fast convergence. arXiv. https:\/\/arxiv.org\/abs\/2412.04234","DOI":"10.1109\/CVPR52734.2025.01412"},{"key":"8235_CR38","doi-asserted-by":"publisher","unstructured":"Cheng T, Song L, Ge Y, Liu W, Wang X, Shan Y (2024) YOLO-World: real-time open-vocabulary object detection. In: ieee\/cvf conference on computer vision and pattern recognition, pp 21202\u201321212. https:\/\/doi.org\/10.1109\/CVPR.2024.01305","DOI":"10.1109\/CVPR.2024.01305"},{"key":"8235_CR39","unstructured":"Han K, Wang Y, Guo J, Wu E (2024, January 14) ParameterNet: parameters are all you need [cs.CV]. arXiv. https:\/\/arxiv.org\/pdf\/2306.14525v2"},{"key":"8235_CR40","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2312.05760","author":"A Wang","year":"2024","unstructured":"Wang A, Chen H, Lin Z, Han J, Ding G (2024) RepViT-SAM: towards real-time segmenting anything [cs.CV]. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2312.05760","journal-title":"arXiv"},{"key":"8235_CR41","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2408.03703","author":"T Zhang","year":"2024","unstructured":"Zhang T, Li L, Zhou Y, Liu W, Qian C, Hwang J, Ji X (2024) CAS-ViT: convolutional additive self-attention vision transformers for efficient mobile applications [cs.CV]. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2408.03703","journal-title":"arXiv"},{"key":"8235_CR42","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2311.17132","author":"D Shi","year":"2024","unstructured":"Shi D (2024) TransNeXt: robust foveal visual perception for vision transformers [cs.CV, cs.AI]. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2311.17132","journal-title":"arXiv"},{"key":"8235_CR43","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2412.08345","author":"M Lei","year":"2024","unstructured":"Lei M, Wu H, Lv X, Wang X (2024) ConDSeg: a general medical image segmentation framework via contrast-driven feature enhancement [eess.IV, cs.CV]. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2412.08345","journal-title":"arXiv"},{"key":"8235_CR44","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1911.11907","author":"K Han","year":"2020","unstructured":"Han K, Wang Y, Tian Q, Guo J, Xu C, Xu C (2020) Ghostnet: more features from cheap operations. arXiv. https:\/\/doi.org\/10.48550\/arXiv.1911.11907","journal-title":"arXiv"},{"key":"8235_CR45","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2301.00808","author":"S Woo","year":"2023","unstructured":"Woo S, Debnath S, Hu R, Chen X, Liu Z, Kweon IS, Xie S (2023) ConvNeXt V2: co-designing and scaling ConvNets with masked autoencoders [cs.CV]. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2301.00808","journal-title":"arXiv"},{"key":"8235_CR46","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1706.03762","author":"A Vaswani","year":"2017","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser L, Polosukhin I (2017) Attention is all you need. arXiv. https:\/\/doi.org\/10.48550\/arXiv.1706.03762","journal-title":"arXiv"},{"key":"8235_CR47","doi-asserted-by":"publisher","unstructured":"Li W, Guo H, Liu X, Liang K, Hu J, Ma Z, Guo J (2024) Efficient face super-resolution via wavelet-based feature enhancement network. In: Proceedings of the 32nd ACM international conference on multimedia, ACM, pp 4515\u20134523. https:\/\/doi.org\/10.1145\/3664647.3681088","DOI":"10.1145\/3664647.3681088"},{"key":"8235_CR48","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2212.11677","author":"F Tang","year":"2022","unstructured":"Tang F, Huang Q, Wang J, Hou X, Su J, Liu J (2022) DuAT: dual-aggregation transformer network for medical image segmentation. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2212.11677","journal-title":"arXiv"},{"key":"8235_CR49","doi-asserted-by":"publisher","DOI":"10.1016\/j.mechmat.2025.105254","volume":"203","author":"X Hu","year":"2025","unstructured":"Hu X, Zeng G, Huang M, Zhu Y, Zhao L, Li Z, Deng F (2025) Unusual temperature dependent core properties of <110> superdislocation in Ni<inf>3<\/inf>Al by ab initio results-informed fully discrete Peierls-Nabarro model. Mech Mater 203:105254. https:\/\/doi.org\/10.1016\/j.mechmat.2025.105254","journal-title":"Mech Mater"},{"key":"8235_CR50","doi-asserted-by":"publisher","unstructured":"Xu S et al (2024) HCF-Net: hierarchical context fusion network for infrared small object detection. In: 2024 IEEE international conference on multimedia and expo, IEEE, pp 1\u20136. https:\/\/doi.org\/10.1109\/ICME57554.2024.10687431","DOI":"10.1109\/ICME57554.2024.10687431"},{"key":"8235_CR51","doi-asserted-by":"publisher","DOI":"10.1007\/s00530-024-01593-5","author":"X Chen","year":"2025","unstructured":"Chen X, Yu C (2025) SCG-DETR: a high-precision railway turnout defect detection method based on attention feature fusion and SMP-CGLU approach. Multimedia Syst. https:\/\/doi.org\/10.1007\/s00530-024-01593-5","journal-title":"Multimedia Syst"},{"key":"8235_CR52","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2405.06228","author":"Z Ni","year":"2024","unstructured":"Ni Z, Chen X, Zhai Y, Tang Y, Wang Y (2024) Context-guided spatial feature reconstruction for efficient semantic segmentation. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2405.06228","journal-title":"arXiv"},{"key":"8235_CR53","doi-asserted-by":"crossref","unstructured":"Woo S, Park J, Lee J-Y, Kweon IS (2018) CBAM: convolutional block attention module.\u00a0arXiv.\u00a0https:\/\/arxiv.org\/pdf\/1807.06521","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"8235_CR54","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2101.08158","author":"Y-F Zhang","year":"2022","unstructured":"Zhang Y-F, Ren W, Zhang Z, Jia Z, Wang L, Tan T (2022) Focal and efficient IOU loss for accurate bounding box regression. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2101.08158","journal-title":"arXiv"},{"key":"8235_CR55","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2307.07662","author":"S Ma","year":"2023","unstructured":"Ma S, Xu Y (2023) MPdiou: a loss for efficient and accurate bounding box regression. arXiv. https:\/\/doi.org\/10.48550\/arXiv.2307.07662","journal-title":"arXiv"}],"container-title":["The Journal of Supercomputing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-026-08235-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11227-026-08235-9","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11227-026-08235-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T09:10:14Z","timestamp":1768900214000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11227-026-08235-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,20]]},"references-count":55,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2026,1]]}},"alternative-id":["8235"],"URL":"https:\/\/doi.org\/10.1007\/s11227-026-08235-9","relation":{},"ISSN":["1573-0484"],"issn-type":[{"value":"1573-0484","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,20]]},"assertion":[{"value":"25 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have influenced the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable (no human participants or data were used).","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Human and animal participants"}}],"article-number":"73"}}