{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T11:05:16Z","timestamp":1773486316672,"version":"3.50.1"},"reference-count":32,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T00:00:00Z","timestamp":1769558400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T00:00:00Z","timestamp":1769558400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Pattern Anal Applic"],"published-print":{"date-parts":[[2026,3]]},"DOI":"10.1007\/s10044-026-01614-1","type":"journal-article","created":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T20:24:18Z","timestamp":1769631858000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Addressing data scarcity and imbalance in vessel detection from UAV-captured images via diffusion-based multimodal synthesis and context-aware compositing"],"prefix":"10.1007","volume":"29","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4335-7002","authenticated-orcid":false,"given":"Chi-Thanh","family":"Nguyen","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-2228-5225","authenticated-orcid":false,"given":"Thu-Huong","family":"Pham","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5065-5545","authenticated-orcid":false,"given":"Thi-Thu-Hong","family":"Le","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,1,28]]},"reference":[{"issue":"4","key":"1614_CR1","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1007\/s13437-023-00312-7","volume":"22","author":"C Gamage","year":"2023","unstructured":"Gamage C, Dinalankara R, Samarabandu J, Subasinghe A (2023) A comprehensive survey on the applications of machine learning techniques on maritime surveillance to detect abnormal maritime vessel behaviors. WMU J Marit Aff 22(4):447\u2013477","journal-title":"WMU J Marit Aff"},{"key":"1614_CR2","doi-asserted-by":"publisher","DOI":"10.1016\/j.oceaneng.2023.115440","volume":"285","author":"S Cheng","year":"2023","unstructured":"Cheng S, Zhu Y, Wu S (2023) Deep learning based efficient ship detection from drone-captured images for maritime surveillance. Ocean Eng 285:115440","journal-title":"Ocean Eng"},{"key":"1614_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2023.107513","volume":"128","author":"C Zhao","year":"2024","unstructured":"Zhao C, Liu RW, Qu J, Gao R (2024) Deep learning-based object detection in maritime unmanned aerial vehicle imagery: review and experimental comparisons. Eng Appl Artif Intell 128:107513","journal-title":"Eng Appl Artif Intell"},{"key":"1614_CR4","doi-asserted-by":"publisher","DOI":"10.1016\/j.apor.2023.103835","volume":"142","author":"N Wang","year":"2024","unstructured":"Wang N, Wang Y, Wei Y, Han B, Feng Y (2024) Marine vessel detection dataset and benchmark for unmanned surface vehicles. Appl Ocean Res 142:103835","journal-title":"Appl Ocean Res"},{"key":"1614_CR5","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109347","volume":"137","author":"M Xu","year":"2023","unstructured":"Xu M, Yoon S, Fuentes A, Park DS (2023) A comprehensive survey of image augmentation techniques for deep learning. Pattern Recogn 137:109347","journal-title":"Pattern Recogn"},{"key":"1614_CR6","first-page":"13001","volume":"34","author":"Z Zhong","year":"2020","unstructured":"Zhong Z, Zheng L, Kang G, Li S, Yang Y (2020) Random erasing data augmentation. Proc AAAI Conf Artif Intell 34:13001\u201313008","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"1614_CR7","unstructured":"Chen P, Liu S, Zhao H, Wang X, Jia J (2020) Gridmask data augmentation. arXiv:2001.04086"},{"key":"1614_CR8","unstructured":"Li P, Li X, Long X (2020) Fencemask: a data augmentation approach for pre-extracted image features. arXiv:2006.07877"},{"key":"1614_CR9","unstructured":"Ge ZY, Liu S, Wang F, Li Z, Yolox JS (2021) Exceeding yolo series in 2021. arXiv:2107.08430"},{"key":"1614_CR10","doi-asserted-by":"crossref","unstructured":"Yun S, Han D, Oh SJ, Chun S, Choe J, Yoo Y (2019) Cutmix: regularization strategy to train strong classifiers with localizable features. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 6023\u20136032","DOI":"10.1109\/ICCV.2019.00612"},{"key":"1614_CR11","doi-asserted-by":"publisher","first-page":"47304","DOI":"10.1109\/ACCESS.2023.3275134","volume":"11","author":"P Eigenschink","year":"2023","unstructured":"Eigenschink P, Reutterer T, Vamosi S, Vamosi R, Sun C, Kalcher K (2023) Deep generative models for synthetic data: a survey. IEEE Access 11:47304\u201347320","journal-title":"IEEE Access"},{"key":"1614_CR12","unstructured":"Azizi S, Kornblith S, Saharia C, Norouzi M, Fleet DJ (2023) Synthetic data from diffusion models improves imagenet classification. arXiv:2304.08466"},{"issue":"4","key":"1614_CR13","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1007\/s10489-024-06217-z","volume":"55","author":"Y Jiang","year":"2025","unstructured":"Jiang Y, Liu S, Wang H (2025) Diffusion-based remote sensing image fusion for classification. Appl Intell 55(4):247","journal-title":"Appl Intell"},{"key":"1614_CR14","unstructured":"Li Z, Li Y, Zhao P, Song R, Li X, Yang J (2023) Is synthetic data from diffusion models ready for knowledge distillation? arXiv:2305.12954"},{"issue":"12","key":"1614_CR15","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10489-025-06751-4","volume":"55","author":"T Yuan","year":"2025","unstructured":"Yuan T, Yu Y, Ji N (2025) Style-content progressive aggregation network with stable diffusion. Appl Intell 55(12):1\u201316","journal-title":"Appl Intell"},{"key":"1614_CR16","doi-asserted-by":"crossref","unstructured":"Shipard J, Wiliem A, Thanh KN, Xiang W, Fookes C (2023) Diversity is definitely needed: Improving model-agnostic zero-shot classification via stable diffusion. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 769\u2013778","DOI":"10.1109\/CVPRW59228.2023.00084"},{"key":"1614_CR17","unstructured":"Zhou Y, Sahak H, Ba J (2023) Training on thin air: improve image classification with generated data. arXiv:2305.15316"},{"issue":"4","key":"1614_CR18","doi-asserted-by":"publisher","first-page":"286","DOI":"10.1007\/s10489-024-06210-6","volume":"55","author":"J Meng","year":"2025","unstructured":"Meng J, Zou J, Xiang Z, Wang C, Wang S, Li Y, Kim J (2025) Visible and thermal image fusion network with diffusion models for high-level visual tasks. Appl Intell 55(4):286","journal-title":"Appl Intell"},{"key":"1614_CR19","unstructured":"Podell D, English Z, Lacey K, Blattmann A, Dockhorn T, M\u00fcller J, Penna J, Rombach R (2023) Sdxl: improving latent diffusion models for high-resolution image synthesis. arXiv:2307.01952"},{"key":"1614_CR20","doi-asserted-by":"crossref","unstructured":"Zhang L, Rao A, Agrawala M (2023) Adding conditional control to text-to-image diffusion models. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 3836\u20133847","DOI":"10.1109\/ICCV51070.2023.00355"},{"key":"1614_CR21","doi-asserted-by":"crossref","unstructured":"Mou C, Wang X, Xie L, Wu Y, Zhang J, Qi Z, Shan Y (2024) T2i-adapter: Learning adapters to dig out more controllable ability for text-to-image diffusion models. In: Proceedings of the AAAI conference on artificial intelligence, vol. 38, pp. 4296\u20134304","DOI":"10.1609\/aaai.v38i5.28226"},{"key":"1614_CR22","doi-asserted-by":"crossref","unstructured":"Rub\u00ed B, Cacace J, Rodriguez J, Company R, Tanner M, Arzo R, Cayero J (2024) Vesselimg: a large uav-based vessel image dataset for port surveillance. In: 2024 international conference on unmanned aircraft systems (ICUAS). IEEE\u00a0pp. 76\u201383","DOI":"10.1109\/ICUAS60882.2024.10556944"},{"key":"1614_CR23","unstructured":"Team G, Mesnard T, Hardin C, Dadashi R, Bhupatiraju S, Pathak S, Sifre L, Rivi\u00e8re M, Kale MS, Love J, et al (2024) Gemma: Open models based on gemini research and technology. arXiv:2403.08295"},{"key":"1614_CR24","unstructured":"Black Forest Lab: FLUX (2024) https:\/\/github.com\/black-forest-labs\/flux. Accessed: 2025-04-15"},{"key":"1614_CR25","doi-asserted-by":"crossref","unstructured":"Cheng T, Song L, Ge Y, Liu W, Wang X, Shan Y (2024) Yolo-world: real-time open-vocabulary object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 16901\u201316911.","DOI":"10.1109\/CVPR52733.2024.01599"},{"key":"1614_CR26","doi-asserted-by":"crossref","unstructured":"Liu S, Zeng Z, Ren T, Li F, Zhang H, Yang J, Jiang Q, Li C, Yang J, Su H, et al (2024) Grounding dino: marrying dino with grounded pre-training for open-set object detection. In: European conference on computer vision. Springer, pp. 38\u201355.\u00a0","DOI":"10.1007\/978-3-031-72970-6_3"},{"key":"1614_CR27","doi-asserted-by":"crossref","unstructured":"Kirillov A, Mintun E, Ravi N, Mao H, Rolland C, Gustafson L, Xiao T, Whitehead S, Berg AC, Lo W-Y, et al (2023) Segment anything. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 4015\u20134026l.","DOI":"10.1109\/ICCV51070.2023.00371"},{"issue":"9","key":"1614_CR28","doi-asserted-by":"publisher","first-page":"1638","DOI":"10.3390\/jmse11091638","volume":"11","author":"B Iancu","year":"2023","unstructured":"Iancu B, Winsten J, Soloviev V, Lilius J (2023) A benchmark for maritime object detection with centernet on an improved dataset, aboships-plus. J Mar Sci Eng 11(9):1638","journal-title":"J Mar Sci Eng"},{"key":"1614_CR29","doi-asserted-by":"publisher","DOI":"10.1016\/j.ecolind.2024.111682","volume":"159","author":"H Hu","year":"2024","unstructured":"Hu H, Zhou W, Jiang B, Zhang J, Cheng T (2024) Exploring deep learning techniques for the extraction of lit fishing vessels from luojia1-01. Ecol Ind 159:111682","journal-title":"Ecol Ind"},{"key":"1614_CR30","first-page":"1","volume":"22","author":"Y Zhang","year":"2025","unstructured":"Zhang Y, Liu T, Zhen J, Kang Y, Cheng Y (2025) Adaptive downsampling and scale enhanced detection head for tiny object detection in remote sensing image. IEEE Geosci Remote Sens Lett 22:1\u20135","journal-title":"IEEE Geosci Remote Sens Lett"},{"issue":"1","key":"1614_CR31","doi-asserted-by":"publisher","DOI":"10.1117\/1.JEI.34.1.013005","volume":"34","author":"Y Zhang","year":"2025","unstructured":"Zhang Y, Wang S, Zhang Y, Yu P (2025) Asymmetric light-aware progressive decoding network for rgb-thermal salient object detection. J Electron Imaging 34(1):013005\u2013013005","journal-title":"J Electron Imaging"},{"key":"1614_CR32","first-page":"6840","volume":"33","author":"J Ho","year":"2020","unstructured":"Ho J, Jain A, Abbeel P (2020) Denoising diffusion probabilistic models. Adv Neural Inf Process Syst 33:6840\u20136851","journal-title":"Adv Neural Inf Process Syst"}],"container-title":["Pattern Analysis and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-026-01614-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10044-026-01614-1","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10044-026-01614-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T10:39:14Z","timestamp":1773484754000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10044-026-01614-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,28]]},"references-count":32,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,3]]}},"alternative-id":["1614"],"URL":"https:\/\/doi.org\/10.1007\/s10044-026-01614-1","relation":{},"ISSN":["1433-7541","1433-755X"],"issn-type":[{"value":"1433-7541","type":"print"},{"value":"1433-755X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,28]]},"assertion":[{"value":"14 August 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no Conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"30"}}