{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,24]],"date-time":"2026-06-24T01:02:25Z","timestamp":1782262945187,"version":"3.54.5"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,1,3]],"date-time":"2026-01-03T00:00:00Z","timestamp":1767398400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T00:00:00Z","timestamp":1769731200000},"content-version":"vor","delay-in-days":27,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["82201195"],"award-info":[{"award-number":["82201195"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["npj Digit. Med."],"DOI":"10.1038\/s41746-025-02300-y","type":"journal-article","created":{"date-parts":[[2026,1,3]],"date-time":"2026-01-03T06:37:12Z","timestamp":1767422232000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Grounded report generation for enhancing ophthalmic ultrasound interpretation using Vision-Language Segmentation models"],"prefix":"10.1038","volume":"9","author":[{"given":"Kai","family":"Jin","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Qixuan","family":"Sun","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Daohuan","family":"Kang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ziyao","family":"Luo","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Tao","family":"Yu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Wenzheng","family":"Han","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yi","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Meng","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Danli","family":"Shi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Andrzej","family":"Grzybowski","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2026,1,3]]},"reference":[{"key":"2300_CR1","doi-asserted-by":"publisher","first-page":"888","DOI":"10.1038\/s41586-025-08675-y","volume":"639","author":"VM Rao","year":"2025","unstructured":"Rao, V. M. et al. Multimodal generative AI for medical image interpretation. Nature 639, 888\u2013896 (2025).","journal-title":"Nature"},{"key":"2300_CR2","doi-asserted-by":"publisher","first-page":"e1921460","DOI":"10.1001\/jamanetworkopen.2019.21460","volume":"3","author":"SL Propst","year":"2020","unstructured":"Propst, S. L. et al. Ocular point-of-care ultrasonography to diagnose posterior chamber abnormalities: a systematic review and meta-analysis. JAMA Netw. open 3, e1921460\u2013e1921460 (2020).","journal-title":"JAMA Netw. open"},{"key":"2300_CR3","doi-asserted-by":"publisher","first-page":"677","DOI":"10.1007\/s10555-018-9762-9","volume":"37","author":"A Maheshwari","year":"2018","unstructured":"Maheshwari, A. & Finger, P. T. Cancers of the eye. Cancer Metastasis Rev. 37, 677\u2013690 (2018).","journal-title":"Cancer Metastasis Rev."},{"key":"2300_CR4","doi-asserted-by":"publisher","first-page":"783","DOI":"10.1136\/bjophthalmol-2011-301378","volume":"96","author":"S Resnikoff","year":"2012","unstructured":"Resnikoff, S., Felch, W., Gauthier, T. M. & Spivey, B. The number of ophthalmologists in practice and training worldwide: a growing gap despite more than 200,000 practitioners. Br. J. Ophthalmol. 96, 783\u2013787 (2012).","journal-title":"Br. J. Ophthalmol."},{"key":"2300_CR5","doi-asserted-by":"publisher","first-page":"588","DOI":"10.1136\/bjophthalmol-2019-314336","volume":"104","author":"S Resnikoff","year":"2020","unstructured":"Resnikoff, S. et al. Estimated number of ophthalmologists worldwide (International Council of Ophthalmology update): will we meet the needs? Br. J. Ophthalmol. 104, 588\u2013592 (2020).","journal-title":"Br. J. Ophthalmol."},{"key":"2300_CR6","doi-asserted-by":"publisher","first-page":"e14","DOI":"10.1016\/j.ophtha.2021.08.023","volume":"129","author":"MD Abr\u00e0moff","year":"2022","unstructured":"Abr\u00e0moff, M. D. et al. Foundational considerations for artificial intelligence using ophthalmic images. Ophthalmology 129, e14\u2013e32 (2022).","journal-title":"Ophthalmology"},{"key":"2300_CR7","doi-asserted-by":"publisher","DOI":"10.1016\/j.xcrm.2023.101095","volume":"4","author":"Z Li","year":"2023","unstructured":"Li, Z. et al. Artificial intelligence in ophthalmology: the path to the real-world clinic. Cell Rep. Med. 4, 101095 (2023).","journal-title":"Cell Rep. Med."},{"key":"2300_CR8","doi-asserted-by":"publisher","first-page":"120","DOI":"10.1016\/j.aopr.2024.03.003","volume":"4","author":"K Jin","year":"2024","unstructured":"Jin, K. et al. Integration of smartphone technology and artificial intelligence for advanced ophthalmic care: a systematic review. Adv. Ophthalmol. Pract. Res. 4, 120\u2013127 (2024).","journal-title":"Adv. Ophthalmol. Pract. Res."},{"key":"2300_CR9","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1001\/jamaophthalmol.2024.0017","volume":"142","author":"A Mihalache","year":"2024","unstructured":"Mihalache, A. et al. Accuracy of an artificial intelligence Chatbot\u2019s interpretation of clinical ophthalmic images. JAMA Ophthalmol. 142, 321\u2013326 (2024).","journal-title":"JAMA Ophthalmol."},{"key":"2300_CR10","doi-asserted-by":"publisher","first-page":"599","DOI":"10.1007\/s40123-025-01109-y","volume":"14","author":"T Yu","year":"2025","unstructured":"Yu, T. et al. A systematic review of advances in AI-assisted analysis of fundus fluorescein angiography (FFA) images: from detection to report generation. Ophthalmol. Ther. 14, 599\u2013619 (2025).","journal-title":"Ophthalmol. Ther."},{"key":"2300_CR11","doi-asserted-by":"publisher","DOI":"10.1016\/j.xcrm.2022.100861","volume":"3","author":"MMH Shandhi","year":"2022","unstructured":"Shandhi, M. M. H. & Dunn, J. P. AI in medicine: where are we now and where are we going? Cell Rep. Med. 3, 100861 (2022).","journal-title":"Cell Rep. Med."},{"key":"2300_CR12","doi-asserted-by":"publisher","first-page":"999","DOI":"10.1136\/bjo-2022-322953","volume":"108","author":"Y Wang","year":"2024","unstructured":"Wang, Y. et al. Automated classification of multiple ophthalmic diseases using ultrasound images by deep learning. Br. J. Ophthalmol. 108, 999\u20131004 (2024).","journal-title":"Br. J. Ophthalmol."},{"key":"2300_CR13","doi-asserted-by":"publisher","first-page":"2645","DOI":"10.1007\/s40123-024-01009-7","volume":"13","author":"X Ye","year":"2024","unstructured":"Ye, X. et al. Ocular disease detection with deep learning (fine-grained image categorization) applied to ocular B-scan ultrasound images. Ophthalmol. Ther. 13, 2645\u20132659 (2024).","journal-title":"Ophthalmol. Ther."},{"key":"2300_CR14","doi-asserted-by":"publisher","first-page":"1852","DOI":"10.1136\/bjo-2022-321472","volume":"107","author":"Z Gao","year":"2023","unstructured":"Gao, Z. et al. Automatic interpretation and clinical evaluation for fundus fluorescein angiography images of diabetic retinopathy patients by deep learning. Br. J. Ophthalmol. 107, 1852\u20131858 (2023).","journal-title":"Br. J. Ophthalmol."},{"key":"2300_CR15","doi-asserted-by":"publisher","first-page":"487","DOI":"10.1097\/ICU.0000000000001089","volume":"35","author":"G Lim","year":"2024","unstructured":"Lim, G., Elangovan, K. & Jin, L. Vision language models in ophthalmology. Curr. Opin. Ophthalmol. 35, 487\u2013493 (2024).","journal-title":"Curr. Opin. Ophthalmol."},{"key":"2300_CR16","doi-asserted-by":"publisher","first-page":"2886","DOI":"10.1038\/s41591-024-03139-8","volume":"30","author":"J Li","year":"2024","unstructured":"Li, J. et al. Integrated image-based deep learning and language models for primary diabetes care. Nat. Med. 30, 2886\u20132896 (2024).","journal-title":"Nat. Med."},{"key":"2300_CR17","doi-asserted-by":"publisher","first-page":"1481","DOI":"10.1038\/s41591-024-02959-y","volume":"30","author":"M Christensen","year":"2024","unstructured":"Christensen, M., Vukadinovic, M., Yuan, N. & Ouyang, D. Vision\u2013language foundation model for echocardiogram interpretation. Nat. Med. 30, 1481\u20131488 (2024).","journal-title":"Nat. Med."},{"key":"2300_CR18","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-024-44824-z","volume":"15","author":"J Ma","year":"2024","unstructured":"Ma, J. et al. Segment anything in medical images. Nat. Commun. 15, 654 (2024).","journal-title":"Nat. Commun."},{"key":"2300_CR19","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2025.103547","volume":"102","author":"J Wu","year":"2025","unstructured":"Wu, J. et al. Medical SAM adapter: adapting segment anything model for medical image segmentation. Med. Image Anal. 102, 103547 (2025).","journal-title":"Med. Image Anal."},{"key":"2300_CR20","doi-asserted-by":"publisher","first-page":"730","DOI":"10.1038\/s41433-023-02765-9","volume":"38","author":"Y Yan","year":"2024","unstructured":"Yan, Y. et al. Clinical evaluation of deep learning systems for assisting in the diagnosis of the epiretinal membrane grade in general ophthalmologists. Eye 38, 730\u2013736 (2024).","journal-title":"Eye"},{"key":"2300_CR21","doi-asserted-by":"publisher","first-page":"3129","DOI":"10.1038\/s41591-024-03185-2","volume":"30","author":"K Zhang","year":"2024","unstructured":"Zhang, K. et al. A generalist vision\u2013language foundation model for diverse biomedical tasks. Nat. Med. 30, 3129\u20133141 (2024).","journal-title":"Nat. Med."},{"key":"2300_CR22","doi-asserted-by":"publisher","first-page":"573","DOI":"10.1001\/jamaophthalmol.2024.1165","volume":"142","author":"F Antaki","year":"2024","unstructured":"Antaki, F., Chopra, R. & Keane, P. A. Vision-language models for feature detection of macular diseases on optical coherence tomography. JAMA Ophthalmol. 142, 573\u2013576 (2024).","journal-title":"JAMA Ophthalmol."},{"key":"2300_CR23","doi-asserted-by":"publisher","first-page":"111","DOI":"10.1038\/s41746-024-01101-z","volume":"7","author":"X Chen","year":"2024","unstructured":"Chen, X. et al. FFA-GPT: an automated pipeline for fundus fluorescein angiography interpretation and question-answer. npj Digit Med. 7, 111 (2024).","journal-title":"npj Digit Med."},{"key":"2300_CR24","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2025.103514","volume":"102","author":"Y Lu","year":"2025","unstructured":"Lu, Y. & Wang, A. Integrating language into medical visual recognition and reasoning: a survey. Med. Image Anal. 102, 103514 (2025).","journal-title":"Med. Image Anal."},{"key":"2300_CR25","doi-asserted-by":"publisher","unstructured":"Jin, K., Yu, T. & Grzybowski, A. Multimodal artificial intelligence in ophthalmology: applications, challenges, and future directions. Survey Ophthalmol. https:\/\/doi.org\/10.1016\/j.survophthal.2025.07.003.","DOI":"10.1016\/j.survophthal.2025.07.003"},{"key":"2300_CR26","doi-asserted-by":"publisher","unstructured":"Jin, K. et al. Multimodal deep learning with feature level fusion for identification of choroidal neovascularization activity in age-related macular degeneration. Acta Ophthalmol. https:\/\/doi.org\/10.1111\/aos.14928.","DOI":"10.1111\/aos.14928"},{"key":"2300_CR27","doi-asserted-by":"publisher","unstructured":"Liu, J. et al. Challenges in AI-driven biomedical multimodal data fusion and analysis. Genom. Proteom. Bioinform. https:\/\/doi.org\/10.1093\/gpbjnl\/qzaf011 (2025).","DOI":"10.1093\/gpbjnl\/qzaf011"},{"key":"2300_CR28","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-023-02188-x","volume":"10","author":"K Jin","year":"2023","unstructured":"Jin, K. et al. MSHF: a multi-source heterogeneous fundus (MSHF) dataset for image quality assessment. Sci. Data 10, 286 (2023).","journal-title":"Sci. Data"},{"key":"2300_CR29","doi-asserted-by":"publisher","unstructured":"Wu, H. et al. Diabetic retinopathy assessment through multitask learning approach on heterogeneous fundus image datasets. Ophthalmol. Sci. 5, https:\/\/doi.org\/10.1016\/j.xops.2025.100755 (2025).","DOI":"10.1016\/j.xops.2025.100755"},{"key":"2300_CR30","doi-asserted-by":"publisher","first-page":"210","DOI":"10.1016\/j.clindermatol.2023.12.013","volume":"42","author":"A Grzybowski","year":"2024","unstructured":"Grzybowski, A., Jin, K. & Wu, H. Challenges of artificial intelligence in medicine and dermatology. Clin. Dermatol. 42, 210\u2013215 (2024).","journal-title":"Clin. Dermatol."},{"key":"2300_CR31","doi-asserted-by":"publisher","first-page":"265","DOI":"10.1038\/s41746-024-01248-9","volume":"7","author":"K Wenderott","year":"2024","unstructured":"Wenderott, K., Krups, J., Zaruchas, F. & Weigl, M. Effects of artificial intelligence implementation on efficiency in medical imaging\u2014a systematic literature review and meta-analysis. NPJ Digit Med. 7, 265 (2024).","journal-title":"NPJ Digit Med."},{"key":"2300_CR32","doi-asserted-by":"publisher","first-page":"162","DOI":"10.1038\/s41746-022-00700-y","volume":"5","author":"T Ciecierski-Holmes","year":"2022","unstructured":"Ciecierski-Holmes, T., Singh, R., Axt, M., Brenner, S. & Barteit, S. Artificial intelligence for strengthening healthcare systems in low- and middle-income countries: a systematic scoping review. NPJ Digit Med. 5, 162 (2022).","journal-title":"NPJ Digit Med."},{"key":"2300_CR33","doi-asserted-by":"publisher","first-page":"499","DOI":"10.1016\/j.survophthal.2024.03.008","volume":"69","author":"H Wu","year":"2024","unstructured":"Wu, H., Jin, K., Yip, C. C., Koh, V. & Ye, J. A systematic review of economic evaluation of artificial intelligence-based screening for eye diseases: from possibility to reality. Surv. Ophthalmol. 69, 499\u2013507 (2024).","journal-title":"Surv. Ophthalmol."},{"key":"2300_CR34","doi-asserted-by":"publisher","unstructured":"Xu, K. et al. Digital twins in ophthalmology: concepts, applications, and challenges. Asia-Pacific J. Ophthalmol. 100205, https:\/\/doi.org\/10.1016\/j.apjo.2025.100205 (2025).","DOI":"10.1016\/j.apjo.2025.100205"},{"key":"2300_CR35","doi-asserted-by":"publisher","first-page":"e51926","DOI":"10.2196\/51926","volume":"26","author":"X Liu","year":"2024","unstructured":"Liu, X. et al. Uncovering language disparity of ChatGPT on retinal vascular disease classification: cross-sectional study. J. Med. Internet Res. 26, e51926 (2024).","journal-title":"J. Med. Internet Res."},{"key":"2300_CR36","doi-asserted-by":"publisher","first-page":"e258910","DOI":"10.1001\/jamanetworkopen.2025.8910","volume":"8","author":"Z Ying","year":"2025","unstructured":"Ying, Z. et al. Real-time AI-assisted insulin titration system for glucose control in patients with type 2 diabetes: a randomized clinical trial. JAMA Netw. Open 8, e258910 (2025).","journal-title":"JAMA Netw. Open"},{"key":"2300_CR37","doi-asserted-by":"publisher","first-page":"599","DOI":"10.1038\/s41591-024-03302-1","volume":"31","author":"R Tanno","year":"2025","unstructured":"Tanno, R. et al. Collaboration between clinicians and vision\u2013language models in radiology report generation. Nat. Med. 31, 599\u2013608 (2025).","journal-title":"Nat. Med."},{"key":"2300_CR38","unstructured":"Li, B. et al. Llava-onevision: easy visual task transfer. Trans. Mach. Learn. Res. (2025)."},{"key":"2300_CR39","unstructured":"Bai, S. et al. Qwen2. 5-vl technical report. Preprint at https:\/\/arxiv.org\/abs\/2502.13923 (2025)."},{"key":"2300_CR40","doi-asserted-by":"publisher","first-page":"1414","DOI":"10.1109\/TUFFC.2025.3605285","volume":"72","author":"H Rasaee","year":"2025","unstructured":"Rasaee, H., Koleilat, T. & Rivaz, H. Grounding DINO-US-SAM: text-prompted multiorgan segmentation in ultrasound with LoRA-tuned vision\u2013language models. IEEE Trans. Ultrason. Ferroelectr. Freq. Control 72, 1414\u20131425 (2025).","journal-title":"IEEE Trans. Ultrason. Ferroelectr. Freq. Control"}],"container-title":["npj Digital Medicine"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s41746-025-02300-y","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s41746-025-02300-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s41746-025-02300-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T05:32:43Z","timestamp":1769751163000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s41746-025-02300-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,3]]},"references-count":40,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2026,12]]}},"alternative-id":["2300"],"URL":"https:\/\/doi.org\/10.1038\/s41746-025-02300-y","relation":{},"ISSN":["2398-6352"],"issn-type":[{"value":"2398-6352","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,3]]},"assertion":[{"value":"11 June 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 December 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"99"}}