{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T20:18:54Z","timestamp":1780345134449,"version":"3.54.1"},"reference-count":85,"publisher":"Springer Science and Business Media LLC","issue":"15","license":[{"start":{"date-parts":[[2025,9,25]],"date-time":"2025-09-25T00:00:00Z","timestamp":1758758400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,25]],"date-time":"2025-09-25T00:00:00Z","timestamp":1758758400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["2022YFC2407000"],"award-info":[{"award-number":["2022YFC2407000"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1007\/s00371-025-04153-8","type":"journal-article","created":{"date-parts":[[2025,9,25]],"date-time":"2025-09-25T16:19:09Z","timestamp":1758817149000},"page":"12411-12424","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Visual-action AI agents for medical diagnosis and treatment: advances and future outlook"],"prefix":"10.1007","volume":"41","author":[{"given":"Yuanqi","family":"Yao","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yilun","family":"Luxue","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xiang","family":"Chen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Chengxing","family":"Shen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Haodong","family":"Yang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Seungmin","family":"Lee","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Tingli","family":"Chen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Haiyan","family":"Ge","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jie","family":"Shen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,9,25]]},"reference":[{"issue":"1","key":"4153_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41746-018-0040-6","volume":"1","author":"MD Abr\u00e0moff","year":"2018","unstructured":"Abr\u00e0moff, M.D., Lavin, P.T., Birch, M., Shah, N., Folk, J.C.: Pivotal trial of an autonomous AI-based diagnostic system for detection of diabetic retinopathy in primary care offices. npj Digit. Med 1(1), 1\u20138 (2018). https:\/\/doi.org\/10.1038\/s41746-018-0040-6","journal-title":"npj Digit. Med"},{"key":"4153_CR2","unstructured":"Hayward, E.: Global first as NHS hospital uses AI for instant skin cancer checks. https:\/\/www.thetimes.com\/uk\/healthcare\/article\/global-first-as-nhs-hospital-uses-ai-for-instant-skin-cancer-checks-3clspdmk0. Accessed 27 Mar 2025"},{"key":"4153_CR3","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1016\/j.jbi.2018.01.005","volume":"79","author":"A Masood","year":"2018","unstructured":"Masood, A., et al.: Computer-assisted decision support system in pulmonary cancer detection and stage classification on CT images. J. Biomed. Inform. 79, 117\u2013128 (2018)","journal-title":"J. Biomed. Inform."},{"key":"4153_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/JTEHM.2019.2955458","volume":"8","author":"A Masood","year":"2019","unstructured":"Masood, A., et al.: Cloud-based automated clinical decision support system for detection and diagnosis of lung cancer in chest CT. IEEE J. Transl. Eng. Health Med. 8, 1\u201313 (2019)","journal-title":"IEEE J. Transl. Eng. Health Med."},{"issue":"1","key":"4153_CR5","doi-asserted-by":"publisher","first-page":"5517","DOI":"10.1038\/s41598-023-32312-1","volume":"13","author":"Z Cao","year":"2023","unstructured":"Cao, Z., Li, R., Yang, X., Fang, L., Li, Z., Li, J.: Multi-scale detection of pulmonary nodules by integrating attention mechanism. Sci. Rep. 13(1), 5517 (2023). https:\/\/doi.org\/10.1038\/s41598-023-32312-1","journal-title":"Sci. Rep."},{"issue":"12","key":"4153_CR6","doi-asserted-by":"publisher","first-page":"3033","DOI":"10.1038\/s41591-023-02640-w","volume":"29","author":"K Cao","year":"2023","unstructured":"Cao, K., et al.: Large-scale pancreatic cancer detection via non-contrast CT and deep learning. Nat. Med. 29(12), 3033\u20133043 (2023). https:\/\/doi.org\/10.1038\/s41591-023-02640-w","journal-title":"Nat. Med."},{"issue":"1","key":"4153_CR7","doi-asserted-by":"publisher","first-page":"64","DOI":"10.1109\/TMI.2023.3289859","volume":"43","author":"J Li","year":"2024","unstructured":"Li, J., et al.: DSMT-net: dual self-supervised multi-operator transformation for multi-source endoscopic ultrasound diagnosis. IEEE Trans. Med. Imaging 43(1), 64\u201375 (2024). https:\/\/doi.org\/10.1109\/TMI.2023.3289859","journal-title":"IEEE Trans. Med. Imaging"},{"issue":"12","key":"4153_CR8","doi-asserted-by":"publisher","first-page":"4404","DOI":"10.1109\/TMI.2024.3421644","volume":"43","author":"J Xiao","year":"2024","unstructured":"Xiao, J., et al.: Multi-label chest x-ray image classification with single positive labels. IEEE Trans. Med. Imaging 43(12), 4404\u20134418 (2024). https:\/\/doi.org\/10.1109\/TMI.2024.3421644","journal-title":"IEEE Trans. Med. Imaging"},{"key":"4153_CR9","doi-asserted-by":"publisher","DOI":"10.1016\/j.artmed.2024.102919","volume":"154","author":"J Li","year":"2024","unstructured":"Li, J., et al.: SSM-net: Semi-supervised multi-task network for joint lesion segmentation and classification from pancreatic EUS images. Artif. Intell. Med. 154, 102919 (2024). https:\/\/doi.org\/10.1016\/j.artmed.2024.102919","journal-title":"Artif. Intell. Med."},{"issue":"1","key":"4153_CR10","doi-asserted-by":"publisher","first-page":"3058","DOI":"10.1038\/s41598-019-39795-x","volume":"9","author":"S Masood","year":"2019","unstructured":"Masood, S., et al.: Automatic choroid layer segmentation from optical coherence tomography images using deep learning. Sci. Rep. 9(1), 3058 (2019). https:\/\/doi.org\/10.1038\/s41598-019-39795-x","journal-title":"Sci. Rep."},{"key":"4153_CR11","doi-asserted-by":"publisher","first-page":"971943","DOI":"10.3389\/fpubh.2022.971943","volume":"10","author":"B Sheng","year":"2022","unstructured":"Sheng, B., et al.: An overview of artificial intelligence in diabetic retinopathy and other ocular diseases. Front. Public Health 10, 971943 (2022)","journal-title":"Front. Public Health"},{"key":"4153_CR12","doi-asserted-by":"publisher","unstructured":"Li, T., Sheng, B.: MSCE-LT: multi-label supervised contrastive enhancement for long-tailed retinal diseases recognition. In: 2024 IEEE International Conference on Bioinformatics and Biomedicine (BIBM), pp 2128\u20132133 (2024). https:\/\/doi.org\/10.1109\/BIBM62325.2024.10821772","DOI":"10.1109\/BIBM62325.2024.10821772"},{"issue":"11","key":"4153_CR13","doi-asserted-by":"publisher","first-page":"1006","DOI":"10.1001\/jamaophthalmol.2024.3707","volume":"142","author":"B Qian","year":"2024","unstructured":"Qian, B., et al.: A competition for the diagnosis of myopic maculopathy by artificial intelligence algorithms. JAMA Ophthalmol. 142(11), 1006\u20131015 (2024). https:\/\/doi.org\/10.1001\/jamaophthalmol.2024.3707","journal-title":"JAMA Ophthalmol."},{"issue":"9","key":"4153_CR14","doi-asserted-by":"publisher","first-page":"6627","DOI":"10.1007\/s00371-023-03189-y","volume":"40","author":"G Huang","year":"2024","unstructured":"Huang, G., Wen, Y., Qian, B., Bi, L., Chen, T., Sheng, B.: Attention-based multi-scale feature fusion network for myopia grading using optical coherence tomography images. Vis. Comput. 40(9), 6627\u20136638 (2024). https:\/\/doi.org\/10.1007\/s00371-023-03189-y","journal-title":"Vis. Comput."},{"issue":"5","key":"4153_CR15","doi-asserted-by":"publisher","first-page":"2441","DOI":"10.1007\/s40123-023-00746-5","volume":"12","author":"X Ye","year":"2023","unstructured":"Ye, X., et al.: Artificial intelligence-based quantification of central macular fluid volume and VA prediction for diabetic macular edema using OCT images. Ophthalmol. Ther. 12(5), 2441\u20132452 (2023). https:\/\/doi.org\/10.1007\/s40123-023-00746-5","journal-title":"Ophthalmol. Ther."},{"issue":"10","key":"4153_CR16","doi-asserted-by":"publisher","first-page":"2886","DOI":"10.1038\/s41591-024-03139-8","volume":"30","author":"J Li","year":"2024","unstructured":"Li, J., et al.: Integrated image-based deep learning and language models for primary diabetes care. Nat. Med. 30(10), 2886\u20132896 (2024). https:\/\/doi.org\/10.1038\/s41591-024-03139-8","journal-title":"Nat. Med."},{"issue":"2","key":"4153_CR17","doi-asserted-by":"publisher","first-page":"584","DOI":"10.1038\/s41591-023-02702-z","volume":"30","author":"L Dai","year":"2024","unstructured":"Dai, L., et al.: A deep learning system for predicting time to progression of diabetic retinopathy. Nat. Med. 30(2), 584\u2013594 (2024)","journal-title":"Nat. Med."},{"key":"4153_CR18","doi-asserted-by":"publisher","unstructured":"Krishnan, N.: AI agents: evolution, architecture, and real-world applications (2025). https:\/\/doi.org\/10.48550\/arXiv.2503.12687. arXiv: arXiv:2503.12687","DOI":"10.48550\/arXiv.2503.12687"},{"key":"4153_CR19","unstructured":"The Artificial Intelligence Clinician learns optimal treatment strategies for sepsis in intensive care\u2014PubMed. https:\/\/pubmed.ncbi.nlm.nih.gov\/30349085\/. Accessed 24 Mar 2025"},{"key":"4153_CR20","doi-asserted-by":"publisher","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-Net: convolutional networks for biomedical image segmentation (2015). https:\/\/doi.org\/10.48550\/arXiv.1505.04597. arXiv: arXiv:1505.04597","DOI":"10.48550\/arXiv.1505.04597"},{"key":"4153_CR21","doi-asserted-by":"crossref","unstructured":"Cheng, Z., Yang, Q., Sheng, B.: Deep colorization. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 415\u2013423 (2015). http:\/\/openaccess.thecvf.com\/content_iccv_2015\/html\/Cheng_Deep_Colorization_ICCV_2015_paper.html. Accessed 23 Mar 2025","DOI":"10.1109\/ICCV.2015.55"},{"key":"4153_CR22","doi-asserted-by":"publisher","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster R-CNN: towards real-time object detection with region proposal networks (2016). https:\/\/doi.org\/10.48550\/arXiv.1506.01497. arXiv: arXiv:1506.01497","DOI":"10.48550\/arXiv.1506.01497"},{"issue":"2","key":"4153_CR23","doi-asserted-by":"publisher","first-page":"994","DOI":"10.1109\/TIP.2018.2874285","volume":"28","author":"Y Wen","year":"2018","unstructured":"Wen, Y., Sheng, B., Li, P., Lin, W., Feng, D.D.: Deep color guided coarse-to-fine convolutional network cascade for depth image super-resolution. IEEE Trans. Image Process. 28(2), 994\u20131006 (2018)","journal-title":"IEEE Trans. Image Process."},{"key":"4153_CR24","doi-asserted-by":"publisher","first-page":"56559","DOI":"10.1109\/ACCESS.2020.2982187","volume":"8","author":"X Zeng","year":"2020","unstructured":"Zeng, X., Tong, S., Lu, Y., Xu, L., Huang, Z.: Adaptive medical image deep color perception algorithm. IEEE Access 8, 56559\u201356571 (2020). https:\/\/doi.org\/10.1109\/ACCESS.2020.2982187","journal-title":"IEEE Access"},{"key":"4153_CR25","doi-asserted-by":"publisher","unstructured":"Devlin, J., Chang, M.-W., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding (2019). https:\/\/doi.org\/10.48550\/arXiv.1810.04805. arXiv: arXiv:1810.04805","DOI":"10.48550\/arXiv.1810.04805"},{"key":"4153_CR26","doi-asserted-by":"publisher","unstructured":"Dai, Z., Yang, Z., Yang, Y., Carbonell, J., Le, Q.V., Salakhutdinov, R.: Transformer-XL: attentive language models beyond a fixed-length context (2019). https:\/\/doi.org\/10.48550\/arXiv.1901.02860. arXiv: arXiv:1901.02860","DOI":"10.48550\/arXiv.1901.02860"},{"key":"4153_CR27","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1109\/TMM.2021.3120873","volume":"25","author":"X Lin","year":"2023","unstructured":"Lin, X., Sun, S., Huang, W., Sheng, B., Li, P., Feng, D.D.: EAPT: efficient attention pyramid transformer for image processing. IEEE Trans. Multimed. 25, 50\u201361 (2023). https:\/\/doi.org\/10.1109\/TMM.2021.3120873","journal-title":"IEEE Trans. Multimed."},{"key":"4153_CR28","doi-asserted-by":"publisher","unstructured":"Vaswani, A., et al.: Attention is all you need (2023). https:\/\/doi.org\/10.48550\/arXiv.1706.03762. arXiv: arXiv:1706.03762","DOI":"10.48550\/arXiv.1706.03762"},{"key":"4153_CR29","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1016\/j.media.2018.06.001","volume":"48","author":"S Parisot","year":"2018","unstructured":"Parisot, S., et al.: Disease prediction using graph convolutional networks: application to Autism Spectrum Disorder and Alzheimer\u2019s disease. Med. Image Anal. 48, 117\u2013130 (2018). https:\/\/doi.org\/10.1016\/j.media.2018.06.001","journal-title":"Med. Image Anal."},{"issue":"8","key":"4153_CR30","doi-asserted-by":"publisher","first-page":"4499","DOI":"10.1109\/TNNLS.2021.3116209","volume":"34","author":"Z Xie","year":"2021","unstructured":"Xie, Z., Zhang, W., Sheng, B., Li, P., Chen, C.P.: Bagfn: broad attentive graph fusion network for high-order feature interactions. IEEE Trans. Neural Netw. Learn. Syst. 34(8), 4499\u20134513 (2021)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"4153_CR31","doi-asserted-by":"publisher","unstructured":"Chen, Z., Fu, L., Yao, J., Guo, W., Plant, C., Wang, S.: Learnable graph convolutional network and feature fusion for multi-view learning (2022). https:\/\/doi.org\/10.48550\/arXiv.2211.09155. arXiv: arXiv:2211.09155","DOI":"10.48550\/arXiv.2211.09155"},{"key":"4153_CR32","doi-asserted-by":"publisher","unstructured":"Singh, A., et al.: FLAVA: a foundational language and vision alignment model (2022). https:\/\/doi.org\/10.48550\/arXiv.2112.04482. arXiv: arXiv:2112.04482","DOI":"10.48550\/arXiv.2112.04482"},{"key":"4153_CR33","doi-asserted-by":"publisher","unstructured":"Radford, A., et al.: Learning transferable visual models from natural language supervision (2021). https:\/\/doi.org\/10.48550\/arXiv.2103.00020. arXiv: arXiv:2103.00020","DOI":"10.48550\/arXiv.2103.00020"},{"key":"4153_CR34","doi-asserted-by":"publisher","unstructured":"Wang, J., et al.: UFO: a unified transformer for vision-language representation learning (2021). https:\/\/doi.org\/10.48550\/arXiv.2111.10023. arXiv: arXiv:2111.10023","DOI":"10.48550\/arXiv.2111.10023"},{"key":"4153_CR35","doi-asserted-by":"publisher","unstructured":"Cheng, M., et al.: ViSTA: vision and scene text aggregation for cross-modal retrieval, (2022). https:\/\/doi.org\/10.48550\/arXiv.2203.16778. arXiv: arXiv:2203.16778","DOI":"10.48550\/arXiv.2203.16778"},{"key":"4153_CR36","doi-asserted-by":"publisher","unstructured":"Agarwal, K., Eftimov, T., Addanki, R., Choudhury, S., Tamang, S., Rallo, R.: Snomed2Vec: random walk and poincar\u00e9 embeddings of a clinical knowledge base for healthcare analytics (2019). https:\/\/doi.org\/10.48550\/arXiv.1907.08650. arXiv: arXiv:1907.08650","DOI":"10.48550\/arXiv.1907.08650"},{"key":"4153_CR37","doi-asserted-by":"publisher","first-page":"167","DOI":"10.18653\/v1\/2020.bionlp-1.18","volume":"2020","author":"D Chang","year":"2020","unstructured":"Chang, D., Bala\u017eevi\u0107, I., Allen, C., Chawla, D., Brandt, C., Taylor, R.A.: Benchmark and best practices for biomedical knowledge graph embeddings. Proc Conf Assoc Comput Linguist Meet 2020, 167\u2013176 (2020). https:\/\/doi.org\/10.18653\/v1\/2020.bionlp-1.18","journal-title":"Proc Conf Assoc Comput Linguist Meet"},{"key":"4153_CR38","doi-asserted-by":"publisher","unstructured":"Jiang, P., et al.: Reasoning-enhanced healthcare predictions with knowledge graph community retrieval (2024). https:\/\/doi.org\/10.48550\/arXiv.2410.04585. arXiv: arXiv:2410.04585","DOI":"10.48550\/arXiv.2410.04585"},{"issue":"10","key":"4153_CR39","doi-asserted-by":"publisher","first-page":"2633","DOI":"10.1038\/s41591-023-02552-9","volume":"29","author":"G Wang","year":"2023","unstructured":"Wang, G., et al.: Optimized glycemic control of type 2 diabetes with reinforcement learning: a proof-of-concept trial. Nat. Med. 29(10), 2633\u20132642 (2023). https:\/\/doi.org\/10.1038\/s41591-023-02552-9","journal-title":"Nat. Med."},{"issue":"5","key":"4153_CR40","doi-asserted-by":"publisher","first-page":"3114","DOI":"10.1109\/JBHI.2024.3377214","volume":"28","author":"D Tamboli","year":"2024","unstructured":"Tamboli, D., Chen, J., Jotheeswaran, K.P., Yu, D., Aggarwal, V.: Reinforced sequential decision-making for sepsis treatment: the PosNegDM framework with mortality classifier and transformer. IEEE J. Biomed. Health Inform. 28(5), 3114\u20133122 (2024). https:\/\/doi.org\/10.1109\/JBHI.2024.3377214","journal-title":"IEEE J. Biomed. Health Inform."},{"issue":"1","key":"4153_CR41","doi-asserted-by":"publisher","first-page":"337","DOI":"10.1038\/s41746-024-01316-0","volume":"7","author":"P Jayaraman","year":"2024","unstructured":"Jayaraman, P., Desman, J., Sabounchi, M., Nadkarni, G.N., Sakhuja, A.: A primer on reinforcement learning in medicine for clinicians. NPJ Digit. Med. 7(1), 337 (2024). https:\/\/doi.org\/10.1038\/s41746-024-01316-0","journal-title":"NPJ Digit. Med."},{"issue":"1","key":"4153_CR42","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1007\/s44230-025-00093-7","volume":"5","author":"R Tu","year":"2025","unstructured":"Tu, R., et al.: Offline safe reinforcement learning for sepsis treatment: tackling variable-length episodes with sparse rewards. Hum.-Cent. Intell. Syst. 5(1), 63\u201376 (2025). https:\/\/doi.org\/10.1007\/s44230-025-00093-7","journal-title":"Hum.-Cent. Intell. Syst."},{"key":"4153_CR43","unstructured":"Frontiers | CNN-TumorNet: leveraging explainability in deep learning for precise brain tumor diagnosis on MRI images. https:\/\/www.frontiersin.org\/journals\/oncology\/articles\/10.3389\/fonc.2025.1554559\/full. Accessed 6 Jul 2025"},{"issue":"10","key":"4153_CR44","doi-asserted-by":"publisher","first-page":"101213","DOI":"10.1016\/j.xcrm.2023.101213","volume":"4","author":"Z Guan","year":"2023","unstructured":"Guan, Z., et al.: Artificial intelligence in diabetes management: advancements, opportunities, and challenges. Cell Rep. Med. 4(10), 101213 (2023)","journal-title":"Cell Rep. Med."},{"issue":"1","key":"4153_CR45","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41746-024-01106-8","volume":"7","author":"C McGenity","year":"2024","unstructured":"McGenity, C., et al.: \u201cArtificial intelligence in digital pathology: a systematic review and meta-analysis of diagnostic test accuracy. npj Digit. Med. 7(1), 1\u201319 (2024). https:\/\/doi.org\/10.1038\/s41746-024-01106-8","journal-title":"npj Digit. Med."},{"issue":"8","key":"4153_CR46","doi-asserted-by":"publisher","first-page":"569","DOI":"10.1016\/S2213-8587(24)00154-2","volume":"12","author":"B Sheng","year":"2024","unstructured":"Sheng, B., et al.: Artificial intelligence for diabetes care: current and future prospects. Lancet Diabetes Endocrinol. 12(8), 569\u2013595 (2024)","journal-title":"Lancet Diabetes Endocrinol."},{"issue":"1","key":"4153_CR47","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1016\/j.jacc.2024.05.003","volume":"84","author":"R Khera","year":"2024","unstructured":"Khera, R., et al.: Transforming cardiovascular care with artificial intelligence: from discovery to practice. J. Am. Coll. Cardiol. 84(1), 97\u2013114 (2024). https:\/\/doi.org\/10.1016\/j.jacc.2024.05.003","journal-title":"J. Am. Coll. Cardiol."},{"issue":"5","key":"4153_CR48","doi-asserted-by":"publisher","first-page":"711","DOI":"10.1158\/2159-8290.CD-23-1199","volume":"14","author":"W Lotter","year":"2024","unstructured":"Lotter, W., Hassett, M.J., Schultz, N., Kehl, K.L., Van Allen, E.M., Cerami, E.: Artificial intelligence (AI) in oncology: current landscape, challenges, and future directions. Cancer Discov. 14(5), 711\u2013726 (2024). https:\/\/doi.org\/10.1158\/2159-8290.CD-23-1199","journal-title":"Cancer Discov."},{"issue":"1","key":"4153_CR49","doi-asserted-by":"publisher","first-page":"3242","DOI":"10.1038\/s41467-021-23458-5","volume":"12","author":"L Dai","year":"2021","unstructured":"Dai, L., et al.: A deep learning system for detecting diabetic retinopathy across the disease spectrum. Nat. Commun. 12(1), 3242 (2021)","journal-title":"Nat. Commun."},{"issue":"6","key":"4153_CR50","doi-asserted-by":"publisher","first-page":"100512","DOI":"10.1016\/j.patter.2022.100512","volume":"3","author":"R Liu","year":"2022","unstructured":"Liu, R., et al.: Deepdrid: Diabetic retinopathy\u2014grading and image quality estimation challenge. Patterns 3(6), 100512 (2022)","journal-title":"Patterns"},{"key":"4153_CR51","doi-asserted-by":"publisher","unstructured":"Qian, B., et al.: DRAC: diabetic retinopathy analysis challenge with ultra-wide optical coherence tomography angiography images (2023). https:\/\/doi.org\/10.48550\/arXiv.2304.02389. arXiv: arXiv:2304.02389","DOI":"10.48550\/arXiv.2304.02389"},{"issue":"7","key":"4153_CR52","first-page":"4925","volume":"65","author":"TY Wong","year":"2024","unstructured":"Wong, T.Y., et al.: An integrated image-based deep learning and language models for diabetic retinopathy: a multi-stage development, testing and prospective comparative study. Investig. Ophthalmol. Vis. Sci. 65(7), 4925 (2024)","journal-title":"Investig. Ophthalmol. Vis. Sci."},{"issue":"no. 11","key":"4153_CR53","doi-asserted-by":"publisher","first-page":"e2134254","DOI":"10.1001\/jamanetworkopen.2021.34254","volume":"4","author":"E Ipp","year":"2021","unstructured":"Ipp, E., et al.: Pivotal evaluation of an artificial intelligence system for autonomous detection of referrable and vision-threatening diabetic retinopathy. JAMA Netw. Open 4(11), e2134254 (2021). https:\/\/doi.org\/10.1001\/jamanetworkopen.2021.34254","journal-title":"JAMA Netw. Open"},{"key":"4153_CR54","doi-asserted-by":"publisher","DOI":"10.1016\/j.cmpb.2023.107879","volume":"243","author":"NA Wani","year":"2024","unstructured":"Wani, N.A., Kumar, R., Bedi, J.: Deepxplainer: an interpretable deep learning based approach for lung cancer detection using explainable artificial intelligence. Comput. Methods Programs Biomed. 243, 107879 (2024). https:\/\/doi.org\/10.1016\/j.cmpb.2023.107879","journal-title":"Comput. Methods Programs Biomed."},{"issue":"12","key":"4153_CR55","doi-asserted-by":"publisher","first-page":"7791","DOI":"10.1109\/TII.2020.2972918","volume":"16","author":"A Masood","year":"2020","unstructured":"Masood, A., et al.: Automated decision support system for lung cancer detection and classification via enhanced RFCN with multilayer fusion RPN. IEEE Trans. Ind. Inform. 16(12), 7791\u20137801 (2020). https:\/\/doi.org\/10.1109\/TII.2020.2972918","journal-title":"IEEE Trans. Ind. Inform."},{"issue":"7","key":"4153_CR56","first-page":"5644","volume":"65","author":"Y Wu","year":"2024","unstructured":"Wu, Y., Qian, B., Li, T., Guan, Z., Sheng, B., Wong, T.Y.: EyeNET, an integrated multimidal foundation model for ocular imaging. Investig. Ophthalmol. Vis. Sci. 65(7), 5644 (2024)","journal-title":"Investig. Ophthalmol. Vis. Sci."},{"issue":"1","key":"4153_CR57","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41746-023-00752-8","volume":"6","author":"LL Foo","year":"2023","unstructured":"Foo, L.L., et al.: Deep learning system to predict the 5-year risk of high myopia using fundus imaging in children. npj Digit. Med. 6(1), 1\u201310 (2023). https:\/\/doi.org\/10.1038\/s41746-023-00752-8","journal-title":"npj Digit. Med."},{"issue":"1","key":"4153_CR58","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41746-024-01204-7","volume":"7","author":"Z Qi","year":"2024","unstructured":"Qi, Z., et al.: A deep learning system for myopia onset prediction and intervention effectiveness evaluation in children. npj Digit. Med. 7(1), 1\u201310 (2024). https:\/\/doi.org\/10.1038\/s41746-024-01204-7","journal-title":"npj Digit. Med."},{"key":"4153_CR59","doi-asserted-by":"publisher","first-page":"3499","DOI":"10.2147\/OPTH.S438127","volume":"17","author":"M Nuliqiman","year":"2023","unstructured":"Nuliqiman, M., et al.: Artificial intelligence in ophthalmic surgery: current applications and expectations. Clin. Ophthalmol. 17, 3499\u20133511 (2023). https:\/\/doi.org\/10.2147\/OPTH.S438127","journal-title":"Clin. Ophthalmol."},{"key":"4153_CR60","doi-asserted-by":"publisher","unstructured":"Hemker, K., Simidjievski, N., Jamnik, M.: HEALNet: multimodal fusion for heterogeneous biomedical data (2024). https:\/\/doi.org\/10.48550\/arXiv.2311.09115. arXiv: arXiv:2311.09115","DOI":"10.48550\/arXiv.2311.09115"},{"issue":"5","key":"4153_CR61","doi-asserted-by":"publisher","first-page":"1149","DOI":"10.1109\/TMI.2018.2794988","volume":"37","author":"L Dai","year":"2018","unstructured":"Dai, L., et al.: Clinical report guided retinal microaneurysm detection with multi-sieving deep learning. IEEE Trans. Med. Imaging 37(5), 1149\u20131161 (2018)","journal-title":"IEEE Trans. Med. Imaging"},{"key":"4153_CR62","doi-asserted-by":"publisher","unstructured":"Tucci, V., Saary, J., Doyle, T.: Factors influencing trust in medical artificial intelligence for healthcare professionals: a narrative review. J. Med. Artif. Intell. 5 (2022). https:\/\/doi.org\/10.21037\/jmai-21-25","DOI":"10.21037\/jmai-21-25"},{"issue":"1","key":"4153_CR63","doi-asserted-by":"publisher","DOI":"10.1186\/s12911-020-01332-6","volume":"20","author":"J Amann","year":"2020","unstructured":"Amann, J., Blasimme, A., Vayena, E., Frey, D., Madai, V.I., the Precise4Q consortium: Explainability for artificial intelligence in healthcare: a multidisciplinary perspective. BMC Med. Inform. Decis. Mak. 20(1), 310 (2020). https:\/\/doi.org\/10.1186\/s12911-020-01332-6","journal-title":"BMC Med. Inform. Decis. Mak."},{"key":"4153_CR64","doi-asserted-by":"publisher","unstructured":"Xie, Y., et al.: A preliminary study of o1 in medicine: are we closer to an AI doctor? (2024). https:\/\/doi.org\/10.48550\/arXiv.2409.15277. arXiv: arXiv:2409.15277","DOI":"10.48550\/arXiv.2409.15277"},{"key":"4153_CR65","doi-asserted-by":"publisher","DOI":"10.1101\/2025.01.27.25321169","author":"G Mondillo","year":"2025","unstructured":"Mondillo, G., Colosimo, S., Perrotta, A., Frattolillo, V., Masino, M.: Comparative evaluation of advanced AI reasoning models in pediatric clinical decision support: ChatGPT O1 vs. DeepSeek-R1. Medrxiv (2025). https:\/\/doi.org\/10.1101\/2025.01.27.25321169","journal-title":"Medrxiv"},{"key":"4153_CR66","doi-asserted-by":"publisher","unstructured":"Fern\u00e1ndez-Lor\u00eda, C., Provost, F., Han, X.: Explaining data-driven decisions made by AI systems: the counterfactual approach (2021). https:\/\/doi.org\/10.48550\/arXiv.2001.07417. arXiv: arXiv:2001.07417","DOI":"10.48550\/arXiv.2001.07417"},{"key":"4153_CR67","doi-asserted-by":"publisher","DOI":"10.3389\/frai.2022.825565","author":"S Mertes","year":"2022","unstructured":"Mertes, S., Huber, T., Weitz, K., Heimerl, A., Andr\u00e9, E.: GANterfactual\u2014counterfactual explanations for medical non-experts using generative adversarial learning. Front. Artif. Intell. (2022). https:\/\/doi.org\/10.3389\/frai.2022.825565","journal-title":"Front. Artif. Intell."},{"issue":"CSCW2","key":"4153_CR68","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3610218","volume":"7","author":"MH Lee","year":"2023","unstructured":"Lee, M.H., Chew, C.J.: Understanding the effect of counterfactual explanations on trust and reliance on AI for human-AI collaborative clinical decision making. Proc. ACM Hum.-Comput. Interact. 7(CSCW2), 1\u201322 (2023). https:\/\/doi.org\/10.1145\/3610218","journal-title":"Proc. ACM Hum.-Comput. Interact."},{"key":"4153_CR69","doi-asserted-by":"publisher","unstructured":"Lundberg, S., Lee, S.-I.: A unified approach to interpreting model predictions (2017). https:\/\/doi.org\/10.48550\/arXiv.1705.07874. arXiv: arXiv:1705.07874","DOI":"10.48550\/arXiv.1705.07874"},{"key":"4153_CR70","doi-asserted-by":"publisher","unstructured":"Explainable AI-driven IoMT fusion: unravelling techniques, opportunities, and challenges with explainable AI in healthcare. Inf. Fusion 110, 102472 (2024). https:\/\/doi.org\/10.1016\/j.inffus.2024.102472","DOI":"10.1016\/j.inffus.2024.102472"},{"key":"4153_CR71","unstructured":"Synergizing fusion modeling for accurate cardiac prediction through explainable artificial intelligence | IEEE Journals & Magazine | IEEE Xplore. https:\/\/ieeexplore.ieee.org\/document\/10579789. Accessed 6 Jul 2025"},{"key":"4153_CR72","doi-asserted-by":"publisher","first-page":"22294","DOI":"10.18653\/v1\/2024.emnlp-main.1244","volume-title":"Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing","author":"W Shi","year":"2024","unstructured":"Shi, W., et al.: MedAdapter: efficient test-time adaptation of large language models towards medical reasoning. In: Al-Onaizan, Y., Bansal, M., Chen, Y.-N. (eds.) Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing, pp. 22294\u201322314. Association for Computational Linguistics, Miami (2024). https:\/\/doi.org\/10.18653\/v1\/2024.emnlp-main.1244"},{"key":"4153_CR73","doi-asserted-by":"publisher","unstructured":"Li, J., et al.: Agent hospital: a simulacrum of hospital with evolvable medical agents (2025). https:\/\/doi.org\/10.48550\/arXiv.2405.02957. arXiv: arXiv:2405.02957","DOI":"10.48550\/arXiv.2405.02957"},{"key":"4153_CR74","doi-asserted-by":"publisher","unstructured":"Hsu, H.-L., et al.: MedPlan: a two-stage RAG-based system for personalized medical plan generation (2025). https:\/\/doi.org\/10.48550\/arXiv.2503.17900. arXiv: arXiv:2503.17900","DOI":"10.48550\/arXiv.2503.17900"},{"key":"4153_CR75","doi-asserted-by":"publisher","DOI":"10.1056\/AIp2400289","author":"W Ma","year":"2024","unstructured":"Ma, W., et al.: Evolution of future medical AI models\u2014from task-specific, disease-centric to universal health. NEJM AI (2024). https:\/\/doi.org\/10.1056\/AIp2400289","journal-title":"NEJM AI"},{"key":"4153_CR76","doi-asserted-by":"publisher","first-page":"205520762311865","DOI":"10.1177\/20552076231186520","volume":"9","author":"E Sezgin","year":"2023","unstructured":"Sezgin, E.: Artificial intelligence in healthcare: complementing, not replacing, doctors and healthcare providers. Digit. Health 9, 20552076231186520 (2023). https:\/\/doi.org\/10.1177\/20552076231186520","journal-title":"Digit. Health"},{"key":"4153_CR77","doi-asserted-by":"publisher","first-page":"862322","DOI":"10.3389\/fsurg.2022.862322","volume":"9","author":"N Naik","year":"2022","unstructured":"Naik, N., et al.: Legal and ethical consideration in artificial intelligence in healthcare: who takes responsibility? Front. Surg. 9, 862322 (2022). https:\/\/doi.org\/10.3389\/fsurg.2022.862322","journal-title":"Front. Surg."},{"key":"4153_CR78","doi-asserted-by":"publisher","unstructured":"Raji, I.D., et al.: Closing the AI accountability gap: defining an end-to-end framework for internal algorithmic auditing (2020). https:\/\/doi.org\/10.48550\/arXiv.2001.00973. arXiv: arXiv:2001.00973","DOI":"10.48550\/arXiv.2001.00973"},{"key":"4153_CR79","unstructured":"Artificial Intelligence in healthcare\u2014European Commission. https:\/\/health.ec.europa.eu\/ehealth-digital-health-and-care\/artificial-intelligence-healthcare_en. Accessed 6 Jul 2025"},{"key":"4153_CR80","unstructured":"C. for D. and R. Health: Artificial Intelligence and machine learning in software as a medical device. FDA (2025). https:\/\/www.fda.gov\/medical-devices\/software-medical-device-samd\/artificial-intelligence-and-machine-learning-software-medical-device. Accessed 6 Jul 2025"},{"issue":"5","key":"4153_CR81","doi-asserted-by":"publisher","first-page":"e384","DOI":"10.1016\/S2589-7500(22)00003-6","volume":"4","author":"X Liu","year":"2022","unstructured":"Liu, X., Glocker, B., McCradden, M.M., Ghassemi, M., Denniston, A.K., Oakden-Rayner, L.: The medical algorithmic audit. Lancet Digit. Health 4(5), e384\u2013e397 (2022). https:\/\/doi.org\/10.1016\/S2589-7500(22)00003-6","journal-title":"Lancet Digit. Health"},{"issue":"2","key":"4153_CR82","doi-asserted-by":"publisher","first-page":"101419","DOI":"10.1016\/j.xcrm.2024.101419","volume":"5","author":"ZL Teo","year":"2024","unstructured":"Teo, Z.L., et al.: Federated machine learning in healthcare: a systematic review on clinical applications and technical architecture. Cell Rep. Med. 5(2), 101419 (2024). https:\/\/doi.org\/10.1016\/j.xcrm.2024.101419","journal-title":"Cell Rep. Med."},{"issue":"1","key":"4153_CR83","doi-asserted-by":"publisher","first-page":"12482","DOI":"10.1038\/s41598-025-97565-4","volume":"15","author":"R Haripriya","year":"2025","unstructured":"Haripriya, R., Khare, N., Pandey, M.: Privacy-preserving federated learning for collaborative medical data mining in multi-institutional settings. Sci. Rep. 15(1), 12482 (2025). https:\/\/doi.org\/10.1038\/s41598-025-97565-4","journal-title":"Sci. Rep."},{"issue":"1","key":"4153_CR84","doi-asserted-by":"publisher","first-page":"13061","DOI":"10.1038\/s41598-025-95858-2","volume":"15","author":"S Shukla","year":"2025","unstructured":"Shukla, S., Rajkumar, S., Sinha, A., Esha, M., Elango, K., Sampath, V.: Federated learning with differential privacy for breast cancer diagnosis enabling secure data sharing and model integrity. Sci. Rep. 15(1), 13061 (2025). https:\/\/doi.org\/10.1038\/s41598-025-95858-2","journal-title":"Sci. Rep."},{"key":"4153_CR85","doi-asserted-by":"publisher","unstructured":"Gawade, S., et al.: Multi agent based medical assistant for edge devices (2025). https:\/\/doi.org\/10.48550\/arXiv.2503.05397. arXiv: arXiv:2503.05397","DOI":"10.48550\/arXiv.2503.05397"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-025-04153-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-025-04153-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-025-04153-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T13:15:34Z","timestamp":1763644534000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-025-04153-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,25]]},"references-count":85,"journal-issue":{"issue":"15","published-print":{"date-parts":[[2025,12]]}},"alternative-id":["4153"],"URL":"https:\/\/doi.org\/10.1007\/s00371-025-04153-8","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,25]]},"assertion":[{"value":"22 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 August 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 September 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}