{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,8]],"date-time":"2026-01-08T11:31:59Z","timestamp":1767871919794,"version":"3.49.0"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T00:00:00Z","timestamp":1764979200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,1,8]],"date-time":"2026-01-08T00:00:00Z","timestamp":1767830400000},"content-version":"vor","delay-in-days":33,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BioData Mining"],"DOI":"10.1186\/s13040-025-00495-0","type":"journal-article","created":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T16:36:57Z","timestamp":1765039017000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Clinically aligned multi-modal image-text model for pan-cancer prognosis prediction"],"prefix":"10.1186","volume":"19","author":[{"given":"Jonghyun","family":"Lee","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jacob S.","family":"Leiby","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lina","family":"Takemaru","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yidi","family":"Huang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Myung-Giun","family":"Noh","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jaesik","family":"Kim","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Byonghan","family":"Lee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mattew E.","family":"Lee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Derek A.","family":"Oldridge","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Young-Gyu","family":"Eun","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hyun Jee","family":"Lee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Young Chan","family":"Lee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dokyoon","family":"Kim","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,12,6]]},"reference":[{"issue":"5","key":"495_CR1","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1038\/nrc3261","volume":"12","author":"A Marusyk","year":"2012","unstructured":"Marusyk A, Almendro V, Polyak K. Intra-tumour heterogeneity: a looking glass for cancer? Nat Rev Cancer. 2012;12(5):323\u201334.","journal-title":"Nat Rev Cancer"},{"issue":"12","key":"495_CR2","doi-asserted-by":"publisher","first-page":"930","DOI":"10.1038\/s44222-023-00096-8","volume":"1","author":"AH Song","year":"2023","unstructured":"Song AH, Jaume G, Williamson DF, Lu MY, Vaidya A, Miller TR, Mahmood F. Artificial intelligence for digital and computational pathology. Nat Rev Bioeng. 2023;1(12):930\u201349.","journal-title":"Nat Rev Bioeng"},{"key":"495_CR3","doi-asserted-by":"crossref","unstructured":"Xiang J, Wang X, Zhang X, Xi Y, Eweje F, Chen Y, Li Y, Bergstrom C, Gopaulchan M, Kim T, et al. A vision\u2013language foundation model for precision oncology. Nature. 2025;1\u201310.","DOI":"10.1038\/s41586-024-08378-w"},{"issue":"8035","key":"495_CR4","doi-asserted-by":"publisher","first-page":"970","DOI":"10.1038\/s41586-024-07894-z","volume":"634","author":"X Wang","year":"2024","unstructured":"Wang X, Zhao J, Marostica E, Yuan W, Jin J, Zhang J, Li R, Tang H, Wang K, Li Y, et al. A pathology foundation model for cancer diagnosis and prognosis prediction. Nature. 2024;634(8035):970\u201378.","journal-title":"Nature"},{"key":"495_CR5","doi-asserted-by":"crossref","unstructured":"Wang X, Yang S, Zhang J, Wang M, Zhang J, Yang W, Huang J, Han X. Transformer-based unsupervised contrastive learning for histopathological image classification. Med Image Anal. 2022;81, 102559.","DOI":"10.1016\/j.media.2022.102559"},{"key":"495_CR6","unstructured":"Vorontsov E, Bozkurt A, Casson A, Shaikovski G, Zelechowski M, Liu S, Severson K, Zimmermann E, Hall J, Tenenholtz N, et al. Virchow: a million-slide digital pathology foundation model. arXiv preprint arXiv:2309.07778. 2023."},{"key":"495_CR7","unstructured":"Ding T, Wagner SJ, Song AH, Chen RJ, Lu MY, Zhang A, Vaidya, AJ, Jaume G, Shaban M, Kim A, et al. Multimodal whole slide foundation model for pathology. arXiv preprint arXiv:2411.19666. 2024."},{"issue":"8015","key":"495_CR8","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1038\/s41586-024-07441-w","volume":"630","author":"H Xu","year":"2024","unstructured":"Xu H, Usuyama N, Bagga J, Zhang S, Rao R, Naumann T, Wong C, Gero Z, Gonz\u00b4alez J, Gu Y, et al. A whole-slide foundation model for digital pathology from real-world data. Nature. 2024;630(8015):181\u201388.","journal-title":"Nature"},{"issue":"9","key":"495_CR9","doi-asserted-by":"publisher","first-page":"2307","DOI":"10.1038\/s41591-023-02504-3","volume":"29","author":"Z Huang","year":"2023","unstructured":"Huang Z, Bianchi F, Yuksekgonul M, Montine TJ, Zou J. A visual\u2013language foundation model for pathology image analysis using medical twitter. Nat Med. 2023;29(9):2307\u201316.","journal-title":"Nat Med"},{"issue":"3","key":"495_CR10","doi-asserted-by":"publisher","first-page":"863","DOI":"10.1038\/s41591-024-02856-4","volume":"30","author":"MY Lu","year":"2024","unstructured":"Lu MY, Chen B, Williamson DF, Chen RJ, Liang I, Ding T, Jaume G, Odintsov I, Le LP, Gerber G, et al. A visual-language foundation model for computational pathology. Nat Med. 2024;30(3):863\u201374.","journal-title":"Nat Med"},{"issue":"3","key":"495_CR11","doi-asserted-by":"publisher","first-page":"850","DOI":"10.1038\/s41591-024-02857-3","volume":"30","author":"RJ Chen","year":"2024","unstructured":"Chen RJ, Ding T, Lu MY, Williamson DF, Jaume G, Song AH, Chen B, Zhang A, Shao D, Shaban M, et al. Towards a general-purpose foundation model for computational pathology. Nat Med. 2024;30(3):850\u201362.","journal-title":"Nat Med"},{"issue":"1","key":"495_CR12","doi-asserted-by":"publisher","first-page":"154","DOI":"10.1038\/s41591-021-01620-2","volume":"28","author":"W Bulten","year":"2022","unstructured":"Bulten W, Kartasalo K, Chen P-HC, Str\u00f6m P, Pinckaers H, Nagpal K, Cai Y, Steiner DF, Van Boven H, Vink R, et al. Artificial intelligence for diagnosis and gleason grading of prostate cancer: the panda challenge. Nat Med. 2022;28(1):154\u201363.","journal-title":"Nat Med"},{"issue":"1","key":"495_CR13","first-page":"355","volume":"10","author":"J Lee","year":"2024","unstructured":"Lee J, Ahn S, Kim H-S, An J, Sim J. A robust model training strategy using hard negative mining in a weakly labeled dataset for lymphatic invasion in gastric cancer. The J Pathol: Clin Res. 2024;10(1):355.","journal-title":"The J Pathol: Clin Res"},{"issue":"2","key":"495_CR14","doi-asserted-by":"publisher","first-page":"430","DOI":"10.3390\/cancers16020430","volume":"16","author":"J Lee","year":"2024","unstructured":"Lee J, Cha S, Kim J, Kim JJ, Kim N, Jae Gal, SG Kim, JH, Lee JH, Choi Y.-D, Kang, S.-R., et al. Ensemble deep learning model to predict lymphovascular invasion in gastric cancer. Cancers. 2024;16(2):430.","journal-title":"Cancers"},{"key":"495_CR15","doi-asserted-by":"crossref","unstructured":"Jeong Y, Cho CE, Kim J-E, Lee J, Kim N, Jung WY, Sung J, Kim, JH, Lee YJ, Jung J, et al. Deep learning model to predict epstein\u2013barr virus associated gastric cancer in histology. Sci Rep. 2022;12(1):18466.","DOI":"10.1038\/s41598-022-22731-x"},{"issue":"10","key":"495_CR16","doi-asserted-by":"publisher","first-page":"1559","DOI":"10.1038\/s41591-018-0177-5","volume":"24","author":"N Coudray","year":"2018","unstructured":"Coudray N, Ocampo PS, Sakellaropoulos T, Narula N, Snuderl M, Feny\u00f6 Moreira AL, Razavian N, Tsirigos A. Classification and mutation prediction from non\u2013small cell lung cancer histopathology images using deep learning. Nat Med. 2018;24(10):1559\u201367.","journal-title":"Nat Med"},{"issue":"6","key":"495_CR17","doi-asserted-by":"publisher","first-page":"555","DOI":"10.1038\/s41551-020-00682-w","volume":"5","author":"MY Lu","year":"2021","unstructured":"Lu MY, Williamson DF, Chen TY, Chen RJ, Barbieri M, Mahmood F. Data-efficient and weakly supervised computational pathology on whole-slide images. Nat Biomed Eng. 2021;5(6):555\u201370.","journal-title":"Nat Biomed Eng"},{"issue":"8","key":"495_CR18","doi-asserted-by":"publisher","first-page":"865","DOI":"10.1016\/j.ccell.2022.07.004","volume":"40","author":"RJ Chen","year":"2022","unstructured":"Chen RJ, Lu MY, Williamson DF, Chen TY, Lipkova J, Noor Z, Shaban M, Shady M, Williams M, Joo B, et al. Pan-cancer integrative histology-genomic analysis via multimodal deep learning. Cancer Cell. 2022;40(8):865\u201378.","journal-title":"Cancer Cell"},{"key":"495_CR19","doi-asserted-by":"crossref","unstructured":"Jaume G, Vaidya A, Chen RJ, Williamson DF, Liang PP, Mahmood F. Modeling dense multimodal interactions between biological pathways and histology for survival prediction. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2024, pp. 11579\u201390.","DOI":"10.1109\/CVPR52733.2024.01100"},{"key":"495_CR20","unstructured":"Song AH, Chen RJ, Jaume G, Vaidya AJ, Baras A, Mahmood F. Multimodal prototyping for cancer survival prediction. Forty-first International Conference on Machine Learning. 2024."},{"issue":"10221","key":"495_CR21","doi-asserted-by":"publisher","first-page":"350","DOI":"10.1016\/S0140-6736(19)32998-8","volume":"395","author":"O-J Skrede","year":"2020","unstructured":"Skrede O-J, De Raedt S, Kleppe A, Hveem TS, Liest\u00f8l K, Maddison J, Askautrud HA, Pradhan M, Nesheim JA, Albregtsen F, et al. Deep learning for prediction of colorectal cancer outcome: a discovery and validation study. The Lancet. 2020;395(10221):350\u201360.","journal-title":"The Lancet"},{"issue":"10","key":"495_CR22","doi-asserted-by":"publisher","first-page":"1519","DOI":"10.1038\/s41591-019-0583-3","volume":"25","author":"P Courtiol","year":"2019","unstructured":"Courtiol P, Maussion C, Moarii M, Pronier E, Pilcer S, Sefta M, Manceron P, Toldo S, Zaslavskiy M, Le Stang N, et al. Deep learning-based classification of mesothelioma improves prediction of patient outcome. Nat Med. 2019;25(10):1519\u201325.","journal-title":"Nat Med"},{"key":"495_CR23","doi-asserted-by":"crossref","unstructured":"Chen RJ, Lu MY, Weng W-H, Chen TY, Williamson DF, Manz T, Shady M, Mahmood F. Multimodal co-attention transformer for survival prediction in gigapixel whole slide images. Proceedings of the IEEE\/CVF International Conference on Computer Vision. 2021, pp. 4015\u201325.","DOI":"10.1109\/ICCV48922.2021.00398"},{"key":"495_CR24","doi-asserted-by":"crossref","unstructured":"Jaume G, Oldenburg L, Vaidya A, Chen RJ, Williamson DF, Peeters T, Song AH, Mahmood F. Transcriptomics-guided slide representation learning in computational pathology. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2024, pp. 9632\u201344.","DOI":"10.1109\/CVPR52733.2024.00920"},{"key":"495_CR25","doi-asserted-by":"crossref","unstructured":"Song AH, Chen RJ, Ding T, Williamson DF, Jaume G, Mahmood F. Morphological prototyping for unsupervised slide representation learning in computational pathology. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2024, pp. 11566\u201378.","DOI":"10.1109\/CVPR52733.2024.01099"},{"key":"495_CR26","doi-asserted-by":"crossref","unstructured":"Jaume G, Vaidya A, Zhang A, Song AH, Chen RJ, Sahai S, Mo D, Madrigal E, Phi Le L, Mahmood F. Multistain pretraining for slide representation learning in pathology. European Conference on Computer Vision. Springer; 2024, pp. 19\u201337.","DOI":"10.1007\/978-3-031-73414-4_2"},{"key":"495_CR27","doi-asserted-by":"crossref","unstructured":"Multimodal representations of biomedical knowledge from limited training whole slide images and reports using deep learning. Med Image Anal. 2024;97:103303.","DOI":"10.1016\/j.media.2024.103303"},{"key":"495_CR28","first-page":"67551","volume":"36","author":"L Qu","year":"2023","unstructured":"Qu L, Fu K, Wang M, Song Z, et al. The rise of ai language pathologists: exploring two-level prompt learning for few-shot weakly-supervised whole slide image classification. Adv Neural Inf Process Syst. 2023;36:67551\u201364.","journal-title":"Adv Neural Inf Process Syst"},{"key":"495_CR29","unstructured":"Zhang A, Jaume G, Vaidya A, Ding T, Mahmood F. Accelerating data processing and benchmarking of ai models for pathology. arXiv preprint arXiv:2502.06750. 2025."},{"key":"495_CR30","doi-asserted-by":"crossref","unstructured":"Kefeli J, Tatonetti N. Tcga-reports: a machine-readable pathology report resource for benchmarking text-based AI models. Patterns. 2024;5(3).","DOI":"10.1016\/j.patter.2024.100933"},{"key":"495_CR31","unstructured":"Dubey A, Jauhri A, Pandey A, Kadian A, Al-Dahle A, Letman A, Mathur A, Schelten A, Yang, A, Fan A, et al. The llama 3 herd of models. arxiv E-Prints. 2024;2407."},{"issue":"1","key":"495_CR32","first-page":"1","volume":"3","author":"Y Gu","year":"2021","unstructured":"Gu Y, Tinn R, Cheng H, Lucas M, Usuyama N, Liu X, Naumann T, Gao J, Poon H. Domain-specific language model pretraining for biomedical natural language processing. ACM Trans On Comput For Healthcare (health). 2021;3(1):1\u201323.","journal-title":"ACM Trans On Comput For Healthcare (health)"},{"key":"495_CR33","unstructured":"Ilse M, Tomczak J, Welling M. Attention-based deep multiple instance learning. International Conference on Machine Learning. PMLR; 2018, pp. 2127\u201336."},{"issue":"9","key":"495_CR34","doi-asserted-by":"publisher","first-page":"3126","DOI":"10.1109\/TPAMI.2020.2979450","volume":"43","author":"SG Zadeh","year":"2020","unstructured":"Zadeh SG, Schmid M. Bias in cross-entropy-based training of deep survival networks. IEEE Trans On Pattern Anal And Mach Intel. 2020;43(9):3126\u201337.","journal-title":"IEEE Trans On Pattern Anal And Mach Intel"},{"issue":"2","key":"495_CR35","first-page":"3","volume":"1","author":"EJ Hu","year":"2022","unstructured":"Hu EJ, Shen Y, Wallis P, Allen-Zhu Z, Li Y, Wang S, Wang L, Chen W, et al. Lora: low-rank adaptation of large language models. ICLR. 2022;1(2):3.","journal-title":"ICLR"},{"key":"495_CR36","doi-asserted-by":"crossref","unstructured":"Wang W, Bao H, Dong L, Bjorck J, Peng Z, Liu Q, Aggarwal K, Mohammed, OK, Singhal, S, Som S, et al. Image as a foreign language: beit pretraining for vision and vision-language tasks. Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2023, pp. 19175\u201386.","DOI":"10.1109\/CVPR52729.2023.01838"}],"container-title":["BioData Mining"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-025-00495-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13040-025-00495-0","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-025-00495-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,8]],"date-time":"2026-01-08T07:09:46Z","timestamp":1767856186000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1186\/s13040-025-00495-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,6]]},"references-count":36,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2026,12]]}},"alternative-id":["495"],"URL":"https:\/\/doi.org\/10.1186\/s13040-025-00495-0","relation":{},"ISSN":["1756-0381"],"issn-type":[{"value":"1756-0381","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12,6]]},"assertion":[{"value":"31 July 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 October 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 December 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The retrospective study involving the KHMC-HNSC cohort was approved by the Institutional Review Board of Kyung Hee University Medical Center (approval number: KHNMC 2024\u201306-005\u2013002). The need for informed consent was waived due to the retrospective nature of the study and the use of de-identified data.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"The authors declare no competing interests.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"4"}}