{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T16:52:29Z","timestamp":1774025549796,"version":"3.50.1"},"reference-count":33,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2025,3,24]],"date-time":"2025-03-24T00:00:00Z","timestamp":1742774400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,3,24]],"date-time":"2025-03-24T00:00:00Z","timestamp":1742774400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Mach Intell"],"DOI":"10.1038\/s42256-025-01016-8","type":"journal-article","created":{"date-parts":[[2025,3,24]],"date-time":"2025-03-24T11:12:14Z","timestamp":1742814734000},"page":"661-671","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["A disease-specific language model for variant pathogenicity in cardiac and regulatory genomics"],"prefix":"10.1038","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8926-1941","authenticated-orcid":false,"given":"Huixin","family":"Zhan","sequence":"first","affiliation":[]},{"given":"Jason H.","family":"Moore","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2016-8014","authenticated-orcid":false,"given":"Zijun","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,3,24]]},"reference":[{"key":"1016_CR1","doi-asserted-by":"publisher","first-page":"415","DOI":"10.1038\/nrg3493","volume":"14","author":"SH Katsanis","year":"2013","unstructured":"Katsanis, S. H. & Katsanis, N. Molecular genetic testing and the future of clinical genomics. Nat. Rev. Genet. 14, 415\u2013426 (2013).","journal-title":"Nat. Rev. Genet."},{"key":"1016_CR2","doi-asserted-by":"publisher","first-page":"1497","DOI":"10.2215\/CJN.15141219","volume":"15","author":"E Cocchi","year":"2020","unstructured":"Cocchi, E., Nestor, J. G. & Gharavi, A. G. Clinical genetic screening in adult patients with kidney disease. Clin. J. Am. Soc. Nephrol. 15, 1497 (2020).","journal-title":"Clin. J. Am. Soc. Nephrol."},{"key":"1016_CR3","doi-asserted-by":"publisher","first-page":"691","DOI":"10.1038\/d41573-023-00098-6","volume":"22","author":"W Xie","year":"2023","unstructured":"Xie, W., Chen, B. & Wong, J. Genomic medicines: the coming waves? Nat. Rev. Drug Discov. 22, 691\u2013692 (2023).","journal-title":"Nat. Rev. Drug Discov."},{"key":"1016_CR4","doi-asserted-by":"publisher","first-page":"2059","DOI":"10.1016\/j.jacc.2023.03.419","volume":"81","author":"H Ni","year":"2023","unstructured":"Ni, H. et al. Screening for dilated cardiomyopathy in at-risk first-degree relatives. J. Am. Coll. Cardiol. 81, 2059\u20132071 (2023).","journal-title":"J. Am. Coll. Cardiol."},{"key":"1016_CR5","doi-asserted-by":"publisher","first-page":"887","DOI":"10.1016\/j.cell.2019.06.036","volume":"178","author":"J-M Lee","year":"2019","unstructured":"Lee, J.-M. et al. CAG repeat not polyglutamine length determines timing of Huntington\u2019s disease onset. Cell 178, 887\u2013900 (2019).","journal-title":"Cell"},{"key":"1016_CR6","doi-asserted-by":"publisher","first-page":"000067","DOI":"10.1161\/HCG.0000000000000067","volume":"13","author":"K Musunuru","year":"2020","unstructured":"Musunuru, K. et al. Genetic testing for inherited cardiovascular diseases: a scientific statement from the american heart association. Circ. Genom. Precis. Med. 13, 000067 (2020).","journal-title":"Circ. Genom. Precis. Med."},{"key":"1016_CR7","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1038\/gim.2015.30","volume":"17","author":"S Richards","year":"2015","unstructured":"Richards, S. et al. Standards and guidelines for the interpretation of sequence variants: a joint consensus recommendation of the American College of Medical Genetics and Genomics and the Association for Molecular Pathology. Genet. Med. 17, 405\u2013423 (2015).","journal-title":"Genet. Med."},{"key":"1016_CR8","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1038\/s41586-021-04043-8","volume":"599","author":"J Frazer","year":"2021","unstructured":"Frazer, J. et al. Disease variant prediction with deep generative models of evolutionary data. Nature 599, 91\u201395 (2021).","journal-title":"Nature"},{"key":"1016_CR9","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1093\/nar\/gkr407","volume":"39","author":"B Reva","year":"2011","unstructured":"Reva, B., Antipin, Y. & Sander, C. Predicting the functional impact of protein mutations: application to cancer genomics. Nucleic Acids Res. 39, 118 (2011).","journal-title":"Nucleic Acids Res."},{"key":"1016_CR10","doi-asserted-by":"publisher","first-page":"886","DOI":"10.1093\/nar\/gky1016","volume":"47","author":"P Rentzsch","year":"2019","unstructured":"Rentzsch, P., Witten, D., Cooper, G. M., Shendure, J. & Kircher, M. CADD: predicting the deleteriousness of variants throughout the human genome. Nucleic Acids Res. 47, 886\u2013894 (2019).","journal-title":"Nucleic Acids Res."},{"key":"1016_CR11","doi-asserted-by":"publisher","first-page":"980","DOI":"10.1093\/nar\/gkt1113","volume":"42","author":"MJ Landrum","year":"2014","unstructured":"Landrum, M. J. et al. Clinvar: public archive of relationships among sequence variation and human phenotype. Nucleic Acids Res. 42, 980\u2013985 (2014).","journal-title":"Nucleic Acids Res."},{"key":"1016_CR12","unstructured":"Rao, R. M. et al. MSA transformer. In International Conference on Machine Learning (eds Meila, M. & Zhang, T.) 8844\u20138856 (PMLR, 2021)."},{"key":"1016_CR13","doi-asserted-by":"publisher","first-page":"7492","DOI":"10.1126\/science.adg7492","volume":"381","author":"J Cheng","year":"2023","unstructured":"Cheng, J. et al. Accurate proteome-wide missense variant effect prediction with alphamissense. Science 381, 7492 (2023).","journal-title":"Science"},{"key":"1016_CR14","doi-asserted-by":"publisher","first-page":"1512","DOI":"10.1038\/s41588-023-01465-0","volume":"55","author":"N Brandes","year":"2023","unstructured":"Brandes, N., Goldman, G., Wang, C. H., Ye, C. J. & Ntranos, V. Genome-wide prediction of disease variant effects with a deep protein language model. Nat. Genet. 55, 1512\u20131522 (2023).","journal-title":"Nat. Genet."},{"key":"1016_CR15","doi-asserted-by":"publisher","first-page":"1617","DOI":"10.1038\/s41587-022-01432-w","volume":"40","author":"R Chowdhury","year":"2022","unstructured":"Chowdhury, R. et al. Single-sequence protein structure prediction using a language model and deep learning. Nat. Biotechnol. 40, 1617\u20131623 (2022).","journal-title":"Nat. Biotechnol."},{"key":"1016_CR16","doi-asserted-by":"publisher","first-page":"1576","DOI":"10.1038\/s41587-022-01466-0","volume":"40","author":"JM Michaud","year":"2022","unstructured":"Michaud, J. M., Madani, A. & Fraser, J. S. A language model beats AlphaFold2 on orphans. Nat. Biotechnol. 40, 1576\u20131577 (2022).","journal-title":"Nat. Biotechnol."},{"key":"1016_CR17","doi-asserted-by":"publisher","first-page":"747","DOI":"10.1038\/nature08494","volume":"461","author":"TA Manolio","year":"2009","unstructured":"Manolio, T. A. et al. Finding the missing heritability of complex diseases. Nature 461, 747\u2013753 (2009).","journal-title":"Nature"},{"key":"1016_CR18","doi-asserted-by":"publisher","first-page":"174","DOI":"10.1016\/j.cmet.2015.01.013","volume":"21","author":"EM McNally","year":"2015","unstructured":"McNally, E. M., Barefield, D. Y. & Puckelwartz, M. J. The genetic landscape of cardiomyopathy and its role in heart failure. Cell Metab. 21, 174\u2013182 (2015).","journal-title":"Cell Metab."},{"key":"1016_CR19","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1038\/s41436-020-00972-3","volume":"23","author":"X Zhang","year":"2021","unstructured":"Zhang, X. et al. Disease-specific variant pathogenicity prediction significantly improves variant interpretation in inherited cardiac conditions. Genet. Med. 23, 69\u201379 (2021).","journal-title":"Genet. Med."},{"key":"1016_CR20","unstructured":"Han, L., Kashyap, A.L., Finin, T., Mayfield, J. & Weese, J. Umbc_ebiquity-core: semantic textual similarity systems. In Second Joint Conference on Lexical and Computational Semantics (* SEM) (eds Diab, M. et al.) Vol. 1, 44\u201352 (Association for Computational Linguistics, 2013)."},{"key":"1016_CR21","doi-asserted-by":"crossref","unstructured":"Reimers, N. & Gurevych, I. Sentence-BERT: sentence embeddings using Siamese BERT-networks. In Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (eds Pad\u00f3, S. & Huang, R.) 3982\u20133992 (Association for Computational Linguistics, 2019).","DOI":"10.18653\/v1\/D19-1410"},{"key":"1016_CR22","unstructured":"Zhou, Z. et al. DNABERT-2: efficient foundation model and benchmark for multi-species genome. In Proceedings of the Twelfth International Conference on Learning Representations (ed. Kim, B.) (ICLR, 2024)."},{"key":"1016_CR23","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1016\/j.molcel.2018.10.037","volume":"73","author":"R Chong","year":"2019","unstructured":"Chong, R. et al. A multiplexed assay for exon recognition reveals that an unappreciated fraction of rare genetic variants cause large-effect splicing disruptions. Mol. Cell 73, 183\u2013194 (2019).","journal-title":"Mol. Cell"},{"key":"1016_CR24","doi-asserted-by":"publisher","first-page":"2016239118","DOI":"10.1073\/pnas.2016239118","volume":"118","author":"A Rives","year":"2021","unstructured":"Rives, A. et al. Biological structure and function emerge from scaling unsupervised learning to 250 million protein sequences. Proc. Natl Acad. Sci. USA 118, 2016239118 (2021).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"1016_CR25","doi-asserted-by":"publisher","first-page":"1123","DOI":"10.1126\/science.ade2574","volume":"379","author":"Z Lin","year":"2023","unstructured":"Lin, Z. et al. Evolutionary-scale prediction of atomic-level protein structure with a language model. Science 379, 1123\u20131130 (2023).","journal-title":"Science"},{"key":"1016_CR26","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1093\/bib\/bbaa303","volume":"22","author":"SK Ata","year":"2021","unstructured":"Ata, S. K. et al. Recent advances in network-based methods for disease gene prediction. Brief. Bioinform. 22, 303 (2021).","journal-title":"Brief. Bioinform."},{"key":"1016_CR27","doi-asserted-by":"publisher","first-page":"643","DOI":"10.1093\/bioinformatics\/btad643","volume":"39","author":"M Chatzianastasis","year":"2023","unstructured":"Chatzianastasis, M., Vazirgiannis, M. & Zhang, Z. Explainable multilayer graph neural network for cancer gene prediction. Bioinformatics 39, 643 (2023).","journal-title":"Bioinformatics"},{"key":"1016_CR28","doi-asserted-by":"publisher","first-page":"583","DOI":"10.1038\/s41586-021-03819-2","volume":"596","author":"J Jumper","year":"2021","unstructured":"Jumper, J. et al. Highly accurate protein structure prediction with AlphaFold. Nature 596, 583\u2013589 (2021).","journal-title":"Nature"},{"key":"1016_CR29","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1093\/nar\/gkv1344","volume":"44","author":"RD Finn","year":"2016","unstructured":"Finn, R. D. et al. The Pfam protein families database: towards a more sustainable future. Nucleic Acids Res. 44, 279\u2013285 (2016).","journal-title":"Nucleic Acids Res."},{"key":"1016_CR30","doi-asserted-by":"crossref","unstructured":"McLachlan, G. J. & Krishnan, T. The EM Algorithm and Extensions (John Wiley & Sons, 2007).","DOI":"10.1002\/9780470191613"},{"key":"1016_CR31","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1038\/s41576-022-00532-2","volume":"24","author":"G Novakovsky","year":"2023","unstructured":"Novakovsky, G., Dexter, N., Libbrecht, M. W., Wasserman, W. W. & Mostafavi, S. Obtaining genetics insights from deep learning via explainable artificial intelligence. Nat. Rev. Genet. 24, 125\u2013137 (2023).","journal-title":"Nat. Rev. Genet."},{"key":"1016_CR32","doi-asserted-by":"publisher","unstructured":"Zhan, H. & Zhang, Z. Dataset for DYNA: a disease specific language model for variant pathogenicity. Zenodo https:\/\/doi.org\/10.5281\/zenodo.13397296 (2024).","DOI":"10.5281\/zenodo.13397296"},{"key":"1016_CR33","doi-asserted-by":"publisher","unstructured":"Zhan, H., Moore, J. & Zhang, Z. zhanglab-aim\/DYNA: a disease specific language model for variant pathogenicity. Zenodo https:\/\/doi.org\/10.5281\/zenodo.14083637 (2024).","DOI":"10.5281\/zenodo.14083637"}],"container-title":["Nature Machine Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-01016-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-01016-8","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-01016-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,22]],"date-time":"2025-04-22T22:03:18Z","timestamp":1745359398000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-01016-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,24]]},"references-count":33,"journal-issue":{"issue":"4","published-online":{"date-parts":[[2025,4]]}},"alternative-id":["1016"],"URL":"https:\/\/doi.org\/10.1038\/s42256-025-01016-8","relation":{},"ISSN":["2522-5839"],"issn-type":[{"value":"2522-5839","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3,24]]},"assertion":[{"value":"10 July 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 February 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 March 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}