{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T03:29:23Z","timestamp":1774409363465,"version":"3.50.1"},"reference-count":88,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T00:00:00Z","timestamp":1743033600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T00:00:00Z","timestamp":1743033600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Mach Intell"],"DOI":"10.1038\/s42256-025-01011-z","type":"journal-article","created":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T10:09:38Z","timestamp":1743070178000},"page":"580-591","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":19,"title":["A text-guided protein design framework"],"prefix":"10.1038","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2030-2367","authenticated-orcid":false,"given":"Shengchao","family":"Liu","sequence":"first","affiliation":[]},{"given":"Yanjing","family":"Li","sequence":"additional","affiliation":[]},{"given":"Zhuoxinran","family":"Li","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5324-9833","authenticated-orcid":false,"given":"Anthony","family":"Gitter","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9432-3251","authenticated-orcid":false,"given":"Yutao","family":"Zhu","sequence":"additional","affiliation":[]},{"given":"Jiarui","family":"Lu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2618-7462","authenticated-orcid":false,"given":"Zhao","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Weili","family":"Nie","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1622-5488","authenticated-orcid":false,"given":"Arvind","family":"Ramanathan","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7043-4926","authenticated-orcid":false,"given":"Chaowei","family":"Xiao","sequence":"additional","affiliation":[]},{"given":"Jian","family":"Tang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7663-2421","authenticated-orcid":false,"given":"Hongyu","family":"Guo","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6974-6797","authenticated-orcid":false,"given":"Anima","family":"Anandkumar","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,3,27]]},"reference":[{"key":"1011_CR1","doi-asserted-by":"publisher","first-page":"102713","DOI":"10.1016\/j.copbio.2022.102713","volume":"75","author":"CR Freschlin","year":"2022","unstructured":"Freschlin, C. R., Fahlberg, S. A. & Romero, P. A. Machine learning to navigate fitness landscapes for protein engineering. Curr. Opin. Biotechnol. 75, 102713 (2022).","journal-title":"Curr. Opin. Biotechnol."},{"key":"1011_CR2","doi-asserted-by":"publisher","first-page":"583","DOI":"10.1038\/s41586-021-03819-2","volume":"596","author":"J Jumper","year":"2021","unstructured":"Jumper, J. et al. Highly accurate protein structure prediction with AlphaFold. Nature 596, 583\u2013589 (2021).","journal-title":"Nature"},{"key":"1011_CR3","doi-asserted-by":"crossref","unstructured":"Zhong, E. D., Lerer, A., Davis, J. H. & Berger, B. CryoDRGN2: ab initio neural reconstruction of 3D protein structures from real cryo-EM images. In 2021 IEEE\/CVF International Conference on Computer Vision (ICCV), 4046\u20134055 (IEEE, 2021).","DOI":"10.1109\/ICCV48922.2021.00403"},{"key":"1011_CR4","doi-asserted-by":"crossref","unstructured":"Hsu, C. et al. Learning inverse folding from millions of predicted structures. Proc. Mach. Learning Res. 162, 8946\u20138970 (2022).","DOI":"10.1101\/2022.04.10.487779"},{"key":"1011_CR5","doi-asserted-by":"crossref","unstructured":"Rao, R. M. et al. MSA Transformer. Proc. Mach. Learning Res. 139, 8844\u20138856 (2021).","DOI":"10.1101\/2021.02.12.430858"},{"key":"1011_CR6","doi-asserted-by":"crossref","unstructured":"Elnaggar, A. et al. ProtTrans: toward understanding the language of life through self-supervised learning. IEEE Trans. Pattern Anal. Mach. Intell. 44, 7112\u20137127 (2022).","DOI":"10.1109\/TPAMI.2021.3095381"},{"key":"1011_CR7","doi-asserted-by":"crossref","unstructured":"Meier, J. et al. Language models enable zero-shot prediction of the effects of mutations on protein function. Adv. Neural Inf. Process. Syst. 34, 29287\u201329303 (2021).","DOI":"10.1101\/2021.07.09.450648"},{"key":"1011_CR8","doi-asserted-by":"crossref","unstructured":"Li, M. et al. SESNet: sequence\u2013structure feature-integrated deep learning method for data-efficient protein engineering. J. Cheminformatics 15, 12 (2023).","DOI":"10.1186\/s13321-023-00688-x"},{"key":"1011_CR9","unstructured":"Jing, B., Eismann, S., Suriana, P., Townshend, R. J. L. & Dror, R. Learning from protein structure with geometric vector perceptrons. In International Conference on Learning Representations (2021)."},{"key":"1011_CR10","unstructured":"Wang, L., Liu, H., Liu, Y., Kurtin, J. & Ji, S. Learning protein representations via complete 3D graph networks. In The Eleventh International Conference on Learning Representations (2023)."},{"key":"1011_CR11","unstructured":"Radford, A. et al. Learning transferable visual models from natural language supervision. Proc. Mach. Learning Res. 139, 8748\u20138763 (2021)."},{"key":"1011_CR12","unstructured":"Nichol, A. Q. et al. GLIDE: towards photorealistic image generation and editing with text-guided diffusion models. Proc. Mach. Learning Res. 162, 16784\u201316804 (2022)."},{"key":"1011_CR13","doi-asserted-by":"publisher","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., Chu, C. & Chen, M. Hierarchical text-conditional image generation with clip latents. Preprint at https:\/\/doi.org\/10.48550\/arXiv.2204.06125 (2022).","DOI":"10.48550\/arXiv.2204.06125"},{"key":"1011_CR14","doi-asserted-by":"crossref","unstructured":"Patashnik, O., Wu, Z., Shechtman, E., Cohen-Or, D. & Lischinski, D. StyleCLIP: text-driven manipulation of StyleGAN imagery. In Proc. IEEE\/CVF International Conference on Computer Vision (ICCV) 2065\u20132074 (IEEE, 2021).","DOI":"10.1109\/ICCV48922.2021.00209"},{"key":"1011_CR15","unstructured":"Liu, S., Qu, M., Zhang, Z., Cai, H. & Tang, J. Structured multi-task learning for molecular property prediction. Proc. Mach. Learning Res. 151, 8906\u20138920 (2022)."},{"key":"1011_CR16","doi-asserted-by":"crossref","unstructured":"Edwards, C., Zhai, C. & Ji, H. Text2mol: cross-modal molecule retrieval with natural language queries. In Proc. 2021 Conference on Empirical Methods in Natural Language Processing (eds Moens, M.-F. et al.) 595\u2013607 (Association for Computational Linguistics, 2021).","DOI":"10.18653\/v1\/2021.emnlp-main.47"},{"key":"1011_CR17","doi-asserted-by":"publisher","first-page":"862","DOI":"10.1038\/s41467-022-28494-3","volume":"13","author":"Z Zeng","year":"2022","unstructured":"Zeng, Z., Yao, Y., Liu, Z. & Sun, M. A deep-learning system bridging molecule structure and biomedical text with comprehension comparable to human professionals. Nat. Commun. 13, 862 (2022).","journal-title":"Nat. Commun."},{"key":"1011_CR18","doi-asserted-by":"publisher","first-page":"1447","DOI":"10.1038\/s42256-023-00759-6","volume":"5","author":"S Liu","year":"2023","unstructured":"Liu, S. et al. Multi-modal molecule structure\u2013text model for text-based retrieval and editing. Nat. Mach. Intell. 5, 1447\u20131457 (2023).","journal-title":"Nat. Mach. Intell."},{"key":"1011_CR19","unstructured":"Liu, S. et al. Conversational drug editing using retrieval and domain feedback. In The Twelfth International Conference on Learning Representations (2024)."},{"key":"1011_CR20","doi-asserted-by":"crossref","unstructured":"The UniProt Consortium The Universal Protein Resource (UniProt). Nucleic Acids Res. 36, D190\u2013D195 (2007).","DOI":"10.1093\/nar\/gkm895"},{"key":"1011_CR21","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1038\/75556","volume":"25","author":"M Ashburner","year":"2000","unstructured":"Ashburner, M. et al. Gene Ontology: tool for the unification of biology. Nat. Genet. 25, 25\u201329 (2000).","journal-title":"Nat. Genet."},{"key":"1011_CR22","unstructured":"UniProt. Uniprotkg\/swiss-prot (2023); https:\/\/www.uniprot.org"},{"key":"1011_CR23","doi-asserted-by":"crossref","unstructured":"Boutet, E., Lieberherr, D., Tognolli, M., Schneider, M. & Bairoch, A. in Plant Bioinformatics (ed. Edwards, D.) 89\u2013112 (Springer, 2007).","DOI":"10.1007\/978-1-59745-535-0_4"},{"key":"1011_CR24","doi-asserted-by":"crossref","unstructured":"Branden, C. I. & Tooze, J. Introduction to Protein Structure (Garland, 2012).","DOI":"10.1201\/9781136969898"},{"key":"1011_CR25","unstructured":"Devlin, J., Chang, M.-W., Lee, K. & Toutanova, K. BERT: pre-training of deep bidirectional transformers for language understanding. In Proc. 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers) (eds Burstein, J. et al.) 4171\u20134186 (Association for Computational Linguistics, 2019)."},{"key":"1011_CR26","doi-asserted-by":"publisher","unstructured":"Vaswani, A. et al. Attention is all you need. Adv. Neural Inf. Process. Syst. https:\/\/doi.org\/10.48550\/arXiv.1706.03762 (2017).","DOI":"10.48550\/arXiv.1706.03762"},{"key":"1011_CR27","doi-asserted-by":"publisher","first-page":"603","DOI":"10.1038\/s41592-019-0437-4","volume":"16","author":"M Steinegger","year":"2019","unstructured":"Steinegger, M., Mirdita, M. & S\u00f6ding, J. Protein-level assembly increases protein sequence recovery from metagenomic samples manyfold. Nat. Methods 16, 603\u2013606 (2019).","journal-title":"Nat. Methods"},{"key":"1011_CR28","doi-asserted-by":"publisher","first-page":"2542","DOI":"10.1038\/s41467-018-04964-5","volume":"9","author":"M Steinegger","year":"2018","unstructured":"Steinegger, M. & S\u00f6ding, J. Clustering huge protein sequence sets in linear time. Nat. Commun. 9, 2542 (2018).","journal-title":"Nat. Commun."},{"key":"1011_CR29","doi-asserted-by":"crossref","unstructured":"Beltagy, I., Lo, K. & Cohan, A. SciBERT: a pretrained language model for scientific text. In Proc. 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP) (eds Inui, K. et al.) 3615\u20133620 (Association for Computational Linguistics, 2019).","DOI":"10.18653\/v1\/D19-1371"},{"key":"1011_CR30","doi-asserted-by":"publisher","first-page":"145","DOI":"10.5195\/jmla.2018.280","volume":"106","author":"S Fricke","year":"2018","unstructured":"Fricke, S. Semantic Scholar. J. Med. Libr. Assoc. 106, 145\u2013147 (2018).","journal-title":"J. Med. Libr. Assoc."},{"key":"1011_CR31","unstructured":"Taylor, R. et al. Galactica: a large language model for science. Preprint at https:\/\/arxiv.org\/abs\/2211.09085 (2022)."},{"key":"1011_CR32","unstructured":"Li, Y., Xu, H., Zhao, H., Guo, H. & Liu, S. ChatPathway: conversational large language models for biology pathway detection. In NeurIPS 2023 AI for Science Workshop (2023)."},{"key":"1011_CR33","doi-asserted-by":"publisher","first-page":"585","DOI":"10.1038\/s41587-023-01788-7","volume":"41","author":"N Savage","year":"2023","unstructured":"Savage, N. Drug discovery companies are customizing ChatGPT: here\u2019s how. Nat. Biotechnol. 41, 585\u2013586 (2023).","journal-title":"Nat. Biotechnol."},{"key":"1011_CR34","doi-asserted-by":"crossref","unstructured":"Gao, Z. et al. Empowering diffusion models on the embedding space for text generation. In Proc. 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers) (eds Duh, K. et al.) 4664\u20134683 (Association for Computational Linguistics, 2024).","DOI":"10.18653\/v1\/2024.naacl-long.261"},{"key":"1011_CR35","unstructured":"Lin, Z. et al. Text generation with diffusion language models: a pre-training approach with continuous paragraph denoise. Proc. Mach. Learning Res. 202, 21051\u201321064 (2023)."},{"key":"1011_CR36","doi-asserted-by":"crossref","unstructured":"Bar-Tal, O. et al. Lumiere: a space\u2013time diffusion model for video generation. In SIGGRAPH Asia 2024 Conference Papers 1\u201311 (Association for Computing Machinery, 2024).","DOI":"10.1145\/3680528.3687614"},{"key":"1011_CR37","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P. & Ommer, B. High-resolution image synthesis with latent diffusion models. In Proc. IEEE\/CVF Conference on Computer Vision and Pattern Recognition 10684\u201310695 (IEEE Computer Society, 2022).","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"1011_CR38","doi-asserted-by":"publisher","first-page":"2577","DOI":"10.1002\/bip.360221211","volume":"22","author":"W Kabsch","year":"1983","unstructured":"Kabsch, W. & Sander, C. Dictionary of protein secondary structure: pattern recognition of hydrogen-bonded and geometrical features. Biopolymers 22, 2577\u20132637 (1983).","journal-title":"Biopolymers"},{"key":"1011_CR39","doi-asserted-by":"publisher","first-page":"102372","DOI":"10.1016\/j.sbi.2022.102372","volume":"74","author":"JL Binder","year":"2022","unstructured":"Binder, J. L. et al. AlphaFold illuminates half of the dark human proteins. Curr. Opin. Struct. Biol. 74, 102372 (2022).","journal-title":"Curr. Opin. Struct. Biol."},{"key":"1011_CR40","doi-asserted-by":"publisher","first-page":"168","DOI":"10.1126\/science.aan0693","volume":"357","author":"GJ Rocklin","year":"2017","unstructured":"Rocklin, G. J. et al. Global analysis of protein folding using massively parallel design, synthesis, and testing. Science 357, 168\u2013175 (2017).","journal-title":"Science"},{"key":"1011_CR41","doi-asserted-by":"crossref","unstructured":"Rohl, C. A., Strauss, C. E., Misura, K. M. & Baker, D. in Methods in Enzymology Vol. 383 (eds Brand, L. & Johnson, M. L.) 66\u201393 (Elsevier, 2004).","DOI":"10.1016\/S0076-6879(04)83004-0"},{"key":"1011_CR42","doi-asserted-by":"publisher","first-page":"689","DOI":"10.1093\/bioinformatics\/btq007","volume":"26","author":"S Chaudhury","year":"2010","unstructured":"Chaudhury, S., Lyskov, S. & Gray, J. J. PyRosetta: a script-based interface for implementing molecular modeling algorithms using Rosetta. Bioinformatics 26, 689\u2013691 (2010).","journal-title":"Bioinformatics"},{"key":"1011_CR43","doi-asserted-by":"publisher","first-page":"6201","DOI":"10.1021\/acs.jctc.6b00819","volume":"12","author":"H Park","year":"2016","unstructured":"Park, H. et al. Simultaneous optimization of biomolecular energy functions on features from small molecules and macromolecules. J. Chem. Theory Comput. 12, 6201\u20136212 (2016).","journal-title":"J. Chem. Theory Comput."},{"key":"1011_CR44","doi-asserted-by":"publisher","first-page":"235","DOI":"10.1093\/nar\/28.1.235","volume":"28","author":"HM Berman","year":"2000","unstructured":"Berman, H. M. et al. The Protein Data Bank. Nucleic Acids Res. 28, 235\u2013242 (2000).","journal-title":"Nucleic Acids Res."},{"key":"1011_CR45","doi-asserted-by":"crossref","unstructured":"Liu, S. et al. A multi-grained symmetric differential equation model for learning protein\u2013ligand binding dynamics. Preprint at https:\/\/arxiv.org\/abs\/2401.15122 (2024).","DOI":"10.21203\/rs.3.rs-5538361\/v1"},{"key":"1011_CR46","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1186\/s13321-021-00522-2","volume":"13","author":"AT McNutt","year":"2021","unstructured":"McNutt, A. T. et al. gnina 1.0: molecular docking with deep learning. J. Cheminformatics 13, 43 (2021).","journal-title":"J. Cheminformatics"},{"key":"1011_CR47","doi-asserted-by":"publisher","first-page":"345","DOI":"10.1021\/jm901325e","volume":"53","author":"E Salsi","year":"2010","unstructured":"Salsi, E. et al. Design of O-acetylserine sulfhydrylase inhibitors by mimicking nature. J. Med. Chem. 53, 345\u2013356 (2010).","journal-title":"J. Med. Chem."},{"key":"1011_CR48","doi-asserted-by":"crossref","unstructured":"Rao, R. et al. Evaluating protein transfer learning with TAPE. Adv. Neural Inf. Process. Syst. 32 (2019).","DOI":"10.1101\/676825"},{"key":"1011_CR49","doi-asserted-by":"publisher","first-page":"520","DOI":"10.1002\/prot.25674","volume":"87","author":"MS Klausen","year":"2019","unstructured":"Klausen, M. S. et al. NetSurfP-2.0: improved prediction of protein structural features by integrated deep learning. Proteins 87, 520\u2013527 (2019).","journal-title":"Proteins"},{"key":"1011_CR50","doi-asserted-by":"publisher","first-page":"1295","DOI":"10.1093\/bioinformatics\/btx780","volume":"34","author":"J Hou","year":"2018","unstructured":"Hou, J., Adhikari, B. & Cheng, J. DeepSF: deep convolutional neural network for mapping protein sequences to folds. Bioinformatics 34, 1295\u20131303 (2018).","journal-title":"Bioinformatics"},{"key":"1011_CR51","doi-asserted-by":"publisher","first-page":"D304","DOI":"10.1093\/nar\/gkt1240","volume":"42","author":"NK Fox","year":"2013","unstructured":"Fox, N. K., Brenner, S. E. & Chandonia, J.-M. SCOPe: Structural Classification of Proteins\u2014extended, integrating SCOP and ASTRAL data and classification of new structures. Nucleic Acids Res. 42, D304\u2013D309 (2013).","journal-title":"Nucleic Acids Res."},{"key":"1011_CR52","doi-asserted-by":"publisher","first-page":"311","DOI":"10.1186\/s12859-019-2932-0","volume":"20","author":"M AlQuraishi","year":"2019","unstructured":"AlQuraishi, M. ProteinNet: a standardized data set for machine learning of protein structure. BMC Bioinform. 20, 311 (2019).","journal-title":"BMC Bioinform."},{"key":"1011_CR53","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1002\/prot.25415","volume":"86","author":"J Moult","year":"2018","unstructured":"Moult, J., Fidelis, K., Kryshtafovych, A., Schwede, T. & Tramontano, A. Critical assessment of methods of protein structure prediction (CASP)\u2014Round XII. Proteins 86, 7\u201315 (2018).","journal-title":"Proteins"},{"key":"1011_CR54","doi-asserted-by":"publisher","first-page":"397","DOI":"10.1038\/nature17995","volume":"533","author":"KS Sarkisyan","year":"2016","unstructured":"Sarkisyan, K. S. et al. Local fitness landscape of the green fluorescent protein. Nature 533, 397\u2013401 (2016).","journal-title":"Nature"},{"key":"1011_CR55","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S. & Schmidhuber, J. Long short-term memory. Neural Comput. 9, 1735\u20131780 (1997).","journal-title":"Neural Comput."},{"key":"1011_CR56","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S. & Sun, J. Deep residual learning for image recognition. In Proc. IEEE Conference on Computer Vision and Pattern Recognition 770\u2013778 (IEEE, 2016).","DOI":"10.1109\/CVPR.2016.90"},{"key":"1011_CR57","unstructured":"Zhang, N. et al. OntoProtein: protein pretraining with Gene Ontology embedding. In International Conference on Learning Representations (2022)."},{"key":"1011_CR58","doi-asserted-by":"publisher","first-page":"1070","DOI":"10.1038\/s41586-023-06728-8","volume":"623","author":"J Ingraham","year":"2023","unstructured":"Ingraham, J. et al. Illuminating protein space with a programmable generative model. Nature 623, 1070\u20131078 (2023).","journal-title":"Nature"},{"key":"1011_CR59","doi-asserted-by":"publisher","first-page":"W587","DOI":"10.1093\/nar\/gkz389","volume":"47","author":"C-H Wei","year":"2019","unstructured":"Wei, C.-H., Allot, A., Leaman, R. & Lu, Z. PubTator Central: automated concept annotation for biomedical full text articles. Nucleic Acids Res. 47, W587\u2013W593 (2019).","journal-title":"Nucleic Acids Res."},{"key":"1011_CR60","unstructured":"Angermueller, C. et al. Model-based reinforcement learning for biological sequence design. In International Conference on Learning Representations (2020)."},{"key":"1011_CR61","doi-asserted-by":"publisher","first-page":"e2104878118","DOI":"10.1073\/pnas.2104878118","volume":"118","author":"S Gelman","year":"2021","unstructured":"Gelman, S., Fahlberg, S. A., Heinzelman, P., Romero, P. A. & Gitter, A. Neural networks to learn protein sequence\u2013function relationships from deep mutational scanning data. Proc. Natl Acad. Sci. USA 118, e2104878118 (2021).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"1011_CR62","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-021-25976-8","volume":"12","author":"Y Luo","year":"2021","unstructured":"Luo, Y. et al. ECNet is an evolutionary context-integrated deep learning framework for protein engineering. Nat. Commun. 12, 5743 (2021).","journal-title":"Nat. Commun."},{"key":"1011_CR63","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1038\/s41592-021-01100-y","volume":"18","author":"S Biswas","year":"2021","unstructured":"Biswas, S., Khimulya, G., Alley, E. C., Esvelt, K. M. & Church, G. M. Low-N protein engineering with data-efficient deep learning. Nat. Methods 18, 389\u2013396 (2021).","journal-title":"Nat. Methods"},{"key":"1011_CR64","unstructured":"Notin, P. et al. Tranception: protein fitness prediction with autoregressive transformers and inference-time retrieval. Proc. Mach. Learning Res. 162, 16990\u201317017 (2022)."},{"key":"1011_CR65","first-page":"9","volume":"1","author":"A Radford","year":"2019","unstructured":"Radford, A. et al. Language models are unsupervised multitask learners. OpenAI Blog 1, 9 (2019).","journal-title":"OpenAI Blog"},{"key":"1011_CR66","doi-asserted-by":"crossref","unstructured":"Lewis, M. et al. BART: denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. In Proc. 58th Annual Meeting of the Association for Computational Linguistics (eds Jurafsky, D. et al.) 7871\u20137880 (Association for Computational Linguistics, 2020).","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"1011_CR67","first-page":"1","volume":"21","author":"C Raffel","year":"2020","unstructured":"Raffel, C. et al. Exploring the limits of transfer learning with a unified text-to-text transformer. J. Mach. Learning Res. 21, 1\u201367 (2020).","journal-title":"J. Mach. Learning Res."},{"key":"1011_CR68","unstructured":"Ho, J., Jain, A. & Abbeel, P. Denoising diffusion probabilistic models. Adv. Neural Inf. Process. Syst. 33, 6840\u20136851 (2020)."},{"key":"1011_CR69","doi-asserted-by":"publisher","first-page":"1661","DOI":"10.1162\/NECO_a_00142","volume":"23","author":"P Vincent","year":"2011","unstructured":"Vincent, P. A connection between score matching and denoising autoencoders. Neural Comput. 23, 1661\u20131674 (2011).","journal-title":"Neural Comput."},{"key":"1011_CR70","unstructured":"Song, Y. & Ermon, S. Generative modeling by estimating gradients of the data distribution. Adv. Neural Inf. Process. Syst. 32 (2019)."},{"key":"1011_CR71","unstructured":"Song, Y. et al. Score-based generative modeling through stochastic differential equations. In International Conference on Learning Representations (2021)."},{"key":"1011_CR72","unstructured":"Hjelm, R. D. et al. Learning deep representations by mutual information estimation and maximization. In International Conference on Learning Representations (2019)."},{"key":"1011_CR73","unstructured":"Bachman, P., Hjelm, R. D. & Buchwalter, W. Learning representations by maximizing mutual information across views. Adv. Neural Inf. Process. Syst. 32 (2019)."},{"key":"1011_CR74","unstructured":"Oord, A. v. d., Li, Y. & Vinyals, O. Representation learning with contrastive predictive coding. Preprint at https:\/\/arxiv.org\/abs\/1807.03748 (2018)."},{"key":"1011_CR75","doi-asserted-by":"crossref","unstructured":"He, K., Fan, H., Wu, Y., Xie, S. & Girshick, R. Momentum contrast for unsupervised visual representation learning. In Proc. IEEE\/CVF Conference on Computer Vision and Pattern Recognition 9729\u20139738 (IEEE, 2020).","DOI":"10.1109\/CVPR42600.2020.00975"},{"key":"1011_CR76","unstructured":"Liu, S. et al. Pre-training molecular graph representation with 3D geometry. In International Conference on Learning Representations (2022)."},{"key":"1011_CR77","unstructured":"LeCun, Y., Chopra, S., Hadsell, R., Ranzato, M. & Huang, F. in Predicting Structured Data Vol. 1 (eds Bakir, G. et al.) (MIT Press, 2006)."},{"key":"1011_CR78","unstructured":"Khosla, P. et al. Supervised contrastive learning. Adv. Neural Inf. Process. Syst. 33, 18661\u201318673 (2020)."},{"key":"1011_CR79","unstructured":"Liu, S., Guo, H. & Tang, J. Molecular geometry pretraining with SE(3)-invariant denoising distance matching. In International Conference on Learning Representations (2023)."},{"key":"1011_CR80","doi-asserted-by":"crossref","unstructured":"Huang, W., Hayashi, T., Wu, Y., Kameoka, H. & Toda, T. Voice transformer network: sequence-to-sequence voice conversion using Transformer with text-to-speech pretraining. In Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25\u201329 October 2020 (eds Meng, H. et al.) 4676\u20134680 (ISCA, 2020).","DOI":"10.21437\/Interspeech.2020-1066"},{"key":"1011_CR81","doi-asserted-by":"crossref","unstructured":"Karita, S. et al. A comparative study on Transformer vs RNN in speech applications. In IEEE Automatic Speech Recognition and Understanding Workshop, ASRU 2019, Singapore, December 14\u201318, 2019 449\u2013456 (IEEE, 2019).","DOI":"10.1109\/ASRU46091.2019.9003750"},{"key":"1011_CR82","unstructured":"Chang, H. et al. Muse: text-to-image generation via masked generative transformers. Proc. Mach. Learning Res. 202, 4055\u20134075 (2023)."},{"key":"1011_CR83","unstructured":"Song, Y. & Kingma, D. P. How to train your energy-based models. Preprint at https:\/\/arxiv.org\/abs\/2101.03288 (2021)."},{"key":"1011_CR84","first-page":"12454","volume":"34","author":"E Hoogeboom","year":"2021","unstructured":"Hoogeboom, E., Nielsen, D., Jaini, P., Forr\u00e9, P. & Welling, M. Argmax flows and multinomial diffusion: learning categorical distributions. Adv. Neural Inf. Process. Syst. 34, 12454\u201312465 (2021).","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"1011_CR85","first-page":"17981","volume":"34","author":"J Austin","year":"2021","unstructured":"Austin, J., Johnson, D. D., Ho, J., Tarlow, D. & van den Berg, R. Structured denoising diffusion models in discrete state-spaces. Adv. Neural Inf. Process. Syst. 34, 17981\u201317993 (2021).","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"1011_CR86","unstructured":"Li, X., Thickstun, J., Gulrajani, I., Liang, P. S. & Hashimoto, T. B. Diffusion-LM improves controllable text generation. Adv. Neural Inf. Process Syst. 35, 4328\u20134343 (2022)."},{"key":"1011_CR87","doi-asserted-by":"crossref","unstructured":"Bond-Taylor, S., Hessey, P., Sasaki, H., Breckon, T. P. & Willcocks, C. G. Unleashing Transformers: parallel token prediction with discrete absorbing diffusion for fast high-resolution image generation from vector-quantized codes. In Computer Vision - ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proc., Part XXIII (eds Avidan, S.) 170\u2013188 (Springer, 2022).","DOI":"10.1007\/978-3-031-20050-2_11"},{"key":"1011_CR88","doi-asserted-by":"publisher","unstructured":"Liu, S. et al. A text-guided protein design framework. Zenodo https:\/\/doi.org\/10.5281\/zenodo.14630813 (2025).","DOI":"10.5281\/zenodo.14630813"}],"container-title":["Nature Machine Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-01011-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-01011-z","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-01011-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,22]],"date-time":"2025-04-22T22:03:34Z","timestamp":1745359414000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s42256-025-01011-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,27]]},"references-count":88,"journal-issue":{"issue":"4","published-online":{"date-parts":[[2025,4]]}},"alternative-id":["1011"],"URL":"https:\/\/doi.org\/10.1038\/s42256-025-01011-z","relation":{},"ISSN":["2522-5839"],"issn-type":[{"value":"2522-5839","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3,27]]},"assertion":[{"value":"1 December 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 February 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 March 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}