{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T03:29:24Z","timestamp":1774409364715,"version":"3.50.1"},"reference-count":41,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2023,5,4]],"date-time":"2023-05-04T00:00:00Z","timestamp":1683158400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,5,4]],"date-time":"2023-05-04T00:00:00Z","timestamp":1683158400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100007202","name":"Gouvernement du Canada | Instituts de Recherche en Sant\u00e9 du Canada | CIHR Skin Research Training Centre","doi-asserted-by":"publisher","award":["PJT-153279"],"award-info":[{"award-number":["PJT-153279"]}],"id":[{"id":"10.13039\/501100007202","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100007202","name":"Gouvernement du Canada | Instituts de Recherche en Sant\u00e9 du Canada | CIHR Skin Research Training Centre","doi-asserted-by":"publisher","award":["PJT-153279"],"award-info":[{"award-number":["PJT-153279"]}],"id":[{"id":"10.13039\/501100007202","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002790","name":"Canadian Network for Research and Innovation in Machining Technology, Natural Sciences and Engineering Research Council of Canada","doi-asserted-by":"publisher","award":["RGPIN-2017-064"],"award-info":[{"award-number":["RGPIN-2017-064"]}],"id":[{"id":"10.13039\/501100002790","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002790","name":"Canadian Network for Research and Innovation in Machining Technology, Natural Sciences and Engineering Research Council of Canada","doi-asserted-by":"publisher","award":["RGPIN-2017-064"],"award-info":[{"award-number":["RGPIN-2017-064"]}],"id":[{"id":"10.13039\/501100002790","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002790","name":"Canadian Network for Research and Innovation in Machining Technology, Natural Sciences and Engineering Research Council of Canada","doi-asserted-by":"publisher","award":["RGPIN-2017-064"],"award-info":[{"award-number":["RGPIN-2017-064"]}],"id":[{"id":"10.13039\/501100002790","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100000024","name":"Gouvernement du Canada | Canadian Institutes of Health Research","doi-asserted-by":"publisher","award":["PJT-153279"],"award-info":[{"award-number":["PJT-153279"]}],"id":[{"id":"10.13039\/501100000024","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Comput Sci"],"DOI":"10.1038\/s43588-023-00440-3","type":"journal-article","created":{"date-parts":[[2023,5,4]],"date-time":"2023-05-04T12:02:48Z","timestamp":1683201768000},"page":"382-392","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":71,"title":["Score-based generative modeling for de novo protein design"],"prefix":"10.1038","volume":"3","author":[{"given":"Jin Sub","family":"Lee","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4863-9773","authenticated-orcid":false,"given":"Jisun","family":"Kim","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3683-152X","authenticated-orcid":false,"given":"Philip M.","family":"Kim","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,5,4]]},"reference":[{"key":"440_CR1","doi-asserted-by":"publisher","first-page":"583","DOI":"10.1038\/s41586-021-03819-2","volume":"596","author":"J Jumper","year":"2021","unstructured":"Jumper, J. et al. Highly accurate protein structure prediction with AlphaFold. Nature 596, 583\u2013589 (2021).","journal-title":"Nature"},{"key":"440_CR2","first-page":"402\u2013411.e4","volume":"11","author":"A Strokach","year":"2020","unstructured":"Strokach, A., Becerra, D., Corbi-Verge, C., Perez-Riba, A. & Kim, P. M. Fast and flexible protein design using deep graph neural networks. Cell Syst. 11, 402\u2013411.e4 (2020).","journal-title":"Cell Syst."},{"key":"440_CR3","doi-asserted-by":"crossref","unstructured":"Hsu, C. et al. Learning inverse folding from millions of predicted structures. In International Conference on Machine Learning 8946\u20138970 (PMLR, 2022).","DOI":"10.1101\/2022.04.10.487779"},{"key":"440_CR4","doi-asserted-by":"crossref","unstructured":"Dauparas, J. et al. Robust deep learning based protein sequence design using ProteinMPNN. Science 378, 49\u201356 (2022).","DOI":"10.1126\/science.add2187"},{"key":"440_CR5","doi-asserted-by":"publisher","first-page":"D376","DOI":"10.1093\/nar\/gkz1064","volume":"48","author":"A Andreeva","year":"2020","unstructured":"Andreeva, A., Kulesha, E., Gough, J. & Murzin, A. G. The SCOP database in 2020: expanded classification of representative family and superfamily domains of known protein structures. Nucl. Acids Res. 48, D376\u2013D382 (2020).","journal-title":"Nucl. Acids Res."},{"key":"440_CR6","doi-asserted-by":"publisher","first-page":"D266","DOI":"10.1093\/nar\/gkaa1079","volume":"49","author":"I Sillitoe","year":"2021","unstructured":"Sillitoe, I. et al. CATH: increased structural coverage of functional space. Nucl. Acids Res. 49, D266\u2013D273 (2021).","journal-title":"Nucl. Acids Res."},{"key":"440_CR7","doi-asserted-by":"crossref","unstructured":"Wang, J. et al. Scaffolding protein functional sites using deep learning. Science 377, 387\u2013394 (2022).","DOI":"10.1126\/science.abn2100"},{"key":"440_CR8","unstructured":"Ho, J., Jain, A. & Abbeel, P. Denoising diffusion probabilistic models. In Advances in Neural Information Processing Systems Vol. 33, 6840\u20136851 (Curran Associates, 2020)."},{"key":"440_CR9","unstructured":"Song, Y. & Ermon, S. Generative modeling by estimating gradients of the data distribution. In Advances in Neural Information Processing Systems Vol. 32 (Curran Associates, 2019)."},{"key":"440_CR10","unstructured":"Dhariwal, P. & Nichol, A. Diffusion models beat gans on image synthesis. In Advances in Neural Information Processing Systems Vol. 34, 8780\u20138794 (Curran Associates, 2021)."},{"key":"440_CR11","unstructured":"Kong, Z., Ping, W., Huang, J., Zhao, K. & Catanzaro, B. Diffwave: a versatile diffusion model for audio synthesis. In International Conference of Learning Representations (ICLR, 2021)."},{"key":"440_CR12","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., Chu, C. & Chen, M. Hierarchical text-conditional image generation with CLIP latents. Preprint at http:\/\/arxiv.org\/abs\/2204.06125 (2022)."},{"key":"440_CR13","unstructured":"Niu, C. et al. Permutation invariant graph generation via score-based generative modeling. In International Conference on Artificial Intelligence and Statistics 4474\u20134484 (PMLR, 2020)."},{"key":"440_CR14","unstructured":"Jo, J., Lee, S. & Hwang, S. J. Score-based generative modeling of graphs via the system of stochastic differential equations. In International Conference on Machine Learning 10362\u201310383 (PMLR, 2022)."},{"key":"440_CR15","unstructured":"Hoogeboom, E., Satorras, V. G., Vignac, C. & Welling, M. Equivariant diffusion for molecule generation in 3d. In International Conference on Machine Learning 8867\u20138887 (PMLR, 2022)."},{"key":"440_CR16","unstructured":"Song, Y. et al. Score-based generative modeling through stochastic differential equations. In International Conference of Learning Representations (ICLR, 2020)."},{"key":"440_CR17","unstructured":"Anand, N. & Achim, T. Protein structure and sequence generation with equivariant denoising diffusion probabilistic models. Preprint at http:\/\/arxiv.org\/abs\/2205.15019 (2022)."},{"key":"440_CR18","unstructured":"Trippe, B. L. et al. Diffusion probabilistic modeling of protein backbones in 3D for the motif-scaffolding problem. In International Conference of Learning Representations (ICLR, 2022)."},{"key":"440_CR19","unstructured":"Wu, K. E. et al. Protein structure generation via folding diffusion. Preprint at http:\/\/arxiv.org\/abs\/2209.15611 (2022)."},{"key":"440_CR20","doi-asserted-by":"crossref","unstructured":"Watson, J. L. et al. Broadly applicable and accurate protein design by integrating structure prediction networks and diffusion generative models. Preprint at http:\/\/biorxiv.org\/lookup\/doi\/10.1101\/2022.12.09.519842 (2022).","DOI":"10.1101\/2022.12.09.519842"},{"key":"440_CR21","doi-asserted-by":"crossref","unstructured":"Ingraham, J. et al. Illuminating protein space with a programmable generative model. Preprint at http:\/\/biorxiv.org\/lookup\/doi\/10.1101\/2022.12.01.518682 (2022).","DOI":"10.1101\/2022.12.01.518682"},{"key":"440_CR22","doi-asserted-by":"crossref","unstructured":"Wu, R. et al. High-resolution de novo structure prediction from primary sequence. Preprint at http:\/\/biorxiv.org\/lookup\/doi\/10.1101\/2022.07.21.500999 (2022).","DOI":"10.1101\/2022.07.21.500999"},{"key":"440_CR23","doi-asserted-by":"publisher","first-page":"1496","DOI":"10.1073\/pnas.1914677117","volume":"117","author":"J Yang","year":"2020","unstructured":"Yang, J. et al. Improved protein structure prediction using predicted interresidue orientations. Proc. Natl Acad. Sci. USA 117, 1496\u20131503 (2020).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"440_CR24","unstructured":"Lin, Z., Sercu, T., LeCun, Y. & Rives, A. Deep generative models create new and diverse protein structures. Machine Learning in Structural Biology (NeurIPS, 2021)."},{"key":"440_CR25","doi-asserted-by":"publisher","first-page":"2302","DOI":"10.1093\/nar\/gki524","volume":"33","author":"Y Zhang","year":"2005","unstructured":"Zhang, Y. & Skolnick, J. TM-align: a protein structure alignment algorithm based on the TM-score. Nucl. Acids Res. 33, 2302\u20132309 (2005).","journal-title":"Nucl. Acids Res."},{"key":"440_CR26","doi-asserted-by":"publisher","first-page":"889","DOI":"10.1093\/bioinformatics\/btq066","volume":"26","author":"J Xu","year":"2010","unstructured":"Xu, J. & Zhang, Y. How significant is a protein structure similarity with TM-score = 0.5? Bioinformatics 26, 889\u2013895 (2010).","journal-title":"Bioinformatics"},{"key":"440_CR27","doi-asserted-by":"publisher","first-page":"2577","DOI":"10.1002\/bip.360221211","volume":"22","author":"W Kabsch","year":"1983","unstructured":"Kabsch, W. & Sander, C. Dictionary of protein secondary structure: pattern recognition of hydrogen-bonded and geometrical features. Biopolymers 22, 2577\u20132637 (1983).","journal-title":"Biopolymers"},{"key":"440_CR28","doi-asserted-by":"publisher","first-page":"W315","DOI":"10.1093\/nar\/gky497","volume":"46","author":"Andr\u00e1s Micsonai","year":"2018","unstructured":"Micsonai, Andr\u00e1s et al. BeStSel: a web server for accurate protein secondary structure prediction and fold recognition from the circular dichroism spectra. Nucl. Acids Res. 46, W315\u2013W322 (2018).","journal-title":"Nucl. Acids Res."},{"key":"440_CR29","doi-asserted-by":"publisher","first-page":"2876","DOI":"10.1038\/nprot.2006.202","volume":"1","author":"NJ Greenfield","year":"2006","unstructured":"Greenfield, N. J. Using circular dichroism spectra to estimate protein secondary structure. Nat. Protocols 1, 2876\u20132890 (2006).","journal-title":"Nat. Protocols"},{"key":"440_CR30","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P. & Ommer, B. High-resolution image synthesis with latent diffusion models. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 10684\u201310695 (IEEE, 2022).","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"440_CR31","unstructured":"Van Rossum, G. & Drake, F. L. Python 3 Reference Manual (CreateSpace, 2009)."},{"key":"440_CR32","doi-asserted-by":"publisher","first-page":"357","DOI":"10.1038\/s41586-020-2649-2","volume":"585","author":"CR Harris","year":"2020","unstructured":"Harris, C. R. et al. Array programming with NumPy. Nature 585, 357\u2013362 (2020).","journal-title":"Nature"},{"key":"440_CR33","doi-asserted-by":"publisher","first-page":"90","DOI":"10.1109\/MCSE.2007.55","volume":"9","author":"JD Hunter","year":"2007","unstructured":"Hunter, J. D. Matplotlib: a 2D graphics environment. Comput. Sci. Eng. 9, 90\u201395 (2007).","journal-title":"Comput. Sci. Eng."},{"key":"440_CR34","unstructured":"Paszke, A. et al. Pytorch: an imperative style, high-performance deep learning library. In Advances in Neural Information Processing Systems Vol. 32, 8024\u20138035 (Curran Associates, 2019); http:\/\/papers.neurips.cc\/paper\/9015-pytorch-an-imperative-style-high-performance-deep-learning-library.pdf"},{"key":"440_CR35","doi-asserted-by":"publisher","first-page":"1422","DOI":"10.1093\/bioinformatics\/btp163","volume":"25","author":"PJA Cock","year":"2009","unstructured":"Cock, P. J. A. et al. Biopython: freely available Python tools for computational molecular biology and bioinformatics. Bioinformatics 25, 1422\u20131423 (2009).","journal-title":"Bioinformatics"},{"key":"440_CR36","doi-asserted-by":"crossref","unstructured":"Kunzmann, P. & Hamacher, K. Biotite: a unifying open source computational biology framework in python. BMC Bioinform. 19, 346 (2018).","DOI":"10.1186\/s12859-018-2367-z"},{"key":"440_CR37","doi-asserted-by":"publisher","first-page":"1661","DOI":"10.1162\/NECO_a_00142","volume":"23","author":"P Vincent","year":"2011","unstructured":"Vincent, P. A connection between score matching and denoising autoencoders. Neural Comput. 23, 1661\u20131674 (2011).","journal-title":"Neural Comput."},{"key":"440_CR38","doi-asserted-by":"crossref","unstructured":"Lin, G., Milan, A., Shen, C. & Reid, I. Refinenet: multi-path refinement networks for high-resolution semantic segmentation. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition 1925\u20131934 (IEEE, 2017).","DOI":"10.1109\/CVPR.2017.549"},{"key":"440_CR39","doi-asserted-by":"publisher","first-page":"3031","DOI":"10.1021\/acs.jctc.7b00125","volume":"13","author":"RF Alford","year":"2017","unstructured":"Alford, R. F. et al. The rosetta all-atom energy function for macromolecular modeling and design. J. Chem. Theory Comput. 13, 3031\u20133048 (2017).","journal-title":"J. Chem. Theory Comput."},{"key":"440_CR40","doi-asserted-by":"publisher","first-page":"689","DOI":"10.1093\/bioinformatics\/btq007","volume":"26","author":"S Chaudhury","year":"2010","unstructured":"Chaudhury, S., Lyskov, S. & Gray, J. J. PyRosetta: a script-based interface for implementing molecular modeling algorithms using Rosetta. Bioinformatics 26, 689\u2013691 (2010).","journal-title":"Bioinformatics"},{"key":"440_CR41","doi-asserted-by":"publisher","unstructured":"Lee, J. S., Kim, J. & Kim, P. M. Proteinsgm Codebase (Zenodo, 2023); https:\/\/doi.org\/10.5281\/zenodo.7755375","DOI":"10.5281\/zenodo.7755375"}],"container-title":["Nature Computational Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s43588-023-00440-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s43588-023-00440-3","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s43588-023-00440-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,24]],"date-time":"2023-05-24T19:06:21Z","timestamp":1684955181000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s43588-023-00440-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,4]]},"references-count":41,"journal-issue":{"issue":"5","published-online":{"date-parts":[[2023,5]]}},"alternative-id":["440"],"URL":"https:\/\/doi.org\/10.1038\/s43588-023-00440-3","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2022.07.13.499967","asserted-by":"object"},{"id-type":"doi","id":"10.21203\/rs.3.rs-1855828\/v1","asserted-by":"object"}]},"ISSN":["2662-8457"],"issn-type":[{"value":"2662-8457","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,5,4]]},"assertion":[{"value":"13 July 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 March 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 May 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"P.M.K. is a co-founder and consultant to multiple companies, including Resolute Bio, Oracle Therapeutics and Navega Therapeutics and serves on the scientific advisory board of ProteinQure. The remaining authors declare no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}