{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T16:10:35Z","timestamp":1775578235313,"version":"3.50.1"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2021,1,18]],"date-time":"2021-01-18T00:00:00Z","timestamp":1610928000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2021,1,18]],"date-time":"2021-01-18T00:00:00Z","timestamp":1610928000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100000051","name":"U.S. Department of Health & Human Services | NIH | National Human Genome Research Institute","doi-asserted-by":"publisher","award":["1R21HG010070-01"],"award-info":[{"award-number":["1R21HG010070-01"]}],"id":[{"id":"10.13039\/100000051","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000051","name":"U.S. 
Department of Health & Human Services | NIH | National Human Genome Research Institute","doi-asserted-by":"publisher","award":["1R21HG010070-01"],"award-info":[{"award-number":["1R21HG010070-01"]}],"id":[{"id":"10.13039\/100000051","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Mach Intell"],"DOI":"10.1038\/s42256-020-00282-y","type":"journal-article","created":{"date-parts":[[2021,1,18]],"date-time":"2021-01-18T17:04:35Z","timestamp":1610989475000},"page":"172-180","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":91,"title":["Deep neural networks identify sequence context features predictive of transcription factor binding"],"prefix":"10.1038","volume":"3","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3689-2712","authenticated-orcid":false,"given":"An","family":"Zheng","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5797-1914","authenticated-orcid":false,"given":"Michael","family":"Lamkin","sequence":"additional","affiliation":[]},{"given":"Hanqing","family":"Zhao","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3687-2199","authenticated-orcid":false,"given":"Cynthia","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Hao","family":"Su","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6086-3903","authenticated-orcid":false,"given":"Melissa","family":"Gymrek","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,1,18]]},"reference":[{"key":"282_CR1","doi-asserted-by":"publisher","first-page":"650","DOI":"10.1016\/j.cell.2018.01.029","volume":"172","author":"SA Lambert","year":"2018","unstructured":"Lambert, S. A. et al. The human transcription factors. 
Cell 172, 650\u2013665 (2018).","journal-title":"Cell"},{"key":"282_CR2","doi-asserted-by":"publisher","first-page":"76","DOI":"10.1016\/j.gde.2015.12.003","volume":"37","author":"KS Zaret","year":"2016","unstructured":"Zaret, K. S. & Mango, S. E. Pioneer transcription factors, chromatin dynamics, and cell fate control. Curr. Opin. Genet. Dev. 37, 76\u201381 (2016).","journal-title":"Curr. Opin. Genet. Dev."},{"key":"282_CR3","doi-asserted-by":"publisher","first-page":"772","DOI":"10.1038\/nature04979","volume":"442","author":"E Segal","year":"2006","unstructured":"Segal, E. et al. A genomic code for nucleosome positioning. Nature 442, 772\u2013778 (2006).","journal-title":"Nature"},{"key":"282_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.sbi.2017.03.006","volume":"47","author":"E Morgunova","year":"2017","unstructured":"Morgunova, E. & Taipale, J. Structural perspective of cooperative transcription factor binding. Curr. Opin. Struct. Biol. 47, 1\u20138 (2017).","journal-title":"Curr. Opin. Struct. Biol."},{"key":"282_CR5","doi-asserted-by":"publisher","first-page":"1798","DOI":"10.1101\/gr.139105.112","volume":"22","author":"J Wang","year":"2012","unstructured":"Wang, J. et al. Sequence features and chromatin structure around the genomic regions bound by 119 human transcription factors. Genome Res. 22, 1798\u20131812 (2012).","journal-title":"Genome Res."},{"key":"282_CR6","doi-asserted-by":"publisher","first-page":"4654","DOI":"10.1073\/pnas.1422023112","volume":"112","author":"T Zhou","year":"2015","unstructured":"Zhou, T. et al. Quantitative modeling of transcription factor binding specificities using DNA shape. Proc. Natl Acad. Sci. USA 112, 4654\u20134659 (2015).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"282_CR7","doi-asserted-by":"publisher","first-page":"891","DOI":"10.1101\/gr.226852.117","volume":"28","author":"Y Guo","year":"2018","unstructured":"Guo, Y., Tian, K., Zeng, H., Guo, X. & Gifford, D. K. 
A novel k-mer set memory (KSM) motif representation improves regulatory variant prediction. Genome Res. 28, 891\u2013900 (2018).","journal-title":"Genome Res."},{"key":"282_CR8","doi-asserted-by":"publisher","DOI":"10.1186\/1471-2105-9-484","volume":"9","author":"JO Westholm","year":"2008","unstructured":"Westholm, J. O., Xu, F., Ronne, H. & Komorowski, J. Genome-scale study of the importance of binding site context for transcription factor binding and gene regulation. BMC Bioinform. 9, 484 (2008).","journal-title":"BMC Bioinform."},{"key":"282_CR9","doi-asserted-by":"publisher","first-page":"831","DOI":"10.1038\/nbt.3300","volume":"33","author":"B Alipanahi","year":"2015","unstructured":"Alipanahi, B., Delong, A., Weirauch, M. T. & Frey, B. J. Predicting the sequence specificities of DNA- and RNA-binding proteins by deep learning. Nat. Biotechnol. 33, 831\u2013838 (2015).","journal-title":"Nat. Biotechnol."},{"key":"282_CR10","doi-asserted-by":"publisher","first-page":"739","DOI":"10.1101\/gr.227819.117","volume":"28","author":"DR Kelley","year":"2018","unstructured":"Kelley, D. R. et al. Sequential regulatory activity prediction across chromosomes with convolutional neural networks. Genome Res. 28, 739\u2013750 (2018).","journal-title":"Genome Res."},{"key":"282_CR11","doi-asserted-by":"publisher","first-page":"990","DOI":"10.1101\/gr.200535.115","volume":"26","author":"DR Kelley","year":"2016","unstructured":"Kelley, D. R., Snoek, J. & Rinn, J. L. Basset: learning the regulatory code of the accessible genome with deep convolutional neural networks. Genome Res. 26, 990\u2013999 (2016).","journal-title":"Genome Res."},{"key":"282_CR12","doi-asserted-by":"publisher","first-page":"955","DOI":"10.1038\/ng.3331","volume":"47","author":"D Lee","year":"2015","unstructured":"Lee, D. et al. A method to predict the impact of regulatory variants from DNA sequence. Nat. Genet. 47, 955\u2013961 (2015).","journal-title":"Nat. 
Genet."},{"key":"282_CR13","doi-asserted-by":"publisher","first-page":"e107","DOI":"10.1093\/nar\/gkw226","volume":"44","author":"D Quang","year":"2016","unstructured":"Quang, D. & Xie, X. DanQ: a hybrid convolutional and recurrent deep neural network for quantifying the function of DNA sequences. Nucleic Acids Res. 44, e107 (2016).","journal-title":"Nucleic Acids Res."},{"key":"282_CR14","doi-asserted-by":"publisher","first-page":"40","DOI":"10.1016\/j.ymeth.2019.03.020","volume":"166","author":"D Quang","year":"2019","unstructured":"Quang, D. & Xie, X. FactorNet: a deep learning framework for predicting cell type specific transcription factor binding from nucleotide-resolution sequential data. Methods 166, 40\u201347 (2019).","journal-title":"Methods"},{"key":"282_CR15","doi-asserted-by":"publisher","first-page":"490","DOI":"10.1093\/bioinformatics\/btv565","volume":"32","author":"H Zeng","year":"2016","unstructured":"Zeng, H., Hashimoto, T., Kang, D. D. & Gifford, D. K. GERV: a statistical method for generative evaluation of regulatory variants for transcription factor binding. Bioinformatics 32, 490\u2013496 (2016).","journal-title":"Bioinformatics"},{"key":"282_CR16","doi-asserted-by":"publisher","first-page":"931","DOI":"10.1038\/nmeth.3547","volume":"12","author":"J Zhou","year":"2015","unstructured":"Zhou, J. & Troyanskaya, O. G. Predicting effects of noncoding variants with deep learning\u2013based sequence model. Nat. Meth. 12, 931\u2013934 (2015).","journal-title":"Nat. Meth."},{"key":"282_CR17","doi-asserted-by":"crossref","unstructured":"Selvaraju, R. R. et al. Grad-CAM: visual explanations from deep networks via gradient-based localization. In Proc. IEEE International Conference on Computer Vision 618\u2013626 (2017).","DOI":"10.1109\/ICCV.2017.74"},{"key":"282_CR18","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1038\/nature11247","volume":"489","author":"EP Consortium","year":"2012","unstructured":"Consortium, E. P. 
An integrated encyclopedia of DNA elements in the human genome. Nature 489, 57\u201374 (2012).","journal-title":"Nature"},{"key":"282_CR19","doi-asserted-by":"publisher","first-page":"D260","DOI":"10.1093\/nar\/gkx1126","volume":"46","author":"A Khan","year":"2018","unstructured":"Khan, A. et al. JASPAR 2018: update of the open-access database of transcription factor binding profiles and its web framework. Nucleic Acids Res. 46, D260\u2013D266 (2018).","journal-title":"Nucleic Acids Res."},{"key":"282_CR20","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1038\/nature14248","volume":"518","author":"A Kundaje","year":"2015","unstructured":"Kundaje, A. et al. Integrative analysis of 111 reference human epigenomes. Nature 518, 317\u2013330 (2015).","journal-title":"Nature"},{"key":"282_CR21","doi-asserted-by":"publisher","first-page":"3449","DOI":"10.1002\/sim.5777","volume":"32","author":"H Ma","year":"2013","unstructured":"Ma, H., Bandos, A. I., Rockette, H. E. & Gur, D. On use of partial area under the ROC curve for evaluation of diagnostic performance. Stat. Med. 32, 3449\u20133458 (2013).","journal-title":"Stat. Med."},{"key":"282_CR22","doi-asserted-by":"publisher","first-page":"879","DOI":"10.1016\/j.ajhg.2019.03.012","volume":"104","author":"T Amariuta","year":"2019","unstructured":"Amariuta, T. et al. IMPACT: genomic annotation of cell-state-specific regulatory elements inferred from the epigenome of bound transcription factors. Am. J. Hum. Genet. 104, 879\u2013895 (2019).","journal-title":"Am. J. Hum. Genet."},{"key":"282_CR23","unstructured":"Shrikumar, A., Greenside, P. & Kundaje, A. Learning important features through propagating activation differences. In Proc. 34th International Conference on Machine Learning 70, 3145\u20133153 (JMLR, 2017)."},{"key":"282_CR24","doi-asserted-by":"crossref","unstructured":"Lanchantin, J., Singh, R., Wang, B. & Qi, Y. 
Deep motif dashboard: visualizing and understanding genomic sequences using deep neural networks. In Pacific Symposium on Biocomputing 2017 254\u2013265 (World Scientific, 2017).","DOI":"10.1142\/9789813207813_0025"},{"key":"282_CR25","doi-asserted-by":"publisher","first-page":"565","DOI":"10.1101\/gr.104471.109","volume":"20","author":"V Gotea","year":"2010","unstructured":"Gotea, V. et al. Homotypic clusters of transcription factor binding sites are a key component of human promoters and enhancers. Genome Res. 20, 565\u2013577 (2010).","journal-title":"Genome Res."},{"key":"282_CR26","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1016\/S0378-1119(99)00180-8","volume":"234","author":"K Roder","year":"1999","unstructured":"Roder, K., Wolf, S. S., Larkin, K. J. & Schweizer, M. Interaction between the two ubiquitously expressed transcription factors NF-Y and Sp1. Gene 234, 61\u201369 (1999).","journal-title":"Gene"},{"key":"282_CR27","doi-asserted-by":"publisher","first-page":"4684","DOI":"10.1093\/nar\/gkw096","volume":"44","author":"D Dolfini","year":"2016","unstructured":"Dolfini, D., Zambelli, F., Pedrazzoli, M., Mantovani, R. & Pavesi, G. A high definition look at the NF-Y regulome reveals genome-wide associations with selected transcription factors. Nucleic Acids Res. 44, 4684\u20134702 (2016).","journal-title":"Nucleic Acids Res."},{"key":"282_CR28","doi-asserted-by":"publisher","first-page":"2453","DOI":"10.1038\/sj.onc.1204239","volume":"20","author":"H Van Dam","year":"2001","unstructured":"Van Dam, H. & Castellazzi, M. Distinct roles of Jun: Fos and Jun: ATF dimers in oncogenesis. Oncogene 20, 2453\u20132464 (2001).","journal-title":"Oncogene"},{"key":"282_CR29","doi-asserted-by":"publisher","first-page":"576","DOI":"10.1016\/j.molcel.2010.05.004","volume":"38","author":"S Heinz","year":"2010","unstructured":"Heinz, S. et al. 
Simple combinations of lineage-determining transcription factors prime cis-regulatory elements required for macrophage and B cell identities. Mol. Cell 38, 576\u2013589 (2010).","journal-title":"Mol. Cell"},{"key":"282_CR30","doi-asserted-by":"publisher","first-page":"543","DOI":"10.1038\/nature11530","volume":"490","author":"P Li","year":"2012","unstructured":"Li, P. et al. BATF\u2013JUN is critical for IRF4-mediated transcription in T cells. Nature 490, 543\u2013546 (2012).","journal-title":"Nature"},{"key":"282_CR31","doi-asserted-by":"publisher","first-page":"e1003906","DOI":"10.1371\/journal.pgen.1003906","volume":"9","author":"C Benner","year":"2013","unstructured":"Benner, C. et al. Decoding a signature-based model of transcription cofactor recruitment dictated by cardinal cis-regulatory elements in proximal promoter regions. PLoS Genet. 9, e1003906 (2013).","journal-title":"PLoS Genet."},{"key":"282_CR32","doi-asserted-by":"crossref","unstructured":"Mevel, R., Draper, J. E., Lie, A. L. M., Kouskoff, V. & Lacaud, G. RUNX transcription factors: orchestrators of development. Development 146, dev148296 (2019).","DOI":"10.1242\/dev.148296"},{"key":"282_CR33","doi-asserted-by":"publisher","first-page":"649","DOI":"10.1038\/cmi.2017.37","volume":"14","author":"A Kroger","year":"2017","unstructured":"Kroger, A. IRFs as competing pioneers in T-cell differentiation. Cell. Mol. Immunol. 14, 649\u2013651 (2017).","journal-title":"Cell. Mol. Immunol."},{"key":"282_CR34","doi-asserted-by":"publisher","first-page":"1519","DOI":"10.1016\/j.cell.2016.04.027","volume":"165","author":"R Tewhey","year":"2016","unstructured":"Tewhey, R. et al. Direct identification of hundreds of expression-modulating variants using a multiplexed reporter assay. Cell 165, 1519\u20131529 (2016).","journal-title":"Cell"},{"key":"282_CR35","doi-asserted-by":"publisher","DOI":"10.1186\/s12859-019-2957-4","volume":"20","author":"G Liu","year":"2019","unstructured":"Liu, G., Zeng, H. & Gifford, D. K. 
Visualizing complex feature interactions and feature sharing in genomic deep neural networks. BMC Bioinform. 20, 401 (2019).","journal-title":"BMC Bioinform."},{"key":"282_CR36","doi-asserted-by":"publisher","first-page":"1259","DOI":"10.1002\/humu.23198","volume":"38","author":"H Zeng","year":"2017","unstructured":"Zeng, H., Edwards, M. D., Guo, Y. & Gifford, D. K. Accurate eQTL prioritization with an ensemble-based framework. Hum. Mutat. 38, 1259\u20131265 (2017).","journal-title":"Hum. Mutat."},{"key":"282_CR37","doi-asserted-by":"publisher","first-page":"1017","DOI":"10.1093\/bioinformatics\/btr064","volume":"27","author":"CE Grant","year":"2011","unstructured":"Grant, C. E., Bailey, T. L. & Noble, W. S. FIMO: scanning for occurrences of a given motif. Bioinformatics 27, 1017\u20131018 (2011).","journal-title":"Bioinformatics"},{"key":"282_CR38","unstructured":"Abadi, M. et al. TensorFlow: a system for large-scale machine learning. In Proc. 12th USENIX Symposium on Operating Systems Design and Implementation (OSDI \u201916) 265\u2013283 (USENIX, 2016)."},{"key":"282_CR39","doi-asserted-by":"publisher","first-page":"592","DOI":"10.1038\/s41587-019-0140-0","volume":"37","author":"\u017d Avsec","year":"2019","unstructured":"Avsec, \u017d. et al. The Kipoi repository accelerates community exchange and reuse of predictive models for genomics. Nat. Biotechnol. 37, 592\u2013600 (2019).","journal-title":"Nat. Biotechnol."},{"key":"282_CR40","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1038\/s41592-019-0686-2","volume":"17","author":"P Virtanen","year":"2020","unstructured":"Virtanen, P. et al. SciPy 1.0: fundamental algorithms for scientific computing in Python. Nat. Methods 17, 261\u2013272 (2020).","journal-title":"Nat. Methods"},{"key":"282_CR41","doi-asserted-by":"publisher","first-page":"D252","DOI":"10.1093\/nar\/gkx1106","volume":"46","author":"IV Kulakovskiy","year":"2018","unstructured":"Kulakovskiy, I. V. et al. 
HOCOMOCO: towards a complete collection of transcription factor binding models for human and mouse via large-scale ChIP-Seq analysis. Nucleic Acids Res. 46, D252\u2013D259 (2018).","journal-title":"Nucleic Acids Res."},{"key":"282_CR42","doi-asserted-by":"publisher","first-page":"434","DOI":"10.1038\/s41586-020-2308-7","volume":"581","author":"KJ Karczewski","year":"2020","unstructured":"Karczewski, K. J. et al. The mutational constraint spectrum quantified from variation in 141,456 humans. Nature 581, 434\u2013443 (2020).","journal-title":"Nature"},{"key":"282_CR43","doi-asserted-by":"publisher","first-page":"285","DOI":"10.1038\/nature19057","volume":"536","author":"M Lek","year":"2016","unstructured":"Lek, M. et al. Analysis of protein-coding genetic variation in 60,706 humans. Nature 536, 285\u2013291 (2016).","journal-title":"Nature"},{"key":"282_CR44","doi-asserted-by":"publisher","first-page":"308","DOI":"10.1093\/nar\/29.1.308","volume":"29","author":"ST Sherry","year":"2001","unstructured":"Sherry, S. T. et al. dbSNP: the NCBI database of genetic variation. Nucleic Acids Res. 29, 308\u2013311 (2001).","journal-title":"Nucleic Acids Res."},{"key":"282_CR45","doi-asserted-by":"publisher","unstructured":"Zheng, A. 
Pandaman-Ryan\/AgentBind v.0.1 (accessed 19 November 2020); https:\/\/doi.org\/10.5281\/zenodo.4281456","DOI":"10.5281\/zenodo.4281456"}],"container-title":["Nature Machine Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s42256-020-00282-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-020-00282-y","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-020-00282-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,3]],"date-time":"2022-12-03T20:43:10Z","timestamp":1670100190000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s42256-020-00282-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,18]]},"references-count":45,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2021,2]]}},"alternative-id":["282"],"URL":"https:\/\/doi.org\/10.1038\/s42256-020-00282-y","relation":{},"ISSN":["2522-5839"],"issn-type":[{"value":"2522-5839","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,1,18]]},"assertion":[{"value":"17 December 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 December 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 January 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}