{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,18]],"date-time":"2026-04-18T08:42:48Z","timestamp":1776501768567,"version":"3.51.2"},"reference-count":17,"publisher":"Oxford University Press (OUP)","issue":"14","license":[{"start":{"date-parts":[[2017,3,25]],"date-time":"2017-03-25T00:00:00Z","timestamp":1490400000000},"content-version":"vor","delay-in-days":1,"URL":"https:\/\/academic.oup.com\/journals\/pages\/about_us\/legal\/notices"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["DBI-1350041"],"award-info":[{"award-number":["DBI-1350041"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["IOS-1237880"],"award-info":[{"award-number":["IOS-1237880"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01-HG006677"],"award-info":[{"award-number":["R01-HG006677"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,7,15]]},"abstract":"<jats:title>Abstract<\/jats:title>\n                  <jats:sec>\n                    <jats:title>Summary<\/jats:title>\n                    <jats:p>GenomeScope is an open-source web tool to rapidly estimate the overall characteristics of a genome, including genome size, heterozygosity rate and repeat content from unprocessed short reads. These features are essential for studying genome evolution, and help to choose parameters for downstream analysis. We demonstrate its accuracy on 324 simulated and 16 real datasets with a wide range in genome sizes, heterozygosity levels and error rates.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Availability and Implementation<\/jats:title>\n                    <jats:p>http:\/\/genomescope.org, https:\/\/github.com\/schatzlab\/genomescope.git.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Supplementary information<\/jats:title>\n                    <jats:p>Supplementary data are available at Bioinformatics online.<\/jats:p>\n                  <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btx153","type":"journal-article","created":{"date-parts":[[2017,3,17]],"date-time":"2017-03-17T08:13:54Z","timestamp":1489738434000},"page":"2202-2204","source":"Crossref","is-referenced-by-count":1764,"title":["GenomeScope: fast reference-free genome profiling from short reads"],"prefix":"10.1093","volume":"33","author":[{"given":"Gregory W","family":"Vurture","sequence":"first","affiliation":[{"name":"Simons Center for Quantitative Biology, Cold Spring Harbor Laboratory, Cold Spring Harbor, NY, USA"}]},{"given":"Fritz J","family":"Sedlazeck","sequence":"additional","affiliation":[{"name":"Departments of Computer Science and Biology, Johns Hopkins University, Baltimore, MD, USA"}]},{"given":"Maria","family":"Nattestad","sequence":"additional","affiliation":[{"name":"Simons Center for Quantitative Biology, Cold Spring Harbor Laboratory, Cold Spring Harbor, NY, USA"}]},{"given":"Charles J","family":"Underwood","sequence":"additional","affiliation":[{"name":"Simons Center for Quantitative Biology, Cold Spring Harbor Laboratory, Cold Spring Harbor, NY, USA"}]},{"given":"Han","family":"Fang","sequence":"additional","affiliation":[{"name":"Simons Center for Quantitative Biology, Cold Spring Harbor Laboratory, Cold Spring Harbor, NY, USA"},{"name":"Department of Applied Mathematics and Statistics, Stony Brook University, Stony Brook, NY, USA"}]},{"given":"James","family":"Gurtowski","sequence":"additional","affiliation":[{"name":"Simons Center for Quantitative Biology, Cold Spring Harbor Laboratory, Cold Spring Harbor, NY, USA"}]},{"given":"Michael C","family":"Schatz","sequence":"additional","affiliation":[{"name":"Simons Center for Quantitative Biology, Cold Spring Harbor Laboratory, Cold Spring Harbor, NY, USA"},{"name":"Departments of Computer Science and Biology, Johns Hopkins University, Baltimore, MD, USA"}]}],"member":"286","published-online":{"date-parts":[[2017,3,24]]},"reference":[{"key":"2023051601055581000_btx153-B1","doi-asserted-by":"crossref","first-page":"455","DOI":"10.1089\/cmb.2012.0021","article-title":"SPAdes: a new genome assembly algorithm and its applications to single-cell sequencing","volume":"19","author":"Bankevich","year":"2012","journal-title":"J. Comput. Biol"},{"key":"2023051601055581000_btx153-B2","doi-asserted-by":"crossref","DOI":"10.1002\/9780470316757","volume-title":"Nonlinear Regression Analysis and Its Applications","author":"Bates","year":"1988"},{"key":"2023051601055581000_btx153-B3","doi-asserted-by":"crossref","first-page":"31","DOI":"10.1093\/bioinformatics\/btt310","article-title":"Informed and automated k-mer size selection for genome assembly","volume":"30","author":"Chikhi","year":"2014","journal-title":"Bioinformatics"},{"key":"2023051601055581000_btx153-B4","doi-asserted-by":"crossref","first-page":"1513","DOI":"10.1073\/pnas.1017351108","article-title":"High-quality draft assemblies of mammalian genomes from massively parallel sequence data","volume":"108","author":"Gnerre","year":"2011","journal-title":"Proc. Natl. Acad. Sci. U. S. A"},{"key":"2023051601055581000_btx153-B5","doi-asserted-by":"crossref","first-page":"333","DOI":"10.1038\/nrg.2016.49","article-title":"Coming of age: ten years of next-generation sequencing technologies","volume":"17","author":"Goodwin","year":"2016","journal-title":"Nat. Rev. Genet"},{"key":"2023051601055581000_btx153-B6","doi-asserted-by":"crossref","first-page":"1384","DOI":"10.1101\/gr.170720.113","article-title":"Efficient de novo assembly of highly heterozygous genomes from whole-genome shotgun short reads","volume":"24","author":"Kajitani","year":"2014","journal-title":"Genome Res"},{"key":"2023051601055581000_btx153-B7","doi-asserted-by":"crossref","first-page":"R116.","DOI":"10.1186\/gb-2010-11-11-r116","article-title":"Quake: quality-aware detection and correction of sequencing errors","volume":"11","author":"Kelley","year":"2010","journal-title":"Genome Biol"},{"key":"2023051601055581000_btx153-B8","article-title":"Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM","author":"Li","year":"2013","journal-title":"ArXiv e-Prints"},{"key":"2023051601055581000_btx153-B9","doi-asserted-by":"crossref","first-page":"2078","DOI":"10.1093\/bioinformatics\/btp352","article-title":"The sequence alignment\/map format and SAMtools","volume":"25","author":"Li","year":"2009","journal-title":"Bioinformatics"},{"key":"2023051601055581000_btx153-B10","doi-asserted-by":"crossref","first-page":"1916","DOI":"10.1101\/gr.1251803","article-title":"Estimating the repeat structure and length of DNA sequences using L-tuples","volume":"13","author":"Li","year":"2003","journal-title":"Genome Res"},{"key":"2023051601055581000_btx153-B11","first-page":"2012","article-title":"Estimation of genomic characteristics by analyzing k-mer frequency in de novo genome projects","volume":"1308","author":"Liu","year":"2013","journal-title":"arXiv"},{"key":"2023051601055581000_btx153-B12","doi-asserted-by":"crossref","first-page":"764","DOI":"10.1093\/bioinformatics\/btr011","article-title":"A fast, lock-free approach for efficient parallel counting of occurrences of k-mers","volume":"27","author":"Marcais","year":"2011","journal-title":"Bioinformatics"},{"key":"2023051601055581000_btx153-B13","doi-asserted-by":"crossref","first-page":"3541","DOI":"10.1093\/bioinformatics\/btu713","article-title":"KmerStream: streaming algorithms for k-mer abundance estimation","volume":"30","author":"Melsted","year":"2014","journal-title":"Bioinformatics"},{"key":"2023051601055581000_btx153-B14","doi-asserted-by":"crossref","first-page":"e16327","DOI":"10.1371\/journal.pone.0016327","article-title":"ReadDepth: a parallel R package for detecting copy number alterations from short sequencing reads","volume":"6","author":"Miller","year":"2011","journal-title":"PLoS One"},{"key":"2023051601055581000_btx153-B15","doi-asserted-by":"crossref","first-page":"R55","DOI":"10.1186\/gb-2008-9-3-r55","article-title":"Genome assembly forensics: finding the elusive mis-assembly","volume":"9","author":"Phillippy","year":"2008","journal-title":"Genome Biol"},{"key":"2023051601055581000_btx153-B16","doi-asserted-by":"crossref","first-page":"1228","DOI":"10.1093\/bioinformatics\/btu023","article-title":"Exploring genome characteristics and sequence quality without a reference","volume":"30","author":"Simpson","year":"2014","journal-title":"Bioinformatics"},{"key":"2023051601055581000_btx153-B17","doi-asserted-by":"crossref","first-page":"235","DOI":"10.1186\/s13059-015-0803-1","article-title":"Teaser: Individualized benchmarking and optimization of read mapping results for NGS data","volume":"16","author":"Smolka","year":"2015","journal-title":"Genome Biol"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/33\/14\/2202\/50314582\/bioinformatics_33_14_2202.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/33\/14\/2202\/50314582\/bioinformatics_33_14_2202.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,15]],"date-time":"2023-05-15T21:06:28Z","timestamp":1684184788000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/33\/14\/2202\/3089939"}},"subtitle":[],"editor":[{"given":"Bonnie","family":"Berger","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2017,3,24]]},"references-count":17,"journal-issue":{"issue":"14","published-print":{"date-parts":[[2017,7,15]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btx153","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/075978","asserted-by":"object"}]},"ISSN":["1367-4803","1367-4811"],"issn-type":[{"value":"1367-4803","type":"print"},{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2017,7,15]]},"published":{"date-parts":[[2017,3,24]]}}}