{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,31]],"date-time":"2025-12-31T10:21:57Z","timestamp":1767176517674,"version":"build-2238731810"},"update-to":[{"DOI":"10.1371\/journal.pcbi.1008104","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2020,8,12]],"date-time":"2020-08-12T00:00:00Z","timestamp":1597190400000}}],"reference-count":54,"publisher":"Public Library of Science (PLoS)","issue":"7","license":[{"start":{"date-parts":[[2020,7,31]],"date-time":"2020-07-31T00:00:00Z","timestamp":1596153600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1008104","type":"journal-article","created":{"date-parts":[[2020,7,31]],"date-time":"2020-07-31T13:43:07Z","timestamp":1596202987000},"page":"e1008104","update-policy":"https:\/\/doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":35,"title":["Regional sequence expansion or collapse in heterozygous genome assemblies"],"prefix":"10.1371","volume":"16","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6777-8701","authenticated-orcid":true,"given":"Kathryn C.","family":"Asalone","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5352-4663","authenticated-orcid":true,"given":"Kara M.","family":"Ryan","sequence":"additional","affiliation":[]},{"given":"Maryam","family":"Yamadi","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6867-5958","authenticated-orcid":true,"given":"Annastelle L.","family":"Cohen","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5250-0582","authenticated-orcid":true,"given":"William G.","family":"Farmer","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4631-1106","authenticated-orcid":true,"given":"Deborah J.","family":"George","sequence":"additional","affiliation":[]},{"given":"Claudia","family":"Joppert","sequence":"additional","affiliation":[]},{"given":"Kaitlyn","family":"Kim","sequence":"additional","affiliation":[]},{"given":"Madeeha Froze","family":"Mughal","sequence":"additional","affiliation":[]},{"given":"Rana","family":"Said","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7459-8955","authenticated-orcid":true,"given":"Metin","family":"Toksoz-Exley","sequence":"additional","affiliation":[]},{"given":"Evgeny","family":"Bisk","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8042-7685","authenticated-orcid":true,"given":"John R.","family":"Bracht","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2020,7,31]]},"reference":[{"key":"pcbi.1008104.ref001","doi-asserted-by":"crossref","first-page":"333","DOI":"10.1038\/nmeth.1935","article-title":"De novo genome assembly: what every biologist should know","volume":"9","author":"M Baker","year":"2012","journal-title":"Nat Methods"},{"key":"pcbi.1008104.ref002","doi-asserted-by":"crossref","first-page":"3210","DOI":"10.1093\/bioinformatics\/btv351","article-title":"BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs","volume":"31","author":"FA Sim\u00e3o","year":"2015","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref003","doi-asserted-by":"crossref","first-page":"R47","DOI":"10.1186\/gb-2013-14-5-r47","article-title":"REAPR: a universal tool for genome assembly evaluation","volume":"14","author":"M Hunt","year":"2013","journal-title":"Genome Biol"},{"key":"pcbi.1008104.ref004","doi-asserted-by":"crossref","first-page":"157","DOI":"10.1038\/nrg3367","article-title":"Sequence assembly demystified","volume":"14","author":"N Nagarajan","year":"2013","journal-title":"Nat Rev Genet"},{"key":"pcbi.1008104.ref005","doi-asserted-by":"crossref","first-page":"329","DOI":"10.1038\/nrg3174","article-title":"A beginner\u2019s guide to eukaryotic genome annotation","volume":"13","author":"M Yandell","year":"2012","journal-title":"Nat Rev Genet"},{"key":"pcbi.1008104.ref006","doi-asserted-by":"crossref","first-page":"455","DOI":"10.1089\/cmb.2012.0021","article-title":"SPAdes: a new genome assembly algorithm and its applications to single-cell sequencing","volume":"19","author":"A Bankevich","year":"2012","journal-title":"J Comput Biol"},{"key":"pcbi.1008104.ref007","doi-asserted-by":"crossref","first-page":"1519","DOI":"10.1089\/cmb.2009.0238","article-title":"Ray: simultaneous assembly of reads from a mix of high-throughput sequencing technologies","volume":"17","author":"S Boisvert","year":"2010","journal-title":"J Comput Biol"},{"key":"pcbi.1008104.ref008","doi-asserted-by":"crossref","first-page":"22","DOI":"10.1186\/1748-7188-8-22","article-title":"Space-efficient and exact de Bruijn graph representation based on a Bloom filter","volume":"8","author":"R Chikhi","year":"2013","journal-title":"Algorithms Mol Biol"},{"key":"pcbi.1008104.ref009","doi-asserted-by":"crossref","first-page":"2717","DOI":"10.1093\/bioinformatics\/btu395","article-title":"Omega: an overlap-graph de novo assembler for metagenomics","volume":"30","author":"B Haider","year":"2014","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref010","doi-asserted-by":"crossref","first-page":"1384","DOI":"10.1101\/gr.170720.113","article-title":"Efficient de novo assembly of highly heterozygous genomes from whole-genome shotgun short reads","volume":"24","author":"R Kajitani","year":"2014","journal-title":"Genome Res"},{"key":"pcbi.1008104.ref011","doi-asserted-by":"crossref","first-page":"18","DOI":"10.1186\/2047-217X-1-18","article-title":"SOAPdenovo2: an empirically improved memory-efficient short-read de novo assembler","volume":"1","author":"R Luo","year":"2012","journal-title":"Gigascience"},{"key":"pcbi.1008104.ref012","doi-asserted-by":"crossref","first-page":"2270","DOI":"10.1101\/gr.141515.112","article-title":"Finished bacterial genomes from shotgun sequence data","volume":"22","author":"FJ Ribeiro","year":"2012","journal-title":"Genome Res"},{"key":"pcbi.1008104.ref013","doi-asserted-by":"crossref","first-page":"1117","DOI":"10.1101\/gr.089532.108","article-title":"ABySS: a parallel assembler for short read sequence data","volume":"19","author":"JT Simpson","year":"2009","journal-title":"Genome Res"},{"key":"pcbi.1008104.ref014","doi-asserted-by":"crossref","first-page":"627","DOI":"10.1038\/nrg3933","article-title":"Genetic variation and the de novo assembly of human genomes","volume":"16","author":"MJP Chaisson","year":"2015","journal-title":"Nat Rev Genet"},{"key":"pcbi.1008104.ref015","doi-asserted-by":"crossref","DOI":"10.12688\/f1000research.13598.1","article-title":"Ten steps to get started in Genome Assembly and Annotation","volume":"7","author":"V Dominguez Del Angel","year":"2018","journal-title":"F1000Res"},{"key":"pcbi.1008104.ref016","doi-asserted-by":"crossref","first-page":"R55","DOI":"10.1186\/gb-2008-9-3-r55","article-title":"Genome assembly forensics: finding the elusive mis-assembly","volume":"9","author":"AM Phillippy","year":"2008","journal-title":"Genome Biol"},{"key":"pcbi.1008104.ref017","doi-asserted-by":"crossref","first-page":"e113","DOI":"10.1093\/nar\/gkw294","article-title":"Redundans: an assembly pipeline for highly heterozygous genomes","volume":"44","author":"LP Pryszcz","year":"2016","journal-title":"Nucleic Acids Res"},{"key":"pcbi.1008104.ref018","doi-asserted-by":"crossref","first-page":"e62856","DOI":"10.1371\/journal.pone.0062856","article-title":"Effects of GC bias in next-generation-sequencing data on de novo genome assembly","volume":"8","author":"Y-C Chen","year":"2013","journal-title":"PLoS One"},{"key":"pcbi.1008104.ref019","doi-asserted-by":"crossref","first-page":"2","DOI":"10.1016\/j.atg.2016.06.001","article-title":"Standardization and quality management in next-generation sequencing","volume":"10","author":"C Endrullat","year":"2016","journal-title":"Appl Transl Genom"},{"key":"pcbi.1008104.ref020","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1111\/1755-0998.12712","article-title":"Assembly and RNA-free annotation of highly heterozygous genomes: The case of the thick-billed murre (Uria lomvia)","author":"A Tigano","year":"2018","journal-title":"Molecular Ecology Resources"},{"key":"pcbi.1008104.ref021","doi-asserted-by":"crossref","first-page":"6227","DOI":"10.1093\/nar\/gkm688","article-title":"DNA sequencing: bench to bedside and beyond","volume":"35","author":"CA 3rd Hutchison","year":"2007","journal-title":"Nucleic Acids Res"},{"key":"pcbi.1008104.ref022","doi-asserted-by":"crossref","first-page":"255","DOI":"10.1016\/j.ygeno.2008.07.001","article-title":"Applications of next-generation sequencing technologies in functional genomics","author":"O Morozova","year":"2008","journal-title":"Genomics"},{"key":"pcbi.1008104.ref023","doi-asserted-by":"crossref","first-page":"413","DOI":"10.1007\/s13353-011-0057-x","article-title":"Sequencing technologies and genome sequencing","volume":"52","author":"CS Pareek","year":"2011","journal-title":"J Appl Genet"},{"key":"pcbi.1008104.ref024","doi-asserted-by":"crossref","first-page":"16","DOI":"10.1038\/nmeth1156","article-title":"Next-generation sequencing transforms today\u2019s biology","volume":"5","author":"SC Schuster","year":"2008","journal-title":"Nat Methods"},{"key":"pcbi.1008104.ref025","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1038\/nature09974","article-title":"Nematoda from the terrestrial deep subsurface of South Africa","volume":"474","author":"G Borgonie","year":"2011","journal-title":"Nature"},{"key":"pcbi.1008104.ref026","doi-asserted-by":"crossref","first-page":"5268","DOI":"10.1038\/s41467-019-13245-8","article-title":"The genome of a subterrestrial nematode reveals adaptations to heat","volume":"10","author":"DJ Weinstein","year":"2019","journal-title":"Nat Commun"},{"key":"pcbi.1008104.ref027","doi-asserted-by":"crossref","first-page":"2202","DOI":"10.1093\/bioinformatics\/btx153","article-title":"GenomeScope: fast reference-free genome profiling from short reads","volume":"33","author":"GW Vurture","year":"2017","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref028","doi-asserted-by":"crossref","first-page":"487","DOI":"10.1101\/gr.113985.110","article-title":"Adaptive seeds tame genomic sequence comparison","volume":"21","author":"SM Kie\u0142basa","year":"2011","journal-title":"Genome Res"},{"key":"pcbi.1008104.ref029","doi-asserted-by":"crossref","first-page":"188","DOI":"10.1101\/gr.6743907","article-title":"MAKER: an easy-to-use annotation pipeline designed for emerging model organism genomes","volume":"18","author":"BL Cantarel","year":"2008","journal-title":"Genome Res"},{"key":"pcbi.1008104.ref030","doi-asserted-by":"crossref","first-page":"2178","DOI":"10.1101\/gr.1224503","article-title":"OrthoMCL: identification of ortholog groups for eukaryotic genomes","volume":"13","author":"L Li","year":"2003","journal-title":"Genome Res"},{"key":"pcbi.1008104.ref031","doi-asserted-by":"crossref","first-page":"265","DOI":"10.1101\/gr.097261.109","article-title":"De novo assembly of human genomes with massively parallel short read sequencing","volume":"20","author":"R Li","year":"2010","journal-title":"Genome Res"},{"key":"pcbi.1008104.ref032","doi-asserted-by":"crossref","first-page":"56","DOI":"10.1093\/bib\/bbs015","article-title":"A survey of error-correction methods for next-generation sequencing","volume":"14","author":"X Yang","year":"2013","journal-title":"Brief Bioinform"},{"key":"pcbi.1008104.ref033","unstructured":"Smit AFA, Hubley R. RepeatModeler Open-1.0. Available from http:\/\/www repeatmasker org. 2008."},{"key":"pcbi.1008104.ref034","doi-asserted-by":"crossref","first-page":"543","DOI":"10.1093\/molbev\/msx319","article-title":"BUSCO Applications from Quality Assessments to Gene Prediction and Phylogenomics","volume":"35","author":"RM Waterhouse","year":"2018","journal-title":"Mol Biol Evol"},{"key":"pcbi.1008104.ref035","doi-asserted-by":"crossref","first-page":"1494","DOI":"10.1038\/nprot.2013.084","article-title":"De novo transcript sequence reconstruction from RNA-seq using the Trinity platform for reference generation and analysis","volume":"8","author":"BJ Haas","year":"2013","journal-title":"Nat Protoc"},{"key":"pcbi.1008104.ref036","doi-asserted-by":"crossref","first-page":"2114","DOI":"10.1093\/bioinformatics\/btu170","article-title":"Trimmomatic: a flexible trimmer for Illumina sequence data","volume":"30","author":"AM Bolger","year":"2014","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref037","first-page":"2012","article-title":"The C. elegans Sequencing Consortium. Genome Sequence of the Nematode C. elegans: A Platform for Investigating Biology","author":"Consortium TCES","year":"1998","journal-title":"Science"},{"key":"pcbi.1008104.ref038","doi-asserted-by":"crossref","first-page":"W309","DOI":"10.1093\/nar\/gkh379","article-title":"AUGUSTUS: a web server for gene finding in eukaryotes","volume":"32","author":"M Stanke","year":"2004","journal-title":"Nucleic Acids Res"},{"key":"pcbi.1008104.ref039","doi-asserted-by":"crossref","first-page":"926","DOI":"10.1093\/bioinformatics\/btw742","article-title":"Training alignment parameters for arbitrary sequencers with LAST-TRAIN","volume":"33","author":"M Hamada","year":"2017","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref040","doi-asserted-by":"crossref","first-page":"80","DOI":"10.1186\/1471-2105-11-80","article-title":"Parameters for accurate genome alignment","volume":"11","author":"MC Frith","year":"2010","journal-title":"BMC Bioinformatics"},{"key":"pcbi.1008104.ref041","volume-title":"MySQL Reference Manual: Documentation from the Source","author":"M Widenius","year":"2002"},{"key":"pcbi.1008104.ref042","doi-asserted-by":"crossref","first-page":"1575","DOI":"10.1093\/nar\/30.7.1575","article-title":"An efficient algorithm for large-scale detection of protein families","volume":"30","author":"AJ Enright","year":"2002","journal-title":"Nucleic Acids Res"},{"key":"pcbi.1008104.ref043","unstructured":"A:orthomcl with local mysql server on linux server, complete install. [cited 21 Jan 2020]. Available: https:\/\/www.biostars.org\/p\/120773\/"},{"key":"pcbi.1008104.ref044","doi-asserted-by":"crossref","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","article-title":"Basic local alignment search tool","volume":"215","author":"SF Altschul","year":"1990","journal-title":"J Mol Biol"},{"key":"pcbi.1008104.ref045","volume-title":"RStudio: integrated development for R","author":"Team R","year":"2015"},{"key":"pcbi.1008104.ref046","doi-asserted-by":"crossref","first-page":"1647","DOI":"10.1093\/bioinformatics\/bts199","article-title":"Geneious Basic: an integrated and extendable desktop software platform for the organization and analysis of sequence data","volume":"28","author":"M Kearse","year":"2012","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref047","doi-asserted-by":"crossref","first-page":"1792","DOI":"10.1093\/nar\/gkh340","article-title":"MUSCLE: multiple sequence alignment with high accuracy and high throughput","volume":"32","author":"RC Edgar","year":"2004","journal-title":"Nucleic Acids Res"},{"key":"pcbi.1008104.ref048","doi-asserted-by":"crossref","first-page":"696","DOI":"10.1080\/10635150390235520","article-title":"A simple, fast, and accurate algorithm to estimate large phylogenies by maximum likelihood","volume":"52","author":"S Guindon","year":"2003","journal-title":"Syst Biol"},{"key":"pcbi.1008104.ref049","doi-asserted-by":"crossref","first-page":"2129","DOI":"10.1101\/gr.772403","article-title":"PANTHER: a library of protein families and subfamilies indexed by function","volume":"13","author":"PD Thomas","year":"2003","journal-title":"Genome Res"},{"key":"pcbi.1008104.ref050","doi-asserted-by":"crossref","first-page":"D377","DOI":"10.1093\/nar\/gks1118","article-title":"PANTHER in 2013: modeling the evolution of gene function, and other gene attributes, in the context of phylogenetic trees","volume":"41","author":"H Mi","year":"2013","journal-title":"Nucleic Acids Res"},{"key":"pcbi.1008104.ref051","doi-asserted-by":"crossref","first-page":"1754","DOI":"10.1093\/bioinformatics\/btp324","article-title":"Fast and accurate short read alignment with Burrows\u2013Wheeler transform","volume":"25","author":"H Li","year":"2009","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref052","doi-asserted-by":"crossref","first-page":"2078","DOI":"10.1093\/bioinformatics\/btp352","article-title":"The Sequence Alignment\/Map format and SAMtools","volume":"25","author":"H Li","year":"2009","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref053","doi-asserted-by":"crossref","first-page":"2987","DOI":"10.1093\/bioinformatics\/btr509","article-title":"A statistical framework for SNP calling, mutation discovery, association mapping and population genetical parameter estimation from sequencing data","volume":"27","author":"H Li","year":"2011","journal-title":"Bioinformatics"},{"key":"pcbi.1008104.ref054","doi-asserted-by":"crossref","first-page":"764","DOI":"10.1093\/bioinformatics\/btr011","article-title":"A fast, lock-free approach for efficient parallel counting of occurrences of k-mers","volume":"27","author":"G Mar\u00e7ais","year":"2011","journal-title":"Bioinformatics"}],"updated-by":[{"DOI":"10.1371\/journal.pcbi.1008104","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2020,8,12]],"date-time":"2020-08-12T00:00:00Z","timestamp":1597190400000}}],"container-title":["PLOS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1008104","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,10,5]],"date-time":"2023-10-05T00:25:31Z","timestamp":1696465531000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1008104"}},"subtitle":[],"editor":[{"given":"Christos A.","family":"Ouzounis","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2020,7,31]]},"references-count":54,"journal-issue":{"issue":"7","published-online":{"date-parts":[[2020,7,31]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1008104","relation":{},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,7,31]]}}}