{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,28]],"date-time":"2026-02-28T05:03:33Z","timestamp":1772255013526,"version":"3.50.1"},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2016,4,5]],"date-time":"2016-04-05T00:00:00Z","timestamp":1459814400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BioData Mining"],"published-print":{"date-parts":[[2016,12]]},"DOI":"10.1186\/s13040-016-0090-8","type":"journal-article","created":{"date-parts":[[2016,4,5]],"date-time":"2016-04-05T04:10:30Z","timestamp":1459829430000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":21,"title":["Distinguishing highly similar gene isoforms with a clustering-based bioinformatics analysis of PacBio single-molecule long reads"],"prefix":"10.1186","volume":"9","author":[{"given":"Ma","family":"Liang","sequence":"first","affiliation":[]},{"given":"Castle","family":"Raley","sequence":"additional","affiliation":[]},{"given":"Xin","family":"Zheng","sequence":"additional","affiliation":[]},{"given":"Geetha","family":"Kutty","sequence":"additional","affiliation":[]},{"given":"Emile","family":"Gogineni","sequence":"additional","affiliation":[]},{"given":"Brad T.","family":"Sherman","sequence":"additional","affiliation":[]},{"given":"Qiang","family":"Sun","sequence":"additional","affiliation":[]},{"given":"Xiongfong","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Thomas","family":"Skelly","sequence":"additional","affiliation":[]},{"given":"Kristine","family":"Jones","sequence":"additional","affiliation":[]},{"given":"Robert","family":"Stephens","sequence":"additional","affiliation":[]},{"given":"Bin","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"William","family":"Lau","sequence":"additional","affiliation":[]},{"given":"Calvin","family":"Johnson","sequence":"additional","affiliation":[]},{"given":"Tomozumi","family":"Imamichi","sequence":"additional","affiliation":[]},{"given":"Minkang","family":"Jiang","sequence":"additional","affiliation":[]},{"given":"Robin","family":"Dewar","sequence":"additional","affiliation":[]},{"given":"Richard A.","family":"Lempicki","sequence":"additional","affiliation":[]},{"given":"Bao","family":"Tran","sequence":"additional","affiliation":[]},{"given":"Joseph A.","family":"Kovacs","sequence":"additional","affiliation":[]},{"given":"Da Wei","family":"Huang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,4,5]]},"reference":[{"issue":"1","key":"90_CR1","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1038\/nbt.2024","volume":"30","author":"TR Mercer","year":"2012","unstructured":"Mercer TR, Gerhardt DJ, Dinger ME, Crawford J, Trapnell C, Jeddeloh JA, et al. Targeted RNA sequencing reveals the deep complexity of the human transcriptome. Nat Biotechnol. 2012;30(1):99\u2013104. doi: 10.1038\/nbt.2024 .","journal-title":"Nat Biotechnol"},{"issue":"12","key":"90_CR2","doi-asserted-by":"publisher","first-page":"1413","DOI":"10.1038\/ng.259","volume":"40","author":"Q Pan","year":"2008","unstructured":"Pan Q, Shai O, Lee LJ, Frey BJ, Blencowe BJ. Deep surveying of alternative splicing complexity in the human transcriptome by high-throughput sequencing. Nat Genet. 2008;40(12):1413\u20135. doi: 10.1038\/ng.259 .","journal-title":"Nat Genet"},{"issue":"11","key":"90_CR3","doi-asserted-by":"publisher","first-page":"1009","DOI":"10.1038\/nbt.2705","volume":"31","author":"D Sharon","year":"2013","unstructured":"Sharon D, Tilgner H, Grubert F, Snyder M. A single-molecule long-read survey of the human transcriptome. Nat Biotechnol. 2013;31(11):1009\u201314. doi: 10.1038\/nbt.2705 .","journal-title":"Nat Biotechnol"},{"issue":"7221","key":"90_CR4","doi-asserted-by":"publisher","first-page":"470","DOI":"10.1038\/nature07509","volume":"456","author":"ET Wang","year":"2008","unstructured":"Wang ET, Sandberg R, Luo S, Khrebtukova I, Zhang L, Mayr C, et al. Alternative isoform regulation in human tissue transcriptomes. Nature. 2008;456(7221):470\u20136. doi: 10.1038\/nature07509 .","journal-title":"Nature"},{"key":"90_CR5","doi-asserted-by":"publisher","first-page":"753675","DOI":"10.1155\/2010\/753675","volume":"2010","author":"W Guo","year":"2010","unstructured":"Guo W, Bharmal SJ, Esbona K, Greaser ML. Titin diversity--alternative splicing gone wild. J Biomed Biotechnol. 2010;2010:753675. doi: 10.1155\/2010\/753675 .","journal-title":"J Biomed Biotechnol"},{"issue":"5733","key":"90_CR6","doi-asserted-by":"publisher","first-page":"416","DOI":"10.1126\/science.1112642","volume":"309","author":"M Berriman","year":"2005","unstructured":"Berriman M, Ghedin E, Hertz-Fowler C, Blandin G, Renauld H, Bartholomeu DC, et al. The genome of the African trypanosome Trypanosoma brucei. Science. 2005;309(5733):416\u201322. doi: 10.1126\/science.1112642 .","journal-title":"Science"},{"issue":"5846","key":"90_CR7","doi-asserted-by":"publisher","first-page":"1921","DOI":"10.1126\/science.1143837","volume":"317","author":"HG Morrison","year":"2007","unstructured":"Morrison HG, McArthur AG, Gillin FD, Aley SB, Adam RD, Olsen GJ, et al. Genomic minimalism in the early diverging intestinal parasite Giardia lamblia. Science. 2007;317(5846):1921\u20136. doi: 10.1126\/science.1143837 .","journal-title":"Science"},{"issue":"6906","key":"90_CR8","doi-asserted-by":"publisher","first-page":"498","DOI":"10.1038\/nature01097","volume":"419","author":"MJ Gardner","year":"2002","unstructured":"Gardner MJ, Hall N, Fung E, White O, Berriman M, Hyman RW, et al. Genome sequence of the human malaria parasite Plasmodium falciparum. Nature. 2002;419(6906):498\u2013511. doi: 10.1038\/nature01097 .","journal-title":"Nature"},{"issue":"4","key":"90_CR9","doi-asserted-by":"publisher","first-page":"1589","DOI":"10.1534\/genetics.105.040733","volume":"170","author":"SP Keely","year":"2005","unstructured":"Keely SP, Renauld H, Wakefield AE, Cushion MT, Smulian AG, Fosker N, et al. Gene arrays at Pneumocystis carinii telomeres. Genetics. 2005;170(4):1589\u2013600. doi: 10.1534\/genetics.105.040733 .","journal-title":"Genetics"},{"key":"90_CR10","doi-asserted-by":"publisher","first-page":"367","DOI":"10.1186\/1471-2164-10-367","volume":"10","author":"SP Keely","year":"2009","unstructured":"Keely SP, Stringer JR. Complexity of the MSG gene family of Pneumocystis carinii. BMC Genomics. 2009;10:367. doi: 10.1186\/1471-2164-10-367 .","journal-title":"BMC Genomics"},{"issue":"1","key":"90_CR11","doi-asserted-by":"publisher","first-page":"8","DOI":"10.1111\/j.1550-7408.2006.00225.x","volume":"54","author":"JR Stringer","year":"2007","unstructured":"Stringer JR. Antigenic variation in Pneumocystis. J Eukaryot Microbiol. 2007;54(1):8\u201313. doi: 10.1111\/j.1550-7408.2006.00225.x .","journal-title":"J Eukaryot Microbiol"},{"issue":"7","key":"90_CR12","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1038\/nrmicro2145","volume":"7","author":"KW Deitsch","year":"2009","unstructured":"Deitsch KW, Lukehart SA, Stringer JR. Common strategies for antigenic variation by bacterial, fungal and protozoan pathogens. Nat Rev Microbiol. 2009;7(7):493\u2013503. doi: 10.1038\/nrmicro2145 .","journal-title":"Nat Rev Microbiol"},{"issue":"10","key":"90_CR13","doi-asserted-by":"publisher","first-page":"1932","DOI":"10.1016\/j.bbadis.2014.06.015","volume":"1842","author":"HP Buermans","year":"2014","unstructured":"Buermans HP, den Dunnen JT. Next generation sequencing technology: Advances and applications. Biochim Biophys Acta. 2014;1842(10):1932\u201341. doi: 10.1016\/j.bbadis.2014.06.015 .","journal-title":"Biochim Biophys Acta"},{"issue":"1","key":"90_CR14","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1038\/nrg2626","volume":"11","author":"ML Metzker","year":"2010","unstructured":"Metzker ML. Sequencing technologies - the next generation. Nat Rev Genet. 2010;11(1):31\u201346. doi: 10.1038\/nrg2626 .","journal-title":"Nat Rev Genet"},{"issue":"6","key":"90_CR15","doi-asserted-by":"publisher","first-page":"315","DOI":"10.1016\/j.ygeno.2010.03.001","volume":"95","author":"JR Miller","year":"2010","unstructured":"Miller JR, Koren S, Sutton G. Assembly algorithms for next-generation sequencing data. Genomics. 2010;95(6):315\u201327. doi: 10.1016\/j.ygeno.2010.03.001 .","journal-title":"Genomics"},{"issue":"1","key":"90_CR16","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1038\/nrg3117","volume":"13","author":"TJ Treangen","year":"2012","unstructured":"Treangen TJ, Salzberg SL. Repetitive DNA and next-generation sequencing: computational challenges and solutions. Nat Rev Genet. 2012;13(1):36\u201346. doi: 10.1038\/nrg3117 .","journal-title":"Nat Rev Genet"},{"key":"90_CR17","doi-asserted-by":"publisher","first-page":"2837","DOI":"10.1038\/srep02837","volume":"3","author":"MC Prosperi","year":"2013","unstructured":"Prosperi MC, Yin L, Nolan DJ, Lowe AD, Goodenow MM, Salemi M. Empirical validation of viral quasispecies assembly algorithms: state-of-the-art and challenges. Sci Rep. 2013;3:2837. doi: 10.1038\/srep02837 .","journal-title":"Sci Rep"},{"issue":"3","key":"90_CR18","doi-asserted-by":"publisher","first-page":"431","DOI":"10.1093\/bib\/bbs081","volume":"15","author":"M Schirmer","year":"2014","unstructured":"Schirmer M, Sloan WT, Quince C. Benchmarking of viral haplotype reconstruction programmes: an overview of the capacities and limitations of currently available programmes. Brief Bioinform. 2014;15(3):431\u201342. doi: 10.1093\/bib\/bbs081 .","journal-title":"Brief Bioinform"},{"key":"90_CR19","doi-asserted-by":"publisher","first-page":"475","DOI":"10.1186\/1471-2164-13-475","volume":"13","author":"X Yang","year":"2012","unstructured":"Yang X, Charlebois P, Gnerre S, Coole MG, Lennon NJ, Levin JZ, et al. De novo assembly of highly diverse viral populations. BMC Genomics. 2012;13:475. doi: 10.1186\/1471-2164-13-475 .","journal-title":"BMC Genomics"},{"issue":"24","key":"90_CR20","doi-asserted-by":"publisher","first-page":"2578","DOI":"10.1001\/jama.2009.880","volume":"301","author":"JA Kovacs","year":"2009","unstructured":"Kovacs JA, Masur H. Evolving health effects of Pneumocystis: one hundred years of progress in diagnosis and treatment. JAMA. 2009;301(24):2578\u201385. doi: 10.1001\/jama.2009.880 .","journal-title":"JAMA"},{"key":"90_CR21","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-12-801238-3.05473-8","author":"L Ma","year":"2015","unstructured":"Ma L. Pneumocystis: An atypical fungal pathogen. Ref Module Biomed Sci Elsevier. 2015. doi: 10.1016\/B978-0-12-801238-3.05473-8 .","journal-title":"Ref Module Biomed Sci Elsevier"},{"issue":"5","key":"90_CR22","doi-asserted-by":"publisher","first-page":"741","DOI":"10.1086\/590433","volume":"198","author":"G Kutty","year":"2008","unstructured":"Kutty G, Maldarelli F, Achaz G, Kovacs JA. Variation in the major surface glycoprotein genes in Pneumocystis jirovecii. J Infect Dis. 2008;198(5):741\u20139. doi: 10.1086\/590433 .","journal-title":"J Infect Dis"},{"issue":"9","key":"90_CR23","doi-asserted-by":"crossref","first-page":"4268","DOI":"10.1128\/IAI.66.9.4268-4273.1998","volume":"66","author":"Q Mei","year":"1998","unstructured":"Mei Q, Turner RE, Sorial V, Klivington D, Angus CW, Kovacs JA. Characterization of major surface glycoprotein genes of human Pneumocystis carinii and high-level expression of a conserved region. Infect Immun. 1998;66(9):4268\u201373.","journal-title":"Infect Immun"},{"issue":"Suppl 1","key":"90_CR24","doi-asserted-by":"publisher","first-page":"S89","DOI":"10.1111\/j.1550-7408.2006.00184.x","volume":"53","author":"BE Slaven","year":"2006","unstructured":"Slaven BE, Meller J, Porollo A, Sesterhenn T, Smulian AG, Cushion MT. Draft assembly and annotation of the Pneumocystis carinii genome. J Eukaryot Microbiol. 2006;53 Suppl 1:S89\u201391. doi: 10.1111\/j.1550-7408.2006.00184.x .","journal-title":"J Eukaryot Microbiol"},{"issue":"1","key":"90_CR25","doi-asserted-by":"publisher","first-page":"e00428","DOI":"10.1128\/mBio.00428-12","volume":"4","author":"OH Cisse","year":"2012","unstructured":"Cisse OH, Pagni M, Hauser PM. De novo assembly of the Pneumocystis jirovecii genome from a single bronchoalveolar lavage fluid specimen from a patient. mBio. 2012;4(1):e00428\u201312. doi: 10.1128\/mBio.00428-12 .","journal-title":"mBio"},{"issue":"5910","key":"90_CR26","doi-asserted-by":"publisher","first-page":"133","DOI":"10.1126\/science.1162986","volume":"323","author":"J Eid","year":"2009","unstructured":"Eid J, Fehr A, Gray J, Luong K, Lyle J, Otto G, et al. Real-time DNA sequencing from single polymerase molecules. Science. 2009;323(5910):133\u20138. doi: 10.1126\/science.1162986 .","journal-title":"Science"},{"issue":"7","key":"90_CR27","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1186\/gb-2013-14-6-405","volume":"14","author":"RJ Roberts","year":"2013","unstructured":"Roberts RJ, Carneiro MO, Schatz MC. The advantages of SMRT sequencing. Genome Biol. 2013;14(7):405. doi: 10.1186\/gb-2013-14-6-405 .","journal-title":"Genome Biol"},{"key":"90_CR28","doi-asserted-by":"publisher","first-page":"96","DOI":"10.1186\/1471-2164-15-96","volume":"15","author":"KG Frey","year":"2014","unstructured":"Frey KG, Herrera-Galeano JE, Redden CL, Luu TV, Servetas SL, Mateczun AJ, et al. Comparison of three next-generation sequencing platforms for metagenomic sequencing and identification of pathogens in blood. BMC Genomics. 2014;15:96. doi: 10.1186\/1471-2164-15-96 .","journal-title":"BMC Genomics"},{"issue":"3","key":"90_CR29","doi-asserted-by":"publisher","first-page":"136","DOI":"10.4172\/2153-0602.1000136","volume":"4","author":"X Jiao","year":"2013","unstructured":"Jiao X, Zheng X, Ma L, Kutty G, Gogineni E, Sun Q, et al. A benchmark study on error assessment and quality control of CCS reads derived from the PacBio RS. J Data Mining Genomics Proteomics. 2013;4(3):136. doi: 10.4172\/2153-0602.1000136 .","journal-title":"J Data Mining Genomics Proteomics"},{"issue":"19","key":"90_CR30","doi-asserted-by":"publisher","first-page":"2460","DOI":"10.1093\/bioinformatics\/btq461","volume":"26","author":"RC Edgar","year":"2010","unstructured":"Edgar RC. Search and clustering orders of magnitude faster than BLAST. Bioinformatics. 2010;26(19):2460\u20131. doi: 10.1093\/bioinformatics\/btq461 .","journal-title":"Bioinformatics"},{"key":"90_CR31","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1186\/1471-2105-5-113","volume":"5","author":"RC Edgar","year":"2004","unstructured":"Edgar RC. MUSCLE: a multiple sequence alignment method with reduced time and space complexity. BMC Bioinformatics. 2004;5:113. doi: 10.1186\/1471-2105-5-113 .","journal-title":"BMC Bioinformatics"},{"key":"90_CR32","doi-asserted-by":"publisher","first-page":"10740","DOI":"10.1038\/ncomms10740","volume":"7","author":"L Ma","year":"2016","unstructured":"Ma L, Chen Z, Huang DW, Kutty G, Ishihara M, Wang H, et al. Genome analysis of three Pneumocystis species reveals adaptation mechanisms to life exclusively in mammalian hosts. Nat Commun. 2016;7:10740. doi: 10.1038\/ncomms10740 .","journal-title":"Nat Commun"},{"issue":"1","key":"90_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/2042-5783-4-1","volume":"4","author":"K McElroy","year":"2014","unstructured":"McElroy K, Thomas T, Luciani F. Deep sequencing of evolving pathogen populations: applications, errors, and bioinformatic solutions. Microb Inform Exp. 2014;4(1):1. doi: 10.1186\/2042-5783-4-1 .","journal-title":"Microb Inform Exp"},{"issue":"10","key":"90_CR34","doi-asserted-by":"publisher","first-page":"1437","DOI":"10.1093\/cid\/cis217","volume":"54","author":"M Sassi","year":"2012","unstructured":"Sassi M, Ripamonti C, Mueller NJ, Yazaki H, Kutty G, Ma L, et al. Outbreaks of Pneumocystis pneumonia in 2 renal transplant centers linked to a single strain of Pneumocystis: implications for transmission and virulence. Clin Infect Dis. 2012;54(10):1437\u201344. doi: 10.1093\/cid\/cis217 .","journal-title":"Clin Infect Dis"},{"issue":"8","key":"90_CR35","doi-asserted-by":"publisher","first-page":"R73","DOI":"10.1186\/gb-2011-12-8-r73","volume":"12","author":"A Melnikov","year":"2011","unstructured":"Melnikov A, Galinsky K, Rogov P, Fennell T, Van Tyne D, Russ C, et al. Hybrid selection for sequencing pathogen genomes from clinical samples. Genome Biol. 2011;12(8):R73. doi: 10.1186\/gb-2011-12-8-r73 .","journal-title":"Genome Biol"}],"container-title":["BioData Mining"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-016-0090-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13040-016-0090-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-016-0090-8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-016-0090-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,9,18]],"date-time":"2020-09-18T04:52:28Z","timestamp":1600404748000},"score":1,"resource":{"primary":{"URL":"http:\/\/biodatamining.biomedcentral.com\/articles\/10.1186\/s13040-016-0090-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,4,5]]},"references-count":35,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2016,12]]}},"alternative-id":["90"],"URL":"https:\/\/doi.org\/10.1186\/s13040-016-0090-8","relation":{},"ISSN":["1756-0381"],"issn-type":[{"value":"1756-0381","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016,4,5]]},"article-number":"13"}}