{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,3,13]],"date-time":"2024-03-13T13:49:22Z","timestamp":1710337762634},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2015,1,28]],"date-time":"2015-01-28T00:00:00Z","timestamp":1422403200000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Algorithms Mol Biol"],"published-print":{"date-parts":[[2015,12]]},"DOI":"10.1186\/s13015-014-0029-x","type":"journal-article","created":{"date-parts":[[2015,1,27]],"date-time":"2015-01-27T11:28:09Z","timestamp":1422358089000},"update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":22,"title":["Clustering of reads with alignment-free measures and quality values"],"prefix":"10.1186","volume":"10","author":[{"given":"Matteo","family":"Comin","sequence":"first","affiliation":[]},{"given":"Andrea","family":"Leoni","sequence":"additional","affiliation":[]},{"given":"Michele","family":"Schimd","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,1,28]]},"reference":[{"key":"29_CR1","doi-asserted-by":"crossref","first-page":"419","DOI":"10.1038\/nrmicro1901","volume":"6","author":"D Medini","year":"2008","unstructured":"Medini D, Serruto D, Parkhill J, Relman DA, Donati C, Moxon R, et al. Microbiology in the post-genomic era. Nat Rev Microbiol. 2008; 6:419\u201330.","journal-title":"Nat Rev Microbiol."},{"key":"29_CR2","doi-asserted-by":"publisher","first-page":"5221","DOI":"10.1093\/nar\/gkn488","volume":"36","author":"R Jothi","year":"2008","unstructured":"Jothi R, Cuddapah S, Barski A, Cui K, Zhao K. Genome-wide identification of in vivo protein\u2013dna binding sites from chip-seq data. Nucleic Acids Res. 2008; 36:5221\u201331.","journal-title":"Nucleic Acids Res."},{"key":"29_CR3","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","volume":"215","author":"SF Altschul","year":"1990","unstructured":"Altschul SF, Gish W, Miller W, Myers EW, Lipman DJ. Basic local alignment search tool. J Mol Biol. 1990; 215:403\u201310.","journal-title":"J Mol Biol."},{"key":"29_CR4","doi-asserted-by":"publisher","first-page":"2677","DOI":"10.1073\/pnas.0813249106","volume":"106","author":"GE Sims","year":"2009","unstructured":"Sims GE, Jun S-R, Wu GA, Kim S-H. Alignment-free genome comparison with feature frequency profiles (ffp) and optimal resolutions. Proc Nat Acad Sci. 2009; 106:2677\u201382.","journal-title":"Proc Nat Acad Sci."},{"key":"29_CR5","doi-asserted-by":"crossref","unstructured":"Comin M, Verzotto D. Whole-genome phylogeny by virtue of unic subwords. In: 23rd international workshop on Database and EXpert systems Applications (DEXA 2012): 2012. p. 190\u2013194.","DOI":"10.1109\/DEXA.2012.10"},{"issue":"1","key":"29_CR6","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1186\/1748-7188-7-34","volume":"7","author":"M Comin","year":"2012","unstructured":"Comin M, Verzotto D. Alignment-free phylogeny of whole genomes using underlying subwords. Algorithms Mol Biol. 2012; 7(1):34.","journal-title":"Algorithms Mol Biol."},{"issue":"2","key":"29_CR7","doi-asserted-by":"publisher","first-page":"64","DOI":"10.1089\/cmb.2012.0228","volume":"20","author":"K Song","year":"2013","unstructured":"Song K, Ren J, Zhai Z, Liu X, Deng M, Sun F. Alignment-free sequence comparison based on next-generation sequencing reads. J Comput Biol. 2013; 20(2):64\u201379.","journal-title":"J Comput Biol."},{"issue":"Suppl 9","key":"29_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1471-2105-15-S9-S1","volume":"15","author":"M Comin","year":"2014","unstructured":"Comin M, Schimd M. Assembly-free genome comparison based on next-generation sequencing reads and variable length patterns. BMC Bioinformatics. 2014; 15(Suppl 9):1.","journal-title":"BMC Bioinformatics."},{"issue":"4","key":"29_CR9","doi-asserted-by":"publisher","first-page":"513","DOI":"10.1093\/bioinformatics\/btg005","volume":"19","author":"S Vinga","year":"2003","unstructured":"Vinga S, Almeida J. Alignment-free sequence comparison\u2013a review. Bioinformatics. 2003; 19(4):513\u201323.","journal-title":"Bioinformatics."},{"issue":"1","key":"29_CR10","doi-asserted-by":"publisher","first-page":"394","DOI":"10.1186\/1471-2105-9-394","volume":"9","author":"Q Dai","year":"2008","unstructured":"Dai Q, Wang T. Comparison study on k-word statistical measures for protein: From sequence to\u2019sequence space\u2019. BMC Bioinformatics. 2008; 9(1):394.","journal-title":"BMC Bioinformatics."},{"issue":"1","key":"29_CR11","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1186\/1471-2148-7-41","volume":"7","author":"L Gao","year":"2007","unstructured":"Gao L, Qi J. Whole genome molecular phylogeny of large dsdna viruses using composition vector method. BMC Evol Biol. 2007; 7(1):41.","journal-title":"BMC Evol Biol."},{"issue":"suppl 2","key":"29_CR12","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1093\/nar\/gkh362","volume":"32","author":"J Qi","year":"2004","unstructured":"Qi J, Luo H, Hao B. Cvtree: a phylogenetic tree reconstruction tool based on whole genomes. Nucleic Acids Res. 2004; 32(suppl 2):45\u20137.","journal-title":"Nucleic Acids Res."},{"issue":"5","key":"29_CR13","doi-asserted-by":"publisher","first-page":"656","DOI":"10.1093\/bioinformatics\/bts028","volume":"28","author":"J G\u00f6ke","year":"2012","unstructured":"G\u00f6ke J, Schulz MH, Lasserre J, Vingron M. Estimation of pairwise sequence similarity of mammalian enhancers with word neighbourhood counts. Bioinformatics. 2012; 28(5):656\u201363.","journal-title":"Bioinformatics."},{"issue":"13","key":"29_CR14","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1093\/bioinformatics\/btm211","volume":"23","author":"MR Kantorovitz","year":"2007","unstructured":"Kantorovitz MR, Robinson GE, Sinha S. A statistical method for alignment-free comparison of regulatory sequences. Bioinformatics. 2007; 23(13):249\u201355.","journal-title":"Bioinformatics."},{"issue":"4","key":"29_CR15","doi-asserted-by":"publisher","first-page":"628","DOI":"10.1109\/TCBB.2014.2306830","volume":"11","author":"M Comin","year":"2014","unstructured":"Comin M, Verzotto D. Beyond fixed-resolution alignment-free measures for mammalian enhancers sequence comparison. IEEE\/ACM Trans Comput Biol Bioinformatics. 2014; 11(4):628\u201337.","journal-title":"IEEE\/ACM Trans Comput Biol Bioinformatics."},{"key":"29_CR16","volume-title":"Pattern recognition in Bioinformatics. vol. 7986,","author":"M Comin","year":"2013","unstructured":"Comin M, Antonello M. Fast computation of entropic profiles for the detection of conservation in genomes In: Ngom A, Formenti E, Hao J-K, Zhao X-M, van Laarhoven T, editors. Pattern recognition in Bioinformatics. vol. 7986,Berlin Heidelberg: Springer: 2013. p. 277\u201388."},{"issue":"3","key":"29_CR17","doi-asserted-by":"publisher","first-page":"500","DOI":"10.1109\/TCBB.2013.2297924","volume":"11","author":"M Comin","year":"2014","unstructured":"Comin M, Antonello M. Fast entropic profiler: An information theoretic approach for the discovery of patterns in genomes. Comput Biol Bioinform IEEE\/ACM Trans. 2014; 11(3):500\u20139.","journal-title":"Comput Biol Bioinform IEEE\/ACM Trans."},{"issue":"Suppl 1","key":"29_CR18","doi-asserted-by":"publisher","first-page":"16","DOI":"10.1186\/1471-2105-11-S1-S16","volume":"11","author":"M Comin","year":"2010","unstructured":"Comin M, Verzotto D. Classification of protein sequences by means of irredundant patterns. BMC bioinformatics. 2010; 11(Suppl 1):16.","journal-title":"BMC bioinformatics."},{"issue":"12","key":"29_CR19","doi-asserted-by":"publisher","first-page":"1819","DOI":"10.1089\/cmb.2010.0171","volume":"18","author":"M Comin","year":"2011","unstructured":"Comin M, Verzotto D. The irredundant class method for remote homology detection of protein sequences. J Comput Biol. 2011; 18(12):1819\u201329.","journal-title":"J Comput Biol."},{"issue":"7","key":"29_CR20","doi-asserted-by":"publisher","first-page":"1309","DOI":"10.1101\/gr.089151.108","volume":"19","author":"W Qu","year":"2009","unstructured":"Qu W, Hashimoto S-i, Morishita S. Efficient frequency-based de novo short-read clustering for error trimming in next-generation sequencing. Genome Res. 2009; 19(7):1309\u201315.","journal-title":"Genome Res."},{"issue":"18","key":"29_CR21","doi-asserted-by":"crossref","first-page":"2502","DOI":"10.1093\/bioinformatics\/btr447","volume":"27","author":"E Bao","year":"2011","unstructured":"Bao E, Jiang T, Kaloshian I, Girke T. Seed: efficient clustering of next-generation sequences. Bioinformatics. 2011; 27(18):2502\u20139.","journal-title":"Bioinformatics."},{"issue":"1","key":"29_CR22","doi-asserted-by":"publisher","first-page":"268","DOI":"10.1186\/1471-2105-14-268","volume":"14","author":"A Solovyov","year":"2013","unstructured":"Solovyov A, Lipkin W. Centroid based clustering of high throughput sequencing reads based on n-mer counts. BMC Bioinformatics. 2013; 14(1):268.","journal-title":"BMC Bioinformatics."},{"issue":"11","key":"29_CR23","doi-asserted-by":"publisher","first-page":"1851","DOI":"10.1101\/gr.078212.108","volume":"18","author":"H Li","year":"2008","unstructured":"Li H, Ruan J, Durbin R. Mapping short dna sequencing reads and calling variants using mapping quality scores. Genome Res. 2008; 18(11):1851\u20138.","journal-title":"Genome Res."},{"issue":"6","key":"29_CR24","doi-asserted-by":"publisher","first-page":"961","DOI":"10.1101\/gr.112326.110","volume":"21","author":"CA Albers","year":"2011","unstructured":"Albers CA, Lunter G, MacArthur DG, McVean G, Ouwehand WH, Durbin R. Dindel: accurate indel calls from short-read data. Genome Res. 2011; 21(6):961\u201373.","journal-title":"Genome Res."},{"issue":"1","key":"29_CR25","doi-asserted-by":"publisher","first-page":"375","DOI":"10.1186\/1471-2164-13-375","volume":"13","author":"MO Carneiro","year":"2012","unstructured":"Carneiro MO, Russ C, Ross MG, Gabriel SB, Nusbaum C, DePristo MA. Pacific biosciences sequencing technology for genotyping and variation discovery in human data. BMC Genomics. 2012; 13(1):375.","journal-title":"BMC Genomics."},{"issue":"14","key":"29_CR26","doi-asserted-by":"publisher","first-page":"5155","DOI":"10.1073\/pnas.83.14.5155","volume":"83","author":"BE Blaisdell","year":"1986","unstructured":"Blaisdell BE. A measure of the similarity of sets of sequences not requiring sequence alignment. Proc Natl Acad Sci. 1986; 83(14):5155\u20139.","journal-title":"Proc Natl Acad Sci."},{"issue":"22","key":"29_CR27","doi-asserted-by":"publisher","first-page":"13980","DOI":"10.1073\/pnas.202468099","volume":"99","author":"RA Lippert","year":"2002","unstructured":"Lippert RA, Huang H, Waterman MS. Distributional regimes for the number of k-word matches between two random sequences. Proc Natl Acad Sci. 2002; 99(22):13980\u20139.","journal-title":"Proc Natl Acad Sci."},{"issue":"12","key":"29_CR28","doi-asserted-by":"publisher","first-page":"1615","DOI":"10.1089\/cmb.2009.0198","volume":"16","author":"G Reinert","year":"2009","unstructured":"Reinert G, Chew D, Sun F, Waterman MS. Alignment-free sequence comparison (i): statistics and power. J Comput Biol. 2009; 16(12):1615\u201334.","journal-title":"J Comput Biol."},{"issue":"11","key":"29_CR29","doi-asserted-by":"publisher","first-page":"1467","DOI":"10.1089\/cmb.2010.0056","volume":"17","author":"L Wan","year":"2010","unstructured":"Wan L, Reinert G, Sun F, Waterman MS. Alignment-free sequence comparison (ii): theoretical power of comparison statistics. J Comput Biol. 2010; 17(11):1467\u201390.","journal-title":"J Comput Biol."},{"issue":"3","key":"29_CR30","doi-asserted-by":"publisher","first-page":"186","DOI":"10.1101\/gr.8.3.175","volume":"8","author":"B Ewing","year":"1998","unstructured":"Ewing B, Green P. Base-calling of automated sequencer traces using phred. ii. error probabilities. Genome Res. 1998; 8(3):186\u201394.","journal-title":"Genome Res."},{"key":"29_CR31","unstructured":"NCBI dataset of human mRNA genes. \n                    ftp:\/\/ftp.ncbi.nlm.nih.gov\/refseq\/H_sapiens\/mRNA_Prot\/\n                    \n                  ."},{"key":"29_CR32","unstructured":"Mason. \n                    http:\/\/seqan.de\/projects\/mason.html\n                    \n                  ."},{"key":"29_CR33","unstructured":"Holtgrewe M. Mason\u2013a read simulator for second generation sequencing data. Technical Report FU Berlin. 2010. TR-B-10-06."},{"issue":"1","key":"29_CR34","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1038\/nmeth0111-59","volume":"8","author":"E Birney","year":"2011","unstructured":"Birney E. Assemblies: the good, the bad, the ugly. Nat Methods. 2011; 8(1):59\u201360.","journal-title":"Nat Methods."},{"issue":"5","key":"29_CR35","doi-asserted-by":"publisher","first-page":"821","DOI":"10.1101\/gr.074492.107","volume":"18","author":"DR Zerbino","year":"2008","unstructured":"Zerbino DR, Birney E. Velvet: algorithms for de novo short read assembly using de bruijn graphs. Genome Res. 2008; 18(5):821\u20139.","journal-title":"Genome Res."},{"key":"29_CR36","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-3-662-44753-6_1","volume":"8701","author":"M Comin","year":"2014","unstructured":"Comin M, Leoni A, Schimd M. Qcluster: Extending alignment-free measures with quality values for reads clustering. Algorithms Bioinform Lect Notes Comput Sci. 2014; 8701:1\u201313.","journal-title":"Algorithms Bioinform Lect Notes Comput Sci."}],"container-title":["Algorithms for Molecular Biology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13015-014-0029-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13015-014-0029-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13015-014-0029-x","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13015-014-0029-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,3,26]],"date-time":"2019-03-26T22:42:00Z","timestamp":1553640120000},"score":1,"resource":{"primary":{"URL":"https:\/\/almob.biomedcentral.com\/articles\/10.1186\/s13015-014-0029-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,1,28]]},"references-count":36,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2015,12]]}},"alternative-id":["29"],"URL":"https:\/\/doi.org\/10.1186\/s13015-014-0029-x","relation":{},"ISSN":["1748-7188"],"issn-type":[{"value":"1748-7188","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,1,28]]},"assertion":[{"value":"19 November 2014","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 December 2014","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 January 2015","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"4"}}