{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,16]],"date-time":"2026-03-16T17:10:31Z","timestamp":1773681031309,"version":"3.50.1"},"reference-count":79,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2015,6,1]],"date-time":"2015-06-01T00:00:00Z","timestamp":1433116800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BioData Mining"],"published-print":{"date-parts":[[2015,6]]},"DOI":"10.1186\/s13040-015-0073-1","type":"journal-article","created":{"date-parts":[[2015,12,9]],"date-time":"2015-12-09T11:05:17Z","timestamp":1449659117000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":14,"title":["LAF: Logic Alignment Free and its application to bacterial genomes classification"],"prefix":"10.1186","volume":"8","author":[{"given":"Emanuel","family":"Weitschek","sequence":"first","affiliation":[]},{"given":"Fabio","family":"Cunial","sequence":"additional","affiliation":[]},{"given":"Giovanni","family":"Felici","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,12,8]]},"reference":[{"issue":"3","key":"73_CR1","doi-asserted-by":"crossref","first-page":"635","DOI":"10.1016\/0888-7543(91)90071-L","volume":"11","author":"WR Pearson","year":"1991","unstructured":"Pearson WR. Searching protein sequence libraries: comparison of the sensitivity and selectivity of the smith-waterman and fasta algorithms. Genomics. 1991; 11(3):635\u201350.","journal-title":"Genomics"},{"issue":"3","key":"73_CR2","doi-asserted-by":"crossref","first-page":"443","DOI":"10.1016\/0022-2836(70)90057-4","volume":"48","author":"SB Needleman","year":"1970","unstructured":"Needleman SB, Wunsch CD. A general method applicable to the search for similarities in the amino acid sequence of two proteins. J Mol Biol. 1970; 48(3):443\u201353.","journal-title":"J Mol Biol"},{"key":"73_CR3","doi-asserted-by":"crossref","first-page":"63","DOI":"10.1016\/0076-6879(90)83007-V","volume":"183","author":"WR Pearson","year":"1990","unstructured":"Pearson WR. Rapid and sensitive sequence comparison with fastp and fasta. Methods Enzymol. 1990; 183:63\u201398.","journal-title":"Methods Enzymol"},{"issue":"17","key":"73_CR4","doi-asserted-by":"crossref","first-page":"3389","DOI":"10.1093\/nar\/25.17.3389","volume":"25","author":"SF Altschul","year":"1997","unstructured":"Altschul SF, Madden TL, Schaffer AA, Zhang J, Zhang Z, Miller W, et al.Gapped blast and psi-blast: a new generation of protein database search programs. Nucleic Acids Res. 1997; 25(17):3389\u2013402.","journal-title":"Nucleic Acids Res"},{"issue":"5","key":"73_CR5","doi-asserted-by":"crossref","first-page":"1792","DOI":"10.1093\/nar\/gkh340","volume":"32","author":"RC Edgar","year":"2004","unstructured":"Edgar RC. Muscle: multiple sequence alignment with high accuracy and high throughput. Nucleic Acids Res. 2004; 32(5):1792\u20137.","journal-title":"Nucleic Acids Res"},{"key":"73_CR6","doi-asserted-by":"crossref","first-page":"2.3.1","DOI":"10.1002\/0471250953.bi0203s00","volume":"00","author":"JD Thompson","year":"2002","unstructured":"Thompson JD, Gibson T, Higgins DG. Multiple sequence alignment using clustalw and clustalx. Curr Protocol Bioinformatics. 2002; 00:2.3:2.3.1\u20132.3.22.","journal-title":"Curr Protocol Bioinformatics"},{"key":"73_CR7","volume-title":"DEXA Workshops","author":"A Mokaddem","year":"2013","unstructured":"Mokaddem A, Elloumi M. Motalign: A multiple sequence alignment algorithm based on a new distance and a new score function. In: DEXA Workshops. Los Alamitos, CA, USA: IEEE Computer Society: 2013. p. 81\u20134."},{"issue":"14","key":"73_CR8","doi-asserted-by":"crossref","first-page":"3059","DOI":"10.1093\/nar\/gkf436","volume":"30","author":"K Katoh","year":"2002","unstructured":"Katoh K, Misawa K, Kuma K-i, Miyata T. Mafft: a novel method for rapid multiple sequence alignment based on fast fourier transform. Nucleic Acids Res. 2002; 30(14):3059\u201366.","journal-title":"Nucleic Acids Res"},{"issue":"4","key":"73_CR9","doi-asserted-by":"crossref","first-page":"513","DOI":"10.1093\/bioinformatics\/btg005","volume":"19","author":"S Vinga","year":"2003","unstructured":"Vinga S, Almeida J. Alignment-free sequence comparison-a review. Bioinformatics. 2003; 19(4):513\u201323.","journal-title":"Bioinformatics"},{"issue":"11","key":"73_CR10","doi-asserted-by":"crossref","first-page":"2369","DOI":"10.1093\/nar\/27.11.2369","volume":"27","author":"AL Delcher","year":"1999","unstructured":"Delcher AL, Kasif S, Fleischmann RD, Peterson J, White O, Salzberg SL. Alignment of whole genomes. Nucleic Acids Res. 1999; 27(11):2369\u201376.","journal-title":"Nucleic Acids Res"},{"key":"73_CR11","doi-asserted-by":"crossref","DOI":"10.1007\/978-0-387-49820-1","volume-title":"An Introduction to Kolmogorov Complexity and Its Applications","author":"M Li","year":"2008","unstructured":"Li M, Vitnyi PMB. An Introduction to Kolmogorov Complexity and Its Applications, 3rd ed. New York, USA: Springer; 2008."},{"key":"73_CR12","doi-asserted-by":"crossref","first-page":"6","DOI":"10.1186\/1471-2105-3-6","volume":"3","author":"JS Almeida","year":"2002","unstructured":"Almeida JS, Vinga S. Universal sequence map (usm) of arbitrary discrete sequences. BMC Bioinformatics. 2002; 3:6.","journal-title":"BMC Bioinformatics"},{"key":"73_CR13","volume-title":"Advanced Computational Methods for Biocomputing and Bioimaging","author":"S Vinga","year":"2007","unstructured":"Vinga S. Biological sequence analysis by vector-valued functions: revisiting alignment-free methodologies for DNA and protein classification In: Pham TD, Yan H, Crane DI, editors. Advanced Computational Methods for Biocomputing and Bioimaging. New York: Nova Science Publishers: 2007."},{"issue":"4","key":"73_CR14","doi-asserted-by":"crossref","first-page":"513","DOI":"10.1093\/bioinformatics\/btg005","volume":"19","author":"S Vinga","year":"2003","unstructured":"Vinga S, Almeida J. Alignment-free sequence comparison \u2013 a review. Bioinformatics. 2003; 19(4):513\u201323.","journal-title":"Bioinformatics"},{"key":"73_CR15","doi-asserted-by":"crossref","first-page":"771","DOI":"10.1146\/annurev.genet.38.072902.094318","volume":"38","author":"SD Bentley","year":"2004","unstructured":"Bentley SD, Parkhill J. Comparative genomic structure of prokaryotes. Annu Rev Genet. 2004; 38:771\u201391.","journal-title":"Annu Rev Genet"},{"key":"73_CR16","doi-asserted-by":"crossref","first-page":"864","DOI":"10.1016\/S0021-9258(18)64321-2","volume":"236","author":"J Josse","year":"1961","unstructured":"Josse J, Kaiser A, Kornberg A. Enzymatic synthesis of deoxyribonucleic acid. J Biol Chem. 1961; 236:864\u201375.","journal-title":"J Biol Chem"},{"issue":"3","key":"73_CR17","doi-asserted-by":"crossref","first-page":"449","DOI":"10.1073\/pnas.48.3.449","volume":"48","author":"T Trautner","year":"1962","unstructured":"Trautner T, Swartz M, Kornberg A. Enzymatic synthesis of deoxyribonucleic acid, x. influence of bromouracil substitutions on replication. Proc Natl Acad Sci U S A. 1962; 48(3):449.","journal-title":"Proc Natl Acad Sci U S A."},{"issue":"1","key":"73_CR18","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/S0022-2836(76)80090-3","volume":"108","author":"G Russell","year":"1976","unstructured":"Russell G, Walker P, Elton R, Subak-Sharpe J. Doublet frequency analysis of fractionated vertebrate nuclear DNA. J Mol Biol. 1976; 108(1):1\u201320.","journal-title":"J Mol Biol"},{"issue":"5602","key":"73_CR19","doi-asserted-by":"crossref","first-page":"533","DOI":"10.1038\/266533a0","volume":"266","author":"G Russell","year":"1977","unstructured":"Russell G, Subak-Sharpe J. Similarity of the general designs of protochordates and invertebrates. Nature. 1977; 266(5602):533\u20136.","journal-title":"Nature"},{"issue":"7","key":"73_CR20","doi-asserted-by":"crossref","first-page":"283","DOI":"10.1016\/S0168-9525(00)89076-9","volume":"11","author":"S Karlin","year":"1995","unstructured":"Karlin S, Burge C. Dinucleotide relative abundance extremes: a genomic signature. Trends Genet. 1995; 11(7):283\u201390.","journal-title":"Trends Genet"},{"issue":"19","key":"73_CR21","doi-asserted-by":"crossref","first-page":"10227","DOI":"10.1073\/pnas.94.19.10227","volume":"94","author":"S Karlin","year":"1997","unstructured":"Karlin S, Mr\u00e1zek J. Compositional differences within and between eukaryotic genomes. Proc Natl Acad Sci. 1997; 94(19):10227\u201332.","journal-title":"Proc Natl Acad Sci"},{"issue":"9","key":"73_CR22","doi-asserted-by":"crossref","first-page":"938","DOI":"10.1111\/j.1462-2920.2004.00624.x","volume":"6","author":"H Teeling","year":"2004","unstructured":"Teeling H, Meyerdierks A, Bauer M, Amann R, Gl\u00f6ckner FO. Application of tetranucleotide frequencies for the assignment of genomic fragments. Environ Microbiol. 2004; 6(9):938\u201347.","journal-title":"Environ Microbiol"},{"issue":"1","key":"73_CR23","doi-asserted-by":"crossref","first-page":"546","DOI":"10.1186\/1471-2105-9-546","volume":"9","author":"F Zhou","year":"2008","unstructured":"Zhou F, Olman V, Xu Y. Barcodes for genomes and applications. BMC Bioinformatics. 2008; 9(1):546.","journal-title":"BMC Bioinformatics"},{"issue":"10","key":"73_CR24","doi-asserted-by":"crossref","first-page":"1391","DOI":"10.1093\/oxfordjournals.molbev.a026048","volume":"16","author":"PJ Deschavanne","year":"1999","unstructured":"Deschavanne PJ, Giron A, Vilain J, Fagot G, Fertil B. Genomic signature: characterization and classification of species assessed by chaos game representation of sequences. Mol Biol Evol. 1999; 16(10):1391\u20139.","journal-title":"Mol Biol Evol"},{"issue":"8","key":"73_CR25","doi-asserted-by":"crossref","first-page":"1404","DOI":"10.1101\/gr.186401","volume":"11","author":"R Sandberg","year":"2001","unstructured":"Sandberg R, Winberg G, Br\u00e4nden CI, Kaske A, Ernberg I, C\u00f6ster J. Capturing whole-genome characteristics in short sequences using a naive bayesian classifier. Genome Res. 2001; 11(8):1404\u20139.","journal-title":"Genome Res"},{"issue":"2","key":"73_CR26","doi-asserted-by":"crossref","first-page":"145","DOI":"10.1101\/gr.335003","volume":"13","author":"DT Pride","year":"2003","unstructured":"Pride DT, Meinersmann RJ, Wassenaar TM, Blaser MJ. Evolutionary implications of microbial genome tetranucleotide frequency biases. Genome Res. 2003; 13(2):145\u201358.","journal-title":"Genome Res"},{"key":"73_CR27","first-page":"211","volume":"3","author":"D Gatherer","year":"2007","unstructured":"Gatherer D. Genome signatures, self-organizing maps and higher order phylogenies: A parametric analysis. Evol Bioinformatics Online. 2007; 3:211.","journal-title":"Evol Bioinformatics Online"},{"issue":"6","key":"73_CR28","doi-asserted-by":"crossref","first-page":"525","DOI":"10.1016\/j.ygeno.2009.01.009","volume":"93","author":"M Takahashi","year":"2009","unstructured":"Takahashi M, Kryukov K, Saitou N. Estimation of bacterial species phylogeny through oligonucleotide frequency distances. Genomics. 2009; 93(6):525\u201333.","journal-title":"Genomics"},{"issue":"1","key":"73_CR29","doi-asserted-by":"crossref","first-page":"163","DOI":"10.1186\/1471-2105-5-163","volume":"5","author":"H Teeling","year":"2004","unstructured":"Teeling H, Waldmann J, Lombardot T, Bauer M, Glockner FO. Tetra: a web-service and a stand-alone program for the analysis and comparison of tetranucleotide usage patterns in dna sequences. BMC Bioinformatics. 2004; 5(1):163.","journal-title":"BMC Bioinformatics"},{"issue":"2","key":"73_CR30","doi-asserted-by":"crossref","first-page":"264","DOI":"10.1002\/(SICI)1097-0134(19991101)37:2<264::AID-PROT11>3.0.CO;2-C","volume":"37","author":"I Rigoutsos","year":"1999","unstructured":"Rigoutsos I, Floratos A, Ouzounis C, Gao Y, Parida L. Dictionary building via unsupervised hierarchical motif discovery in the sequence space of natural proteins. Proteins. 1999; 37(2):264\u201377.","journal-title":"Proteins"},{"issue":"10","key":"73_CR31","doi-asserted-by":"crossref","first-page":"108","DOI":"10.1186\/gb-2009-10-10-r108","volume":"10","author":"B Chor","year":"2009","unstructured":"Chor B, Horn D, Goldman N, Levy Y, Massingham T. Genomic DNA k-mer spectra: models and modalities. Genome Biol. 2009; 10(10):108.","journal-title":"Genome Biol"},{"issue":"4","key":"73_CR32","doi-asserted-by":"crossref","first-page":"292","DOI":"10.1016\/j.compbiolchem.2006.05.001","volume":"30","author":"H O\u011ful","year":"2006","unstructured":"O\u011ful H, Mumcuo\u011flu E\u00dc. Svm-based detection of distant protein structural relationships using pairwise probabilistic suffix trees. Comput Biol Chem. 2006; 30(4):292\u20139.","journal-title":"Comput Biol Chem"},{"issue":"12","key":"73_CR33","doi-asserted-by":"crossref","first-page":"3899","DOI":"10.1128\/jb.179.12.3899-3913.1997","volume":"179","author":"S Karlin","year":"1997","unstructured":"Karlin S, Mrazek J, Campbell AM. Compositional biases of bacterial genomes and evolutionary implications. J Bacteriol. 1997; 179(12):3899\u2013913.","journal-title":"J Bacteriol"},{"issue":"12","key":"73_CR34","doi-asserted-by":"crossref","first-page":"1208","DOI":"10.1038\/sj.embor.7400538","volume":"6","author":"KU Foerstner","year":"2005","unstructured":"Foerstner KU, von Mering C, Hooper SD, Bork P. Environments shape the nucleotide composition of genomes. EMBO Rep. 2005; 6(12):1208\u201313.","journal-title":"EMBO Rep"},{"issue":"1","key":"73_CR35","doi-asserted-by":"crossref","first-page":"63","DOI":"10.1038\/nmeth976","volume":"4","author":"AC McHardy","year":"2007","unstructured":"McHardy AC, Mart\u00edn HG, Tsirigos A, Hugenholtz P, Rigoutsos I. Accurate phylogenetic classification of variable-length DNA fragments. Nat Methods. 2007; 4(1):63\u201372.","journal-title":"Nat Methods"},{"key":"73_CR36","volume-title":"Research in Computational Molecular Biology","author":"S Chatterji","year":"2008","unstructured":"Chatterji S, Yamazaki I, Bai Z, Eisen JA. Compostbin: A dna composition-based algorithm for binning environmental shotgun reads. In: Research in Computational Molecular Biology. Berlin: Springer: 2008. p. 17\u201328."},{"issue":"11","key":"73_CR37","doi-asserted-by":"crossref","first-page":"1489","DOI":"10.1093\/bioinformatics\/btr186","volume":"27","author":"HC Leung","year":"2011","unstructured":"Leung HC, Yiu S, Yang B, Peng Y, Wang Y, Liu Z, et al.A robust and accurate binning algorithm for metagenomic sequences with arbitrary species abundance ratio. Bioinformatics. 2011; 27(11):1489\u201395.","journal-title":"Bioinformatics"},{"issue":"2","key":"73_CR38","doi-asserted-by":"crossref","first-page":"241","DOI":"10.1089\/cmb.2011.0276","volume":"19","author":"Y Wang","year":"2012","unstructured":"Wang Y, Leung HC, Yiu S, Chin FY. Metacluster 4.0: a novel binning algorithm for ngs reads and huge number of species. J Comput Biol. 2012; 19(2):241\u20139.","journal-title":"J Comput Biol"},{"key":"73_CR39","volume-title":"Algorithms in Bioinformatics","author":"O Tanaseichuk","year":"2011","unstructured":"Tanaseichuk O, Borneman J, Jiang T. Separating metagenomic short reads into genomes via clustering. In: Algorithms in Bioinformatics. New York, NY, USA: Springer: 2011. p. 298\u2013313."},{"key":"73_CR40","volume-title":"Research in Computational Molecular Biology","author":"K Song","year":"2012","unstructured":"Song K, Ren J, Zhai Z, Liu X, Deng M, Sun F. Alignment-free sequence comparison based on next generation sequencing reads. In: Research in Computational Molecular Biology. Berlin: Springer: 2012. p. 272\u201385."},{"issue":"1","key":"73_CR41","doi-asserted-by":"crossref","first-page":"100","DOI":"10.1093\/bioinformatics\/18.1.100","volume":"18","author":"GW Stuart","year":"2002","unstructured":"Stuart GW, Moffett K, Baker S. Integrated gene and species phylogenies from unaligned whole genome protein sequences. Bioinformatics. 2002; 18(1):100\u20138.","journal-title":"Bioinformatics"},{"issue":"4","key":"73_CR42","doi-asserted-by":"crossref","first-page":"554","DOI":"10.1093\/oxfordjournals.molbev.a004111","volume":"19","author":"GW Stuart","year":"2002","unstructured":"Stuart GW, Moffett K, Leader JJ. A comprehensive vertebrate phylogeny using vector representations of protein sequences from whole genomes. Mol Biol Evol. 2002; 19(4):554\u201362.","journal-title":"Mol Biol Evol"},{"key":"73_CR43","volume-title":"Database and Expert Systems Applications (DEXA), 2012 23rd International Workshop On","author":"M Comin","year":"2012","unstructured":"Comin M, Verzotto D. Whole-genome phylogeny by virtue of unic subwords. In: Database and Expert Systems Applications (DEXA), 2012 23rd International Workshop On. Los Alamitos, CA, USA: IEEE Computer Society: 2012. p. 190\u20134."},{"issue":"Suppl. 14","key":"73_CR44","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1186\/1471-2105-10-S14-S9","volume":"10","author":"P Kuksa","year":"2009","unstructured":"Kuksa P, Pavlovic V. Efficient alignment-free DNA barcode analytics. BMC Bioinformatics. 2009; 10(Suppl. 14):9.","journal-title":"BMC Bioinformatics"},{"issue":"1","key":"73_CR45","first-page":"17","volume":"9","author":"VV Solovyev","year":"1993","unstructured":"Solovyev VV, Makarova KS. A novel method of protein sequence classification based on oligopeptide frequency analysis and its application to search for functional sites and to domain localization. Comput Appl Biosci: CABIOS. 1993; 9(1):17\u201324.","journal-title":"Comput Appl Biosci: CABIOS"},{"key":"73_CR46","doi-asserted-by":"crossref","first-page":"355","DOI":"10.1111\/j.1471-8286.2007.01678.x","volume":"7","author":"S Ratnasingham","year":"2007","unstructured":"Ratnasingham S, Hebert PDN. BOLD: the barcode of life data system. Mol Ecol Notes. 2007; 7:355\u201364.","journal-title":"Mol Ecol Notes"},{"issue":"Suppl 2","key":"73_CR47","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1186\/1471-2164-12-S2-S4","volume":"12","author":"B Liu","year":"2011","unstructured":"Liu B, Gibbons T, Ghodsi M, Treangen T, Pop M. Accurate and fast estimation of taxonomic profiles from metagenomic shotgun sequences. BMC Genomics. 2011; 12(Suppl 2):4.","journal-title":"BMC Genomics"},{"issue":"8","key":"73_CR48","doi-asserted-by":"crossref","first-page":"811","DOI":"10.1038\/nmeth.2066","volume":"9","author":"N Segata","year":"2012","unstructured":"Segata N, Waldron L, Ballarini A, Narasimhan V, Jousson O, Huttenhower C. Metagenomic microbial community profiling using unique clade-specific marker genes. Nat Methods. 2012; 9(8):811\u20134.","journal-title":"Nat Methods"},{"issue":"24","key":"73_CR49","doi-asserted-by":"crossref","first-page":"3316","DOI":"10.1093\/bioinformatics\/bts599","volume":"28","author":"RA Edwards","year":"2012","unstructured":"Edwards RA, Olson R, Disz T, Pusch GD, Vonstein V, Stevens R, et al.Real time metagenomics: Using k-mers to annotate metagenomes. Bioinformatics. 2012; 28(24):3316\u201317.","journal-title":"Bioinformatics"},{"issue":"17","key":"73_CR50","doi-asserted-by":"crossref","first-page":"2471","DOI":"10.1093\/bioinformatics\/btu340","volume":"30","author":"S Seth","year":"2014","unstructured":"Seth S, V\u00e4lim\u00e4ki N, Kaski S, Honkela A. Exploration and retrieval of whole-metagenome sequencing samples. Bioinformatics. 2014; 30(17):2471\u20139.","journal-title":"Bioinformatics"},{"key":"73_CR51","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1186\/1756-0381-7-4","volume":"7","author":"E Weitschek","year":"2014","unstructured":"Weitschek E, Fiscon G, Felici G. Supervised dna barcodes species classification: analysis, comparisons and results. BioData Mining. 2014; 7:4.","journal-title":"BioData Mining"},{"issue":"1","key":"73_CR52","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1186\/1756-0381-4-4","volume":"4","author":"T Lehr","year":"2011","unstructured":"Lehr T, Yuan J, Zeumer D, Jayadev S, Ritchie M. Rule based classifier for the analysis of gene-gene and gene-environment interactions in genetic association studies. BioData Mining. 2011; 4(1):4. doi: http:\/\/dx.doi.org\/10.1186\/1756-0381-4-4 .","journal-title":"BioData Mining"},{"issue":"2","key":"73_CR53","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1016\/j.ygeno.2014.07.004","volume":"104","author":"D Polychronopoulos","year":"2014","unstructured":"Polychronopoulos D, Weitschek E, Dimitrieva S, Bucher P, Felici G, Almirantis Y. Classification of selectively constrained dna elements using feature vectors and rule-based classifiers. Genomics. 2014; 104(2):79\u201386.","journal-title":"Genomics"},{"key":"73_CR54","volume-title":"AAAI\/IAAI","author":"D Kudenko","year":"1998","unstructured":"Kudenko D, Hirsh H. Feature generation for sequence categorization. In: AAAI\/IAAI. Cambridge, USA: The MIT Press: 1998. p. 733\u20138."},{"issue":"suppl 1","key":"73_CR55","doi-asserted-by":"crossref","first-page":"26","DOI":"10.1093\/bioinformatics\/btg1002","volume":"19","author":"A Ben-Hur","year":"2003","unstructured":"Ben-Hur A, Brutlag D. Remote homology detection: a motif based approach. Bioinformatics. 2003; 19(suppl 1):26\u201333.","journal-title":"Bioinformatics"},{"issue":"1","key":"73_CR56","doi-asserted-by":"crossref","first-page":"40","DOI":"10.1145\/1882471.1882478","volume":"12","author":"Z Xing","year":"2010","unstructured":"Xing Z, Pei J, Keogh E. A brief survey on sequence classification. ACM SIGKDD Explorations Newslett. 2010; 12(1):40\u20138.","journal-title":"ACM SIGKDD Explorations Newslett"},{"key":"73_CR57","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1186\/1471-2105-10-S14-S9","volume":"10 Suppl 14","author":"P Kuksa","year":"2009","unstructured":"Kuksa P, Pavlovic V. Efficient alignment-free dna barcode analytics. BMC Bioinformatics. 2009; 10 Suppl 14:9. doi: http:\/\/dx.doi.org\/10.1186\/1471-2105-10-S14-S9 .","journal-title":"BMC Bioinformatics"},{"key":"73_CR58","volume-title":"Statistical Learning Theory","author":"VN Vapnik","year":"1998","unstructured":"Vapnik VN, Vapnik V. Statistical Learning Theory. New York, NY, USA: Wiley; 1998."},{"issue":"S-14","key":"73_CR59","doi-asserted-by":"crossref","first-page":"7","DOI":"10.1186\/1471-2105-10-S14-S7","volume":"10","author":"P Bertolazzi","year":"2009","unstructured":"Bertolazzi P, Felici G, Weitschek E. Learning to classify species with barcodes. BMC Bioinformatics. 2009; 10(S-14):7.","journal-title":"BMC Bioinformatics"},{"issue":"9","key":"73_CR60","first-page":"1","volume":"58","author":"E Weitschek","year":"2012","unstructured":"Weitschek E, Lo Presti A, Drovandi G, Felici G, Ciccozzi M, Ciotti M, et al.Human polyomaviruses identification by logic mining techniques. BMC Virol J. 2012; 58(9):1\u20136.","journal-title":"BMC Virol J."},{"issue":"3","key":"73_CR61","doi-asserted-by":"crossref","first-page":"211","DOI":"10.1007\/BF00962234","volume":"5","author":"BR Gaines","year":"1995","unstructured":"Gaines BR, Compton P. Induction of ripple-down rules applied to modeling large databases. J Intell Inf Syst. 1995; 5(3):211\u201328.","journal-title":"J Intell Inf Syst."},{"key":"73_CR62","volume-title":"Proc. of the 15th Int. Conference on Machine Learning","author":"E Frank","year":"1998","unstructured":"Frank E, Witten IH. Generating accurate rule sets without global optimization. In: Proc. of the 15th Int. Conference on Machine Learning. San Francisco, CA, USA: Morgan Kaufmann: 1998."},{"key":"73_CR63","volume-title":"Proceedings of the Twelfth International Conference on Machine Learning","author":"WW Cohen","year":"1995","unstructured":"Cohen WW. Fast effective rule induction. In: Proceedings of the Twelfth International Conference on Machine Learning. San Francisco, CA, USA: Morgan Kaufmann: 1995. p. 115\u201323."},{"issue":"3","key":"73_CR64","first-page":"1","volume":"13","author":"G Felici","year":"2002","unstructured":"Felici G, Truemper K. A minsat approach for learning in logic domains. INFORMS J Comput. 2002; 13(3):1\u201317.","journal-title":"INFORMS J Comput"},{"issue":"S14","key":"73_CR65","doi-asserted-by":"crossref","first-page":"7","DOI":"10.1186\/1471-2105-10-S14-S7","volume":"10","author":"P Bertolazzi","year":"2009","unstructured":"Bertolazzi P, Felici G, Weitschek E. Learning to classify species with barcodes. BMC Bioinformatics. 2009; 10(S14):7.","journal-title":"BMC Bioinformatics"},{"key":"73_CR66","doi-asserted-by":"crossref","first-page":"77","DOI":"10.1613\/jair.279","volume":"4","author":"JR Quinlan","year":"1996","unstructured":"Quinlan JR. Improved use of continuous attributes in C4.5. J Artif Intell Res. 1996; 4:77\u201390.","journal-title":"J Artif Intell Res"},{"issue":"1","key":"73_CR67","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1145\/1656274.1656278","volume":"11","author":"M Hall","year":"2009","unstructured":"Hall M, Frank E, Holmes G, Pfahringer B, Reutemann P, Witten IH. The weka data mining software: an update. SIGKDD Explor Newsl. 2009; 11(1):10\u201318. doi: http:\/\/dx.doi.org\/10.1145\/1656274.1656278 .","journal-title":"SIGKDD Explor Newsl"},{"issue":"6","key":"73_CR68","doi-asserted-by":"crossref","first-page":"764","DOI":"10.1093\/bioinformatics\/btr011","volume":"27","author":"G Marcais","year":"2011","unstructured":"Marcais G, Kingsford C. A fast, lock-free approach for efficient parallel counting of occurrences of k-mers. Bioinformatics. 2011; 27(6):764\u201370. doi: http:\/\/dx.doi.org\/10.1093\/bioinformatics\/btr011 .","journal-title":"Bioinformatics"},{"key":"73_CR69","unstructured":"An Introduction to Support Vector Machines and Other Kernel-based Learning Methods. Cambridge, UK: Cambridge University Press."},{"key":"73_CR70","volume-title":"Nearest Neighbor NN Norms: NN Pattern Classification Techniques","author":"BV Dasarathy","year":"1991","unstructured":"Dasarathy BV. Nearest Neighbor NN Norms: NN Pattern Classification Techniques. Los Alamitos, CA, USA: IEEE Computer Society Press; 1991."},{"issue":"9","key":"73_CR71","doi-asserted-by":"crossref","first-page":"938","DOI":"10.1111\/j.1462-2920.2004.00624.x","volume":"6","author":"H Teeling","year":"2004","unstructured":"Teeling H, Meyerdiekers A, Bauer M, Glockner FO. Application of tetranucleotide frequencies for the assignment of genomic fragments. Environ Microbiol. 2004; 6(9):938\u201347.","journal-title":"Environ Microbiol"},{"key":"73_CR72","doi-asserted-by":"crossref","first-page":"145","DOI":"10.1101\/gr.335003","volume":"13","author":"DT Pride","year":"2003","unstructured":"Pride DT, Meinersmann RJ, Wassenaar TM, Blaser MJ. Evolutionary implications of microbial genome tetranucleotide frequency biases. Genome Res. 2003; 13:145\u201358.","journal-title":"Genome Res"},{"key":"73_CR73","doi-asserted-by":"crossref","first-page":"163","DOI":"10.1186\/1471-2105-5-163","volume":"5","author":"H Teeling","year":"2004","unstructured":"Teeling H, Waldmann J, Lombardot T, Bauer M, Glockner FO. Tetra: a web-service and a stand-alone program for the analysis and comparison of tetranucleotide usage patterns in dna sequences. BMC Bioinformatics. 2004; 5:163.","journal-title":"BMC Bioinformatics"},{"issue":"1","key":"73_CR74","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1109\/TCBB.2011.45","volume":"9","author":"RH Chan","year":"2012","unstructured":"Chan RH, Chan TH, Yeung HM, Wang RW. Composition vector method based on maximum entropy principle for sequence comparison. Comput Biol Bioinform IEEE\/ACM Trans. 2012; 9(1):79\u201387.","journal-title":"Comput Biol Bioinform IEEE\/ACM Trans"},{"issue":"1","key":"73_CR75","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s00239-003-2493-7","volume":"58","author":"J Qi","year":"2004","unstructured":"Qi J, Wang B, Hao BI. Whole proteome prokaryote phylogeny without sequence alignment: a k-string composition approach. J Mol Evol. 2004; 58(1):1\u201311.","journal-title":"J Mol Evol"},{"issue":"4","key":"73_CR76","doi-asserted-by":"crossref","first-page":"538","DOI":"10.1007\/s00239-004-0255-9","volume":"60","author":"ZG Yu","year":"2005","unstructured":"Yu ZG, Zhou LQ, Anh VV, Chu KH, Long SC, Deng JQ. Phylogeny of prokaryotes and chloroplasts revealed by a simple composition approach on all protein sequences from complete genomes without sequence alignment. J Mol Evol. 2005; 60(4):538\u201345.","journal-title":"J Mol Evol"},{"issue":"3","key":"73_CR77","doi-asserted-by":"crossref","first-page":"343","DOI":"10.1093\/bib\/bbt067","volume":"15","author":"K Song","year":"2014","unstructured":"Song K, Ren J, Reinert G, Deng M, Waterman MS, Sun F. New developments of alignment-free sequence comparison: measures, statistics and next-generation sequencing. Brief Bioinform. 2014; 15(3):343\u201353.","journal-title":"Brief Bioinform"},{"key":"73_CR78","unstructured":"Blast Package Version 2.2.25-7. http:\/\/packages.ubuntu.com\/precise\/ncbi-blast+ . Accessed Dec 2015."},{"key":"73_CR79","doi-asserted-by":"crossref","first-page":"617","DOI":"10.1093\/nar\/gkt1078","volume":"42","author":"K Huang","year":"2014","unstructured":"Huang K, Brady A, Mahurkar A, White O, Gevers D, Huttenhower C, et al.Metaref: a pan-genomic database for comparative and community microbial genomics. Nucleic Acids Res. 2014; 42:617\u201324.","journal-title":"Nucleic Acids Res."}],"container-title":["BioData Mining"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-015-0073-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13040-015-0073-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13040-015-0073-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,28]],"date-time":"2022-05-28T18:07:19Z","timestamp":1653761239000},"score":1,"resource":{"primary":{"URL":"http:\/\/biodatamining.biomedcentral.com\/articles\/10.1186\/s13040-015-0073-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,6]]},"references-count":79,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2015,6]]}},"alternative-id":["73"],"URL":"https:\/\/doi.org\/10.1186\/s13040-015-0073-1","relation":{},"ISSN":["1756-0381"],"issn-type":[{"value":"1756-0381","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,6]]},"article-number":"39"}}