{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,24]],"date-time":"2025-06-24T17:40:06Z","timestamp":1750786806980,"version":"3.41.0"},"reference-count":79,"publisher":"Springer Science and Business Media LLC","issue":"1","funder":[{"DOI":"10.13039\/501100001871","name":"Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","doi-asserted-by":"publisher","award":["SFRH\/BPD\/92978\/2013","PEst-C\/MAR\/LA0015\/2013 and PTDC\/AAG-GLO\/6887\/2014 (POCI-01-0124-FEDER-016845)"],"award-info":[{"award-number":["SFRH\/BPD\/92978\/2013","PEst-C\/MAR\/LA0015\/2013 and PTDC\/AAG-GLO\/6887\/2014 (POCI-01-0124-FEDER-016845)"]}],"id":[{"id":"10.13039\/501100001871","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["BMC Bioinformatics"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1186\/s12859-017-1758-x","type":"journal-article","created":{"date-parts":[[2017,7,21]],"date-time":"2017-07-21T12:31:53Z","timestamp":1500640313000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["Exploring general-purpose protein features for distinguishing enzymes and non-enzymes within the twilight zone"],"prefix":"10.1186","volume":"18","author":[{"given":"Yasser B.","family":"Ruiz-Blanco","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9908-2418","authenticated-orcid":false,"given":"Guillermin","family":"Ag\u00fcero-Chapin","sequence":"additional","affiliation":[]},{"given":"Enrique","family":"Garc\u00eda-Hern\u00e1ndez","sequence":"additional","affiliation":[]},{"given":"Orlando","family":"\u00c1lvarez","sequence":"additional","affiliation":[]},{"given":"Agostinho","family":"Antunes","sequence":"additional","affiliation":[]},{"given":"James","family":"Green","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,7,21]]},"reference":[{"key":"1758_CR1","doi-asserted-by":"crossref","unstructured":"Pundir S, Martin MJ, O'Donovan C. UniProt Protein Knowledgebase. Methods Mol Biol. 2017;1558:41\u201355.","DOI":"10.1007\/978-1-4939-6783-4_2"},{"key":"1758_CR2","doi-asserted-by":"crossref","unstructured":"Sheynkman GM, Shortreed MR, Cesnik AJ, Smith LM. Proteogenomics: Integrating Next-Generation Sequencing and Mass Spectrometry to Characterize Human Proteomic Variation. Annu Rev Anal Chem. 2016;9(1):521\u201345.","DOI":"10.1146\/annurev-anchem-071015-041722"},{"issue":"1","key":"1758_CR3","doi-asserted-by":"crossref","first-page":"6","DOI":"10.1093\/bib\/6.1.6","volume":"6","author":"S Batzoglou","year":"2005","unstructured":"Batzoglou S. The many faces of sequence alignment. Brief Bioinform. 2005;6(1):6\u201322.","journal-title":"Brief Bioinform"},{"issue":"12","key":"1758_CR4","doi-asserted-by":"crossref","first-page":"980","DOI":"10.1038\/nsb1203-980","volume":"10","author":"HM Berman","year":"2003","unstructured":"Berman HM, Henrick K, Nakamura H. Announcing the worldwide protein data Bank. Nat Struct Mol Biol. 2003;10(12):980.","journal-title":"Nat Struct Mol Biol"},{"issue":"Database issue","key":"1758_CR5","first-page":"D419","volume":"36","author":"A Andreeva","year":"2008","unstructured":"Andreeva A, Howorth D, Chandonia JM, Brenner SE, Hubbard TJ, Chothia C, Murzin AG. Data growth and its impact on the SCOP database: new developments. Nucleic Acids Res. 2008;36(Database issue):D419\u201325.","journal-title":"Nucleic Acids Res"},{"issue":"Database issue","key":"1758_CR6","doi-asserted-by":"crossref","first-page":"D376","DOI":"10.1093\/nar\/gku947","volume":"43","author":"I Sillitoe","year":"2015","unstructured":"Sillitoe I, Lewis TE, Cuff A, Das S, Ashford P, Dawson NL, Furnham N, Laskowski RA, Lee D, Lees JG, et al. CATH: comprehensive structural and functional annotations for genome sequences. Nucleic Acids Res. 2015;43(Database issue):D376\u201381.","journal-title":"Nucleic Acids Res"},{"key":"1758_CR7","first-page":"1-3","volume":"3.1","author":"WR Pearson","year":"2013","unstructured":"Pearson WR. An introduction to sequence similarity (\u201chomology\u201d) searching. Curr Protoc Bioinformatics. 2013;3.1:1-3\u20131. 8.","journal-title":"Curr Protoc Bioinformatics"},{"issue":"1","key":"1758_CR8","doi-asserted-by":"crossref","first-page":"195","DOI":"10.1016\/0022-2836(81)90087-5","volume":"147","author":"TF Smith","year":"1981","unstructured":"Smith TF, Waterman MS. Identification of common molecular subsequences. J Mol Biol. 1981;147(1):195\u20137.","journal-title":"J Mol Biol"},{"key":"1758_CR9","doi-asserted-by":"crossref","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","volume":"215","author":"SF Altschul","year":"1990","unstructured":"Altschul SF, Gish W, Miller W, Myers EW, Lipman DJ. Basic local alignment search tool. J Mol Biol. 1990;215:403\u201310.","journal-title":"J Mol Biol"},{"issue":"9","key":"1758_CR10","doi-asserted-by":"crossref","first-page":"755","DOI":"10.1093\/bioinformatics\/14.9.755","volume":"14","author":"SR Eddy","year":"1998","unstructured":"Eddy SR. Profile hidden Markov models. Bioinformatics. 1998;14(9):755\u201363.","journal-title":"Bioinformatics"},{"issue":"1","key":"1758_CR11","doi-asserted-by":"crossref","first-page":"276","DOI":"10.1093\/nar\/30.1.276","volume":"30","author":"A Bateman","year":"2002","unstructured":"Bateman A, Birney E, Cerruti L, Durbin R, Etwiller L, Eddy SR, Griffiths-Jones S, Howe KL, Marshall M, Sonnhammer ELL. The Pfam protein families database. Nucleic Acids Res. 2002;30(1):276\u201380.","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"1758_CR12","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/1471-2105-12-376","volume":"12","author":"S Quester","year":"2011","unstructured":"Quester S, Schomburg D. EnzymeDetector: an integrated enzyme function prediction tool and database. BMC bioinformatics. 2011;12(1):1.","journal-title":"BMC bioinformatics"},{"issue":"2","key":"1758_CR13","doi-asserted-by":"crossref","first-page":"85","DOI":"10.1093\/protein\/12.2.85","volume":"12","author":"B Rost","year":"1999","unstructured":"Rost B. Twilight zone of protein sequence alignments. Protein Eng. 1999;12(2):85\u201394.","journal-title":"Protein Eng"},{"key":"1758_CR14","doi-asserted-by":"crossref","first-page":"595","DOI":"10.1016\/S0022-2836(02)00016-5","volume":"318","author":"B Rost","year":"2002","unstructured":"Rost B. Enzyme function less conserved than anticipated. J Mol Biol. 2002;318:595\u2013608.","journal-title":"J Mol Biol"},{"issue":"5","key":"1758_CR15","doi-asserted-by":"crossref","first-page":"602","DOI":"10.1016\/j.ygeno.2007.01.008","volume":"89","author":"PK Strope","year":"2007","unstructured":"Strope PK, Moriyama EN. Simple alignment-free methods for protein classification: a case study from G-protein-coupled receptors. Genomics. 2007;89(5):602\u201312.","journal-title":"Genomics"},{"key":"1758_CR16","doi-asserted-by":"crossref","unstructured":"Deshmukh S, Khaitan S, Das D, Gupta M, Wangikar PP. An alignment-free method for classification of protein sequences. Protein Pept Lett. 2007;14(7):647\u201357.","DOI":"10.2174\/092986607781483804"},{"issue":"2","key":"1758_CR17","doi-asserted-by":"crossref","first-page":"121","DOI":"10.3233\/ISB-00350","volume":"8","author":"M Kumar","year":"2008","unstructured":"Kumar M, Thakur V, Raghava GP. COPid: composition based protein identification. In Silico Biol. 2008;8(2):121\u20138.","journal-title":"In Silico Biol"},{"issue":"3","key":"1758_CR18","doi-asserted-by":"crossref","first-page":"246","DOI":"10.1002\/prot.1035","volume":"43","author":"KC Chou","year":"2001","unstructured":"Chou KC. Prediction of protein cellular attributes using pseudo-amino acid composition. Proteins. 2001;43(3):246\u201355.","journal-title":"Proteins"},{"issue":"4","key":"1758_CR19","doi-asserted-by":"crossref","first-page":"1236","DOI":"10.1016\/j.bbrc.2004.06.073","volume":"320","author":"KC Chou","year":"2004","unstructured":"Chou KC, Cai YD. Prediction of protein subcellular locations by GO-FunD-PseAA predictor. Biochem Biophys Res Commun. 2004;320(4):1236\u20139.","journal-title":"Biochem Biophys Res Commun"},{"issue":"2","key":"1758_CR20","doi-asserted-by":"crossref","first-page":"395","DOI":"10.1016\/j.jtbi.2005.05.035","volume":"238","author":"YD Cai","year":"2006","unstructured":"Cai YD, Chou KC. Predicting membrane protein type by functional domain composition and pseudo-amino acid composition. J Theor Biol. 2006;238(2):395\u2013400.","journal-title":"J Theor Biol"},{"issue":"2","key":"1758_CR21","doi-asserted-by":"crossref","first-page":"282","DOI":"10.1002\/prot.10500","volume":"53","author":"KC Chou","year":"2003","unstructured":"Chou KC, Cai YD. Predicting protein quaternary structure by pseudo amino acid composition. Proteins. 2003;53(2):282\u20139.","journal-title":"Proteins"},{"issue":"2","key":"1758_CR22","doi-asserted-by":"crossref","first-page":"506","DOI":"10.1016\/j.bbrc.2004.10.058","volume":"325","author":"KC Chou","year":"2004","unstructured":"Chou KC, Cai YD. Using GO-PseAA predictor to predict enzyme sub-class. Biochem Biophys Res Commun. 2004;325(2):506\u20139.","journal-title":"Biochem Biophys Res Commun"},{"issue":"1","key":"1758_CR23","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1093\/bioinformatics\/bth466","volume":"21","author":"KC Chou","year":"2005","unstructured":"Chou KC. Using amphiphilic pseudo amino acid composition to predict enzyme subfamily classes. Bioinformatics. 2005;21(1):10\u20139.","journal-title":"Bioinformatics"},{"issue":"1","key":"1758_CR24","doi-asserted-by":"crossref","first-page":"53","DOI":"10.1016\/j.bbrc.2007.09.098","volume":"364","author":"HB Shen","year":"2007","unstructured":"Shen HB, Chou KC. EzyPred: a top-down approach for predicting enzyme functional classes and subclasses. Biochem Biophys Res Commun. 2007;364(1):53\u20139.","journal-title":"Biochem Biophys Res Commun"},{"issue":"3","key":"1758_CR25","doi-asserted-by":"crossref","first-page":"1255","DOI":"10.1021\/ci050507z","volume":"46","author":"J Caballero","year":"2006","unstructured":"Caballero J, Fernandez L, Abreu JI, Fernandez M. Amino acid sequence autocorrelation vectors and ensembles of Bayesian-regularized genetic neural networks for prediction of conformational stability of human lysozyme mutants. J Chem Inf Model. 2006;46(3):1255\u201368.","journal-title":"J Chem Inf Model"},{"key":"1758_CR26","first-page":"359","volume":"4","author":"G Moreau","year":"1980","unstructured":"Moreau G, Broto P. The autocorrelation of a topological structure. A new molecular descriptor. Nouv J Chim. 1980;4:359\u201360.","journal-title":"Nouv J Chim"},{"issue":"Web Server","key":"1758_CR27","first-page":"W385","volume":"39","author":"HB Rao","year":"2011","unstructured":"Rao HB, Zhu F, Yang GB, Li ZR, Chen YZ. Update of PROFEAT: a web server for computing structural and physicochemical features of proteins and peptides from amino acid sequence. Nucleic Acids Res. 2011;39(Web Server):W385\u201390.","journal-title":"Nucleic Acids Res"},{"issue":"4","key":"1758_CR28","doi-asserted-by":"crossref","first-page":"750","DOI":"10.1002\/pmic.200700638","volume":"8","author":"H Gonzalez-Diaz","year":"2008","unstructured":"Gonzalez-Diaz H, Gonzalez-Diaz Y, Santana L, Ubeira FM, Uriarte E. Proteomics, networks and connectivity indices. Proteomics. 2008;8(4):750\u201378.","journal-title":"Proteomics"},{"issue":"2","key":"1758_CR29","doi-asserted-by":"crossref","first-page":"431","DOI":"10.1007\/s00726-010-0653-9","volume":"40","author":"G Aguero-Chapin","year":"2011","unstructured":"Aguero-Chapin G, Perez-Machado G, Molina-Ruiz R, Perez-Castillo Y, Morales-Helguera A, Vasconcelos V, Antunes A. TI2BioP: topological indices to BioPolymers. Its practical use to unravel cryptic bacteriocin-like domains. Amino Acids. 2011;40(2):431\u201342.","journal-title":"Amino Acids"},{"key":"1758_CR30","doi-asserted-by":"crossref","first-page":"162","DOI":"10.1186\/s12859-015-0586-0","volume":"16","author":"YB Ruiz-Blanco","year":"2015","unstructured":"Ruiz-Blanco YB, Paz W, Green J, Marrero-Ponce Y. ProtDCal: a program to compute general-purpose-numerical descriptors for sequences and 3D-structures of proteins. BMC Bioinformatics. 2015;16:162.","journal-title":"BMC Bioinformatics"},{"key":"1758_CR31","doi-asserted-by":"crossref","unstructured":"Ruiz-Blanco YB, Marrero-Ponce Y, Garc\u00eda-Hern\u00e1ndez E, Green J. Novel \u201cextended sequons\u201d of human N-glycosylation sites improve the precision of qualitative predictions: an alignment-free study of pattern recognition using ProtDCal protein features. Amino Acids. 2017; 49(2):317-25.","DOI":"10.1007\/s00726-016-2362-5"},{"key":"1758_CR32","doi-asserted-by":"crossref","first-page":"588","DOI":"10.1021\/acs.jcim.5b00630","volume":"56","author":"A Speck-Planche","year":"2016","unstructured":"Speck-Planche A, Kleandrova VV, Ruso JM, Cordeiro MNDS. First multitarget chemo-Bioinformatic model to enable the discovery of antibacterial peptides against multiple gram-positive pathogens. J Chem Inf Model. 2016;56:588\u201398.","journal-title":"J Chem Inf Model"},{"issue":"4","key":"1758_CR33","doi-asserted-by":"crossref","first-page":"771","DOI":"10.1016\/S0022-2836(03)00628-4","volume":"330","author":"PD Dobson","year":"2003","unstructured":"Dobson PD, Doig AJ. Distinguishing enzyme structures from non-enzymes without alignments. J Mol Biol. 2003;330(4):771\u201383.","journal-title":"J Mol Biol"},{"key":"1758_CR34","doi-asserted-by":"crossref","unstructured":"Louie B, Tarczy-Hornoch P, Higdon R, Kolker E. Validating annotations for uncharacterized proteins in Shewanella oneidensis. OMICS A J Integr Biol. 2008;12(3):211\u20135.","DOI":"10.1089\/omi.2008.0051"},{"issue":"1","key":"1758_CR35","doi-asserted-by":"crossref","first-page":"374","DOI":"10.1093\/nar\/28.1.374","volume":"28","author":"S Kawashima","year":"2000","unstructured":"Kawashima S, Kanehisa M. AAindex: amino acid index database. Nucleic Acids Res. 2000;28(1):374.","journal-title":"Nucleic Acids Res"},{"key":"1758_CR36","doi-asserted-by":"crossref","first-page":"1126","DOI":"10.1021\/jm00390a003","volume":"30","author":"S Hellberg","year":"1987","unstructured":"Hellberg S, Sjostrom M, Skagerberg B, Wold S. Peptide quantitative structure-activity relationships, a multivariate approach. J Med Chem. 1987;30:1126\u201335.","journal-title":"J Med Chem"},{"issue":"20","key":"1758_CR37","doi-asserted-by":"crossref","first-page":"4277","DOI":"10.1021\/bi00613a026","volume":"17","author":"M Levitt","year":"1978","unstructured":"Levitt M. Conformational preferences of amino acids in globular proteins. Biochemistry. 1978;17(20):4277\u201385.","journal-title":"Biochemistry"},{"key":"1758_CR38","doi-asserted-by":"crossref","first-page":"105","DOI":"10.1016\/0022-2836(82)90515-0","volume":"157","author":"J Kyte","year":"1982","unstructured":"Kyte J, Doolitle RF. A simple method for displaying the Hydropathic character of a protein. J Mol Biol. 1982;157:105\u201332.","journal-title":"J Mol Biol"},{"key":"1758_CR39","doi-asserted-by":"crossref","first-page":"2705","DOI":"10.1021\/jm00014a022","volume":"38","author":"ER Collantes","year":"1995","unstructured":"Collantes ER, Dunn-III WJ. Amino acid side chain descriptors for quantitative structure-activity relationship studies of peptide analogues. J Med Chem. 1995;38:2705\u201313.","journal-title":"J Med Chem"},{"key":"1758_CR40","doi-asserted-by":"crossref","first-page":"434","DOI":"10.1006\/bioo.1999.1150","volume":"27","author":"S Katrin","year":"1999","unstructured":"Katrin S, Karelson M, J\u00e4rv J. Modeling of the amino acid side chain effects on peptide conformation. Bioorg Chem. 1999;27:434\u201342.","journal-title":"Bioorg Chem"},{"key":"1758_CR41","doi-asserted-by":"crossref","first-page":"407","DOI":"10.1016\/j.jtbi.2014.09.002","volume":"364","author":"YB Ruiz-Blanco","year":"2015","unstructured":"Ruiz-Blanco YB, Marrero-Ponce Y, Prieto PJ, Salgado J, Garc\u00eda Y, Sotomayor-Torres CM. A Hooke\u2032 s law-based approach to protein folding rate. J Theor Biol. 2015;364:407\u201317.","journal-title":"J Theor Biol"},{"key":"1758_CR42","doi-asserted-by":"crossref","first-page":"44","DOI":"10.1016\/j.jtbi.2012.12.023","volume":"321","author":"YB Ruiz-Blanco","year":"2013","unstructured":"Ruiz-Blanco YB, Marrero-Ponce Y, Paz W, Garc\u00eda Y, Salgado J. Global stability of protein folding from an empirical free energy function. J Theor Biol. 2013;321:44\u201353.","journal-title":"J Theor Biol"},{"key":"1758_CR43","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1016\/j.cplett.2014.07.014","volume":"610\u2013611","author":"YB Ruiz-Blanco","year":"2014","unstructured":"Ruiz-Blanco YB, Marrero-Ponce Y, Garc\u00eda Y, Puris A, Bello R, Green J, Sotomayor-Torres CM. A physics-based scoring function for protein structural decoys:dynamic testing on targets of CASP-ROLL. Chem Phys Lett. 2014;610\u2013611:135\u201340.","journal-title":"Chem Phys Lett"},{"key":"1758_CR44","doi-asserted-by":"crossref","first-page":"801","DOI":"10.1023\/A:1015952613760","volume":"7","author":"LB Kier","year":"1990","unstructured":"Kier LB, Hall LH. An Electrotopological-state index for atoms in molecules. Pharm Res. 1990;7:801\u20137.","journal-title":"Pharm Res"},{"key":"1758_CR45","volume-title":"Molecular structure description. The Electrotopological state","author":"LB Kier","year":"1999","unstructured":"Kier LB, Hall LH. Molecular structure description. The Electrotopological state. London: Academic Press; 1999."},{"key":"1758_CR46","unstructured":"Dunford N, Schwartz JT. Linear operators, vol. I. New York: Interscience; 1958;1963."},{"key":"1758_CR47","doi-asserted-by":"crossref","first-page":"379","DOI":"10.1002\/j.1538-7305.1948.tb01338.x","volume":"27","author":"CE Shannon","year":"1948","unstructured":"Shannon CE. A mathematical theory of communication. Bell Syst Tech J. 1948;27:379\u2013423.","journal-title":"Bell Syst Tech J"},{"issue":"3","key":"1758_CR48","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1016\/S0022-5193(03)00091-2","volume":"223","author":"B N\u00f6lting","year":"2003","unstructured":"N\u00f6lting B, Sch\u00e4like W, Hampel P, Grundig F, Gantert S, Sips N, Bandlow W, Qi PX. Structural determinants of the rate of protein folding. J Theor Biol. 2003;223(3):299\u2013307.","journal-title":"J Theor Biol"},{"issue":"7","key":"1758_CR49","doi-asserted-by":"crossref","first-page":"e65926","DOI":"10.1371\/journal.pone.0065926","volume":"8","author":"G Ag\u00fcero-Chapin","year":"2013","unstructured":"Ag\u00fcero-Chapin G, Molina-Ruiz R, Maldonado E, de la Riva G, S\u00e1nchez-Rodr\u00edguez A, Vasconcelos V, Antunes A. Exploring the adenylation domain repertoire of nonribosomal peptide synthetases using an ensemble of sequence-search methods. PLoS One. 2013;8(7):e65926.","journal-title":"PLoS One"},{"issue":"1","key":"1758_CR50","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1145\/584091.584093","volume":"5","author":"CE Shannon","year":"2001","unstructured":"Shannon CE. A mathematical theory of communication. SIGMOBILE Mob Comput Commun Rev. 2001;5(1):3\u201355.","journal-title":"SIGMOBILE Mob Comput Commun Rev"},{"key":"1758_CR51","first-page":"856","volume":"3","author":"L Yu","year":"2003","unstructured":"Yu L, Liu H. Feature selection for high-dimensional data: a fast correlation-based filter solution. ICML. 2003;3:856\u201363.","journal-title":"ICML"},{"issue":"2","key":"1758_CR52","doi-asserted-by":"crossref","first-page":"305","DOI":"10.1007\/s11030-014-9565-z","volume":"19","author":"RWP Urias","year":"2015","unstructured":"Urias RWP, Barigye SJ, Marrero-Ponce Y, Garc\u00eda-Jacas CR, Valdes-Martin\u00ed JR, Perez-Gimenez F. IMMAN: free software for information theory-based chemometric analysis. Mol Divers. 2015;19(2):305\u201319.","journal-title":"Mol Divers"},{"key":"1758_CR53","doi-asserted-by":"crossref","first-page":"87","DOI":"10.1021\/ci0103065","volume":"42","author":"JW Godden","year":"2002","unstructured":"Godden JW, Bajorath J. Chemical descriptors with distinct levels of information content and varying sensitivity to differences between selected compound databases identified by SE-DSE analysis. J Chem Inf Comput Sci. 2002;42:87\u201393.","journal-title":"J Chem Inf Comput Sci"},{"key":"1758_CR54","doi-asserted-by":"crossref","first-page":"796","DOI":"10.1021\/ci000321u","volume":"40","author":"JW Godden","year":"2000","unstructured":"Godden JW, Stahura FL, Bajorath J. Variability of molecular descriptors in compound databases revealed by Shannon entropy calculations. J Chem Inf Comput Sci. 2000;40:796\u2013800.","journal-title":"J Chem Inf Comput Sci"},{"key":"1758_CR55","unstructured":"Goldberg DE. Genetic Algorithms in Search, Optimization and Machine Learning. Boston: Addison-Wesley Longman Publishing Co., Inc."},{"key":"1758_CR56","doi-asserted-by":"crossref","unstructured":"Hall M, Frank E, Holmes G, Pfahringer B, Reutemann P, Witten IH. The WEKA Data Mining Software: An Update. SIGKDD Explorations. 2009;11(1):10-8.","DOI":"10.1145\/1656274.1656278"},{"issue":"1","key":"1758_CR57","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1093\/nar\/28.1.257","volume":"28","author":"LL Conte","year":"2000","unstructured":"Conte LL, Ailey B, Hubbard TJ, Brenner SE, Murzin AG, Chothia C. SCOP: a structural classification of proteins database. Nucleic Acids Res. 2000;28(1):257\u20139.","journal-title":"Nucleic Acids Res"},{"issue":"5","key":"1758_CR58","doi-asserted-by":"crossref","first-page":"643","DOI":"10.1002\/pro.2635","volume":"24","author":"DB Roche","year":"2015","unstructured":"Roche DB, Bruls T. The enzymatic nature of an anonymous protein sequence cannot reliably be inferred from superfamily level structural information alone. Protein Sci. 2015;24(5):643\u201350.","journal-title":"Protein Sci"},{"issue":"1","key":"1758_CR59","doi-asserted-by":"crossref","first-page":"105","DOI":"10.1016\/S0022-2836(02)01036-7","volume":"324","author":"GJ Bartlett","year":"2002","unstructured":"Bartlett GJ, Porter CT, Borkakoti N, Thornton JM. Analysis of catalytic residues in enzyme active sites. J Mol Biol. 2002;324(1):105\u201321.","journal-title":"J Mol Biol"},{"key":"1758_CR60","doi-asserted-by":"crossref","first-page":"3190","DOI":"10.1074\/jbc.272.6.3190","volume":"272","author":"B Yan","year":"1997","unstructured":"Yan B, Sun Y. Glycine residues provide flexibility for enzyme active sites. J Biol Chem. 1997;272:3190\u20134.","journal-title":"J Biol Chem"},{"key":"1758_CR61","first-page":"200","volume-title":"Prienciples of biochemistry","author":"DL Nelson","year":"2012","unstructured":"Nelson DL, Cox MM. Specific catalytic groups contribute to catalysis. In: Ahr K, editor. Prienciples of biochemistry. 6th ed. New York: Sara Tenney (W. H. Freeman and Company); 2012. p. 200\u20132.","edition":"6th"},{"key":"1758_CR62","unstructured":"Shervashidze N. Scalable graph kernels. PhD thesis, Universit\u00e4t T\u00fcbingen; 2012. Available at http:\/\/hdl.handle.net\/10900\/49731 ."},{"key":"1758_CR63","unstructured":"Senelle M. Measures on graphs: from similarity to density. PhD thesis, Universit\u00e9 catholique de Louvain; 2014. Available at https:\/\/dial.uclouvain.be\/pr\/boreal\/object\/boreal:161671 ."},{"key":"1758_CR64","unstructured":"Shervashidze N, Schweitzer P, Van Leeuwen EJ, Mehlhorn K, Borgwardt KM. Weisfeiler-lehman graph kernels. J Mach Learn Res. 2011;12:2539\u201361."},{"issue":"2","key":"1758_CR65","doi-asserted-by":"crossref","first-page":"209","DOI":"10.1007\/s10994-015-5517-9","volume":"102","author":"M Neumann","year":"2016","unstructured":"Neumann M, Garnett R, Bauckhage C, Kersting K. Propagation kernels: efficient graph kernels from propagated information. Mach Learn. 2016;102(2):209\u201345.","journal-title":"Mach Learn"},{"issue":"4","key":"1758_CR66","doi-asserted-by":"crossref","first-page":"265","DOI":"10.1002\/sam.11153","volume":"5","author":"G Li","year":"2012","unstructured":"Li G, Semerci M, Yener B, Zaki MJ. Effective graph classification based on topological and label attributes. Stat Anal Data Min. 2012;5(4):265\u201383.","journal-title":"Stat Anal Data Min"},{"key":"1758_CR67","unstructured":"Li G, Semerci M, Yener B, Zaki MJ. Graph classification via topological and label attributes. In: Proceedings of the 9th international workshop on mining and learning with graphs (MLG), San Diego; 2011."},{"issue":"3","key":"1758_CR68","doi-asserted-by":"crossref","first-page":"1172","DOI":"10.1016\/j.patcog.2013.09.010","volume":"47","author":"L Bai","year":"2014","unstructured":"Bai L, Hancock ER. Depth-based complexity traces of graphs. Pattern Recogn. 2014;47(3):1172\u201386.","journal-title":"Pattern Recogn"},{"key":"1758_CR69","volume-title":"IJCAI proceedings-international joint conference on artificial intelligence IJCAI","author":"F Orsini","year":"2015","unstructured":"Orsini F, Frasconi P, De Raedt L. Graph invariant kernels. In: IJCAI proceedings-international joint conference on artificial intelligence IJCAI; 2015."},{"key":"1758_CR70","volume-title":"Fast shortest-path kernel computations using approximate methods","author":"J Kilham","year":"2015","unstructured":"Kilham J. Fast shortest-path kernel computations using approximate methods. 2015."},{"key":"1758_CR71","doi-asserted-by":"crossref","unstructured":"Johansson FD, Frost O, Retzner C, Dubhashi D. Classifying Large Graphs with Differential Privacy. In: Modeling Decisions for Artificial Intelligence. Cham: Springer; 2015. p. 3\u201317.","DOI":"10.1007\/978-3-319-23240-9_1"},{"issue":"1","key":"1758_CR72","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1016\/j.chemolab.2005.09.003","volume":"81","author":"B \u00dcst\u00fcn","year":"2006","unstructured":"\u00dcst\u00fcn B, Melssen WJ, Buydens LM. Facilitating the application of support vector regression by using a universal Pearson VII function based kernel. Chemom Intell Lab Syst. 2006;81(1):29\u201340.","journal-title":"Chemom Intell Lab Syst"},{"key":"1758_CR73","doi-asserted-by":"crossref","first-page":"16","DOI":"10.1016\/j.compbiolchem.2013.05.001","volume":"46","author":"G Zhang","year":"2013","unstructured":"Zhang G, Ge H. Support vector machine with a Pearson VII function kernel for discriminating halophilic and non-halophilic proteins. Comput Biol Chem. 2013;46:16\u201322.","journal-title":"Comput Biol Chem"},{"key":"1758_CR74","doi-asserted-by":"crossref","unstructured":"Qifu Z, Haifeng H, Youzheng Z, Guodong S. Support vector machine based on universal kernel function and its application in quantitative structure-toxicity relationship model. In: Information Technology and Applications, 2009 IFITA'09 International Forum on: 2009. IEEE: Chengdu; 2009. p. 708-11.","DOI":"10.1109\/IFITA.2009.256"},{"issue":"1","key":"1758_CR75","doi-asserted-by":"crossref","first-page":"74","DOI":"10.1111\/cbdd.12834","volume":"89","author":"A Qureshi","year":"2017","unstructured":"Qureshi A, Kaur G, Kumar M. AVCpred: an integrated web server for prediction and design of antiviral compounds. Chem Biol Drug Des. 2017;89(1):74\u201383.","journal-title":"Chem Biol Drug Des"},{"issue":"7","key":"1758_CR76","doi-asserted-by":"crossref","first-page":"e1002101","DOI":"10.1371\/journal.pcbi.1002101","volume":"7","author":"WS Sanders","year":"2011","unstructured":"Sanders WS, Johnston CI, Bridges SM, Burgess SC, Willeford KO. Prediction of cell penetrating peptides by support vector machines. PLoS Comput Biol. 2011;7(7):e1002101.","journal-title":"PLoS Comput Biol"},{"issue":"11","key":"1758_CR77","doi-asserted-by":"crossref","first-page":"1118","DOI":"10.1038\/nbt749","volume":"20","author":"JF Heidelberg","year":"2002","unstructured":"Heidelberg JF, Paulsen IT, Nelson KE, Gaidos EJ, Nelson WC, Read TD, Eisen JA, Seshadri R, Ward N, Methe B. Genome sequence of the dissimilatory metal ion\u2013reducing bacterium Shewanella oneidensis. Nat Biotechnol. 2002;20(11):1118\u201323.","journal-title":"Nat Biotechnol"},{"issue":"1","key":"1758_CR78","doi-asserted-by":"crossref","first-page":"304","DOI":"10.1093\/nar\/28.1.304","volume":"28","author":"A Bairoch","year":"2000","unstructured":"Bairoch A. The ENZYME database in 2000. Nucleic Acids Res. 2000;28(1):304\u20135.","journal-title":"Nucleic Acids Res"},{"issue":"Database issue","key":"1758_CR79","doi-asserted-by":"crossref","first-page":"D764","DOI":"10.1093\/nar\/gks1049","volume":"41","author":"I Schomburg","year":"2013","unstructured":"Schomburg I, Chang A, Placzek S, Sohngen C, Rother M, Lang M, Munaretto C, Ulas S, Stelzer M, Grote A, et al. BRENDA in 2013: integrated reactions, kinetic data, enzyme function data, improved disease classification: new options and contents in BRENDA. Nucleic Acids Res. 2013;41(Database issue):D764\u201372.","journal-title":"Nucleic Acids Res"}],"container-title":["BMC Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s12859-017-1758-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,24]],"date-time":"2025-06-24T17:07:44Z","timestamp":1750784864000},"score":1,"resource":{"primary":{"URL":"http:\/\/bmcbioinformatics.biomedcentral.com\/articles\/10.1186\/s12859-017-1758-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,7,21]]},"references-count":79,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["1758"],"URL":"https:\/\/doi.org\/10.1186\/s12859-017-1758-x","relation":{},"ISSN":["1471-2105"],"issn-type":[{"type":"electronic","value":"1471-2105"}],"subject":[],"published":{"date-parts":[[2017,7,21]]},"article-number":"349"}}