{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,8,2]],"date-time":"2024-08-02T04:30:26Z","timestamp":1722573026439},"reference-count":55,"publisher":"Public Library of Science (PLoS)","issue":"7","content-domain":{"domain":["www.plosone.org"],"crossmark-restriction":false},"short-container-title":["PLoS ONE"],"DOI":"10.1371\/journal.pone.0065926","type":"journal-article","created":{"date-parts":[[2013,7,16]],"date-time":"2013-07-16T21:05:53Z","timestamp":1374008753000},"page":"e65926","update-policy":"http:\/\/dx.doi.org\/10.1371\/journal.pone.corrections_policy","source":"Crossref","is-referenced-by-count":7,"title":["Exploring the Adenylation Domain Repertoire of Nonribosomal Peptide Synthetases Using an Ensemble of Sequence-Search Methods"],"prefix":"10.1371","volume":"8","author":[{"given":"Guillermin","family":"Ag\u00fcero-Chapin","sequence":"first","affiliation":[]},{"given":"Reinaldo","family":"Molina-Ruiz","sequence":"additional","affiliation":[]},{"given":"Emanuel","family":"Maldonado","sequence":"additional","affiliation":[]},{"given":"Gustavo","family":"de la Riva","sequence":"additional","affiliation":[]},{"given":"Aminael","family":"S\u00e1nchez-Rodr\u00edguez","sequence":"additional","affiliation":[]},{"given":"Vitor","family":"Vasconcelos","sequence":"additional","affiliation":[]},{"given":"Agostinho","family":"Antunes","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2013,7,16]]},"reference":[{"key":"ref1","doi-asserted-by":"crossref","first-page":"790","DOI":"10.1021\/cr800198j","article-title":"Graphical representation of proteins","volume":"111","author":"M Randic","year":"2011","journal-title":"Chem Rev"},{"key":"ref2","doi-asserted-by":"crossref","unstructured":"Randi\u0107 M (2004) Graphical representation of DNA as a 2-D map. Chem Phys Lett: 468\u2013471.","DOI":"10.1016\/j.cplett.2004.01.088"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"290","DOI":"10.1016\/j.jmgm.2006.12.006","article-title":"On representation of proteins by star-like graphs","volume":"26","author":"M Randic","year":"2007","journal-title":"J Mol Graph Model"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"191","DOI":"10.1080\/10629360410001697753","article-title":"Highly compact 2D graphical representation of DNA sequences","volume":"15","author":"M Randic","year":"2004","journal-title":"SAR QSAR Environ Res"},{"key":"ref5","first-page":"149","article-title":"Recent investigations into global characteristics of long DNA sequences","volume":"31","author":"A Nandy","year":"1994","journal-title":"Indian J Biochem Biophys"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"2122","DOI":"10.1021\/pr800867y","article-title":"Alignment-free prediction of polygalacturonases with pseudofolding topological indices: experimental isolation from Coffea arabica and prediction of a new sequence","volume":"8","author":"G Aguero-Chapin","year":"2009","journal-title":"J Proteome Res"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"619","DOI":"10.1021\/tx700296t","article-title":"3D-MEDNEs: an alternative \u201cin silico\u201d technique for chemical research in toxicology. 2. quantitative proteome-toxicity relationships (QPTR) based on mass spectrum spiral entropy","volume":"21","author":"M Cruz-Monteagudo","year":"2008","journal-title":"Chem Res Toxicol"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"e26638","DOI":"10.1371\/journal.pone.0026638","article-title":"An alignment-free approach for eukaryotic ITS2 annotation and phylogenetic inference","volume":"6","author":"G Aguero-Chapin","year":"2011","journal-title":"PLoS One"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"550","DOI":"10.1021\/ci000095o","article-title":"On interpretation of well-known topological indices","volume":"41","author":"M Randic","year":"2001","journal-title":"J Chem Inf Comput Sci"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"1573","DOI":"10.2174\/0929867013371923","article-title":"Recent advances on the role of topological indices in drug discovery research","volume":"8","author":"E Estrada","year":"2001","journal-title":"Curr Med Chem"},{"key":"ref11","doi-asserted-by":"crossref","first-page":"136","DOI":"10.1016\/j.jtbi.2009.07.029","article-title":"Generalized lattice graphs for 2D-visualization of biological information","volume":"261","author":"H Gonzalez-Diaz","year":"2009","journal-title":"J Theor Biol"},{"key":"ref12","doi-asserted-by":"crossref","first-page":"637","DOI":"10.1016\/j.jmgm.2008.10.004","article-title":"Graphical representation of proteins as four-color maps and their numerical characterization","volume":"27","author":"M Randic","year":"2009","journal-title":"J Mol Graph Model"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"3389","DOI":"10.1093\/nar\/25.17.3389","article-title":"Gapped BLAST and PSI-BLAST: a new generation of protein database search programs","volume":"25","author":"SF Altschul","year":"1997","journal-title":"Nucleic Acids Res"},{"key":"ref14","first-page":"205","article-title":"A new generation of homology search tools based on probabilistic inference","volume":"23","author":"SR Eddy","year":"2009","journal-title":"Genome Inform"},{"key":"ref15","doi-asserted-by":"crossref","first-page":"W405","DOI":"10.1093\/nar\/gkh359","article-title":"NRPS-PKS: a knowledge-based resource for analysis of NRPS\/PKS megasynthases","volume":"32","author":"MZ Ansari","year":"2004","journal-title":"Nucleic Acids Res"},{"key":"ref16","doi-asserted-by":"crossref","first-page":"874","DOI":"10.1039\/b810283j","article-title":"Bioinformatic perspectives on NRPS\/PKS megasynthases: advances and challenges","volume":"26","author":"H Jenke-Kodama","year":"2009","journal-title":"Nat Prod Rep"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"530","DOI":"10.1111\/j.1574-6976.2006.00022.x","article-title":"Cyanobacterial peptides \u2013 nature&apos;s own combinatorial biosynthesis","volume":"30","author":"M Welker","year":"2006","journal-title":"FEMS Microbiol Rev"},{"key":"ref18","unstructured":"Molina R, Ag\u00fcero-Chapin G, P\u00e9rez-Gonz\u00e1lez MP (2011) TI2BioP (Topological Indices to BioPolymers) <italic>version 2.0.<\/italic>: Molecular Simulation and Drug Design (MSDD), Chemical Bioactives Center, Central University of Las Villas, Cuba."},{"key":"ref19","unstructured":"Statsoft (2008) STATISTICA 8.0 (data analysis software system for windows). version 8.0 ed."},{"key":"ref20","doi-asserted-by":"crossref","first-page":"1149","DOI":"10.1021\/jm0509849","article-title":"A QSAR model for in silico screening of MAO-A inhibitors. Prediction, synthesis, and biological assay of novel coumarins","volume":"49","author":"L Santana","year":"2006","journal-title":"J Med Chem"},{"key":"ref21","doi-asserted-by":"crossref","first-page":"502","DOI":"10.1021\/ci049662o","article-title":"In silico studies toward the discovery of new anti-HIV nucleoside compounds through the use of TOPS-MODE and 2D\/3D connectivity indices. 2. Purine derivatives","volume":"45","author":"S Vilar","year":"2005","journal-title":"J Chem Inf Model"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"85","DOI":"10.1093\/protein\/12.2.85","article-title":"Twilight zone of protein sequence alignments","volume":"12","author":"B Rost","year":"1999","journal-title":"Protein Eng"},{"key":"ref23","doi-asserted-by":"crossref","first-page":"390","DOI":"10.1006\/jmbi.1995.0442","article-title":"A sequence property approach to searching protein databases","volume":"251","author":"U Hobohm","year":"1995","journal-title":"J Mol Biol"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"798","DOI":"10.1093\/bioinformatics\/btn037","article-title":"ConFunc--functional annotation in the twilight zone","volume":"24","author":"MN Wass","year":"2008","journal-title":"Bioinformatics"},{"key":"ref25","doi-asserted-by":"crossref","first-page":"2710","DOI":"10.2174\/138161210792389207","article-title":"Review of QSAR models for enzyme classes of drug targets: Theoretical background and applications in parasites, hosts, and other organisms","volume":"16","author":"R Concu","year":"2010","journal-title":"Curr Pharm Des"},{"key":"ref26","doi-asserted-by":"crossref","first-page":"602","DOI":"10.1016\/j.ygeno.2007.01.008","article-title":"Simple alignment-free methods for protein classification: a case study from G-protein-coupled receptors","volume":"89","author":"PK Strope","year":"2007","journal-title":"Genomics"},{"key":"ref27","doi-asserted-by":"crossref","first-page":"811","DOI":"10.2174\/092986607781483778","article-title":"Prediction of protein structure classes with pseudo amino acid composition and fuzzy support vector machine network","volume":"14","author":"YS Ding","year":"2007","journal-title":"Protein Pept Lett"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"167","DOI":"10.1016\/j.jtbi.2010.12.019","article-title":"Non-linear models based on simple topological indices to identify RNase III protein members","volume":"273","author":"G Aguero-Chapin","year":"2011","journal-title":"J Theor Biol"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"727","DOI":"10.1002\/jcc.10222","article-title":"Prediction of protein secondary structure content by artificial neural network","volume":"24","author":"YD Cai","year":"2003","journal-title":"J Comput Chem"},{"key":"ref30","doi-asserted-by":"crossref","first-page":"179","DOI":"10.1016\/S0097-8485(01)00106-1","article-title":"Artificial neural network model for predicting protein subcellular location","volume":"26","author":"YD Cai","year":"2002","journal-title":"Comput Chem"},{"key":"ref31","doi-asserted-by":"crossref","first-page":"607","DOI":"10.1080\/07391102.2001.10506692","article-title":"Artificial neural network model for predicting membrane protein types","volume":"18","author":"YD Cai","year":"2001","journal-title":"J Biomol Struct Dyn"},{"key":"ref32","doi-asserted-by":"crossref","first-page":"386","DOI":"10.1016\/j.ab.2007.10.012","article-title":"PseAAC: a flexible web server for generating various kinds of protein pseudo amino acid composition","volume":"373","author":"HB Shen","year":"2008","journal-title":"Anal Biochem"},{"key":"ref33","doi-asserted-by":"crossref","first-page":"246","DOI":"10.1002\/prot.1035","article-title":"Prediction of protein cellular attributes using pseudo-amino acid composition","volume":"43","author":"KC Chou","year":"2001","journal-title":"Proteins"},{"key":"ref34","first-page":"121","article-title":"COPid: composition based protein identification","volume":"8","author":"M Kumar","year":"2008","journal-title":"In Silico Biol"},{"key":"ref35","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1093\/bioinformatics\/bth466","article-title":"Using amphiphilic pseudo amino acid composition to predict enzyme subfamily classes","volume":"21","author":"KC Chou","year":"2005","journal-title":"Bioinformatics"},{"key":"ref36","doi-asserted-by":"crossref","unstructured":"Boekhorst J, Snel B (2007) Identification of homologs in insignificant blast hits by exploiting extrinsic gene properties. BMC Bioinformatics 8.","DOI":"10.1186\/1471-2105-8-356"},{"key":"ref37","doi-asserted-by":"crossref","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","article-title":"Basic Local Alignment Search Tool","volume":"215","author":"SF Altschul","year":"1990","journal-title":"J Mol Biol"},{"key":"ref38","doi-asserted-by":"crossref","first-page":"W273","DOI":"10.1093\/nar\/gkl237","article-title":"BAGEL: a web-based bacteriocin genome mining tool","volume":"34","author":"A de Jong","year":"2006","journal-title":"Nucleic Acids Res"},{"key":"ref39","doi-asserted-by":"crossref","unstructured":"Koetschan C, Forster F, Keller A, Schleicher T, Ruderisch B, <etal>et al<\/etal>.. (2009) The ITS2 Database III--sequences and structures for phylogeny. Nucleic Acids Res.","DOI":"10.1093\/nar\/gkp966"},{"key":"ref40","doi-asserted-by":"crossref","first-page":"702","DOI":"10.1002\/jcc.22903","article-title":"Very efficient search for protein alignment\u2013VESPA","volume":"33","author":"M Randic","year":"2012","journal-title":"J Comput Chem"},{"key":"ref41","doi-asserted-by":"crossref","first-page":"77","DOI":"10.1002\/jcc.23105","article-title":"Very efficient search for nucleotide alignments","volume":"34","author":"M Randic","year":"2013","journal-title":"J Comput Chem"},{"key":"ref42","doi-asserted-by":"crossref","first-page":"431","DOI":"10.1007\/s00726-010-0653-9","article-title":"TI2BioP: Topological Indices to BioPolymers. Its practical use to unravel cryptic bacteriocin-like domains","volume":"40","author":"G Aguero-Chapin","year":"2011","journal-title":"Amino Acids"},{"key":"ref43","doi-asserted-by":"crossref","first-page":"454","DOI":"10.1186\/1471-2105-9-454","article-title":"In silico analysis of methyltransferase domains involved in biosynthesis of secondary metabolites","volume":"9","author":"MZ Ansari","year":"2008","journal-title":"BMC Bioinformatics"},{"key":"ref44","doi-asserted-by":"crossref","first-page":"205","DOI":"10.1016\/j.cplett.2005.03.086","article-title":"Four-color map representation of DNA or RNA sequences and their numerical characterization","volume":"407","author":"M Randic","year":"2005","journal-title":"Chemical Physics Letters"},{"key":"ref45","first-page":"723","article-title":"Novel 2D maps and coupling numbers for protein sequences","volume":"580","author":"G Aguero-Chapin","year":"2006","journal-title":"The first QSAR study of polygalacturonases; isolation and prediction of a novel sequence from Psidium guajava L. FEBS Lett"},{"key":"ref46","doi-asserted-by":"crossref","first-page":"844","DOI":"10.1021\/ci950187r","article-title":"Spectral Moments of the Edge Adjacency Matrix in Molecular Graphs. 1. Definition and Applications to the Prediction of Physical Properties of Alkanes","volume":"36","author":"E Estrada","year":"1996","journal-title":"J Chem Inf Comput Sci"},{"key":"ref47","doi-asserted-by":"crossref","first-page":"5179","DOI":"10.1021\/ja00124a002","article-title":"A second generation force field for the simulation of proteins, nucleic acids, and organic molecules","volume":"117","author":"WD Cornell","year":"1995","journal-title":"J Am Chem Soc"},{"key":"ref48","doi-asserted-by":"crossref","first-page":"1005","DOI":"10.1016\/j.bmc.2004.11.040","article-title":"Atom, atom-type and total molecular linear indices as a promising approach for bioorganic and medicinal chemistry: theoretical and experimental assessment of a novel method for virtual screening and rational design of new lead anthelmintic","volume":"13","author":"Y Marrero-Ponce","year":"2005","journal-title":"Bioorg Med Chem"},{"key":"ref49","doi-asserted-by":"crossref","first-page":"5331","DOI":"10.1016\/j.bmc.2004.07.051","article-title":"3D-chiral quadratic indices of the \u2018molecular pseudograph\u2019s atom adjacency matrix&apos; and their application to central chirality codification: classification of ACE inhibitors and prediction of sigma-receptor antagonist activities","volume":"12","author":"Y Marrero-Ponce","year":"2004","journal-title":"Bioorg Med Chem"},{"key":"ref50","doi-asserted-by":"crossref","first-page":"5331","DOI":"10.1016\/j.bmc.2004.07.051","article-title":"3D-chiral quadratic indices of the \u2018molecular pseudograph\u2019s atom adjacency matrix&apos; and their application to central chirality codification: classification of ACE inhibitors and prediction of sigma-receptor antagonist activities","volume":"12","author":"YM Ponce","year":"2004","journal-title":"Bioorg Med Chem"},{"key":"ref51","unstructured":"Kutner MH, Nachtsheim CJ, Neter J, Li W (2005) Standardized Multiple Regression Model. Applied Linear Statistical Models. Fifth ed. New York: McGraw Hill. 271\u2013277."},{"key":"ref52","unstructured":"The MathWorks I, editor (2004) Neural network toolbox use\u0155s guide for use with MATLAB. Massachusetts: The Mathworks Inc."},{"key":"ref53","doi-asserted-by":"crossref","first-page":"863","DOI":"10.1162\/089976699300016476","article-title":"On cross validation for model selection","volume":"11","author":"I Rivals","year":"1999","journal-title":"Neural Comput"},{"key":"ref54","doi-asserted-by":"crossref","first-page":"4673","DOI":"10.1093\/nar\/22.22.4673","article-title":"CLUSTAL W: improving the sensitivity of progressive multiple sequence alignment through sequence weighting, position-specific gap penalties and weight matrix choice","volume":"22","author":"JD Thompson","year":"1994","journal-title":"Nucleic Acids Res"},{"key":"ref55","doi-asserted-by":"crossref","first-page":"564","DOI":"10.1080\/10635150701472164","article-title":"Improvement of phylogenies after removing divergent and ambiguously aligned blocks from protein sequence alignments","volume":"56","author":"G Talavera","year":"2007","journal-title":"Syst Biol"}],"container-title":["PLoS ONE"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/dx.plos.org\/10.1371\/journal.pone.0065926","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,5,8]],"date-time":"2020-05-08T22:26:57Z","timestamp":1588976817000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pone.0065926"}},"subtitle":[],"editor":[{"given":"Christos A.","family":"Ouzounis","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2013,7,16]]},"references-count":55,"journal-issue":{"issue":"7","published-online":{"date-parts":[[2013,7,16]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pone.0065926","relation":{},"ISSN":["1932-6203"],"issn-type":[{"value":"1932-6203","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,7,16]]}}}