{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,11]],"date-time":"2026-04-11T02:17:26Z","timestamp":1775873846953,"version":"3.50.1"},"update-to":[{"DOI":"10.1371\/journal.pcbi.1007760","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2020,7,30]],"date-time":"2020-07-30T00:00:00Z","timestamp":1596067200000}}],"reference-count":87,"publisher":"Public Library of Science (PLoS)","issue":"7","license":[{"start":{"date-parts":[[2020,7,20]],"date-time":"2020-07-20T00:00:00Z","timestamp":1595203200000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1007760","type":"journal-article","created":{"date-parts":[[2020,7,20]],"date-time":"2020-07-20T13:35:15Z","timestamp":1595252115000},"page":"e1007760","update-policy":"https:\/\/doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":3,"title":["A novel riboswitch classification based on imbalanced sequences achieved by machine learning"],"prefix":"10.1371","volume":"16","author":[{"given":"Solomon Shiferaw","family":"Beyene","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8909-8718","authenticated-orcid":true,"given":"Tianyi","family":"Ling","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8356-1203","authenticated-orcid":true,"given":"Blagoj","family":"Ristevski","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9677-1699","authenticated-orcid":true,"given":"Ming","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"340","published-online":{"date-parts":[[2020,7,20]]},"reference":[{"key":"pcbi.1007760.ref001","doi-asserted-by":"crossref","first-page":"455","DOI":"10.1146\/annurev-biophys-070816-034042","article-title":"Long-range interactions in riboswitch control of gene expression","volume":"46","author":"CP Jones","year":"2017","journal-title":"Annual review of biophysics"},{"issue":"6","key":"pcbi.1007760.ref002","doi-asserted-by":"crossref","first-page":"451","DOI":"10.1038\/nrm1403","article-title":"Gene regulation by riboswitches","volume":"5","author":"M Mandal","year":"2004","journal-title":"Nat Rev Mol Cell Biol"},{"key":"pcbi.1007760.ref003","article-title":"iLearn: an integrated platform and meta-learner for feature engineering, machine-learning analysis and modeling of DNA, RNA and protein sequence data","author":"Z Chen","year":"2019","journal-title":"Brief Bioinform"},{"issue":"21","key":"pcbi.1007760.ref004","doi-asserted-by":"crossref","first-page":"3012","DOI":"10.1093\/bioinformatics\/btu479","article-title":"A new approach for detecting riboswitches in DNA sequences","volume":"30","author":"JT Havill","year":"2014","journal-title":"Bioinformatics"},{"issue":"6","key":"pcbi.1007760.ref005","doi-asserted-by":"crossref","first-page":"867","DOI":"10.1016\/j.molcel.2011.08.024","article-title":"Prospects for riboswitch discovery and analysis","volume":"43","author":"RR Breaker","year":"2011","journal-title":"Mol Cell"},{"issue":"1\u20132","key":"pcbi.1007760.ref006","doi-asserted-by":"crossref","first-page":"17","DOI":"10.1016\/j.cell.2012.12.024","article-title":"A decade of riboswitches","volume":"152","author":"A Serganov","year":"2013","journal-title":"Cell"},{"issue":"11","key":"pcbi.1007760.ref007","doi-asserted-by":"crossref","first-page":"1031","DOI":"10.1038\/s41589-019-0391-6","article-title":"A newborn RNA switches its fate","volume":"15","author":"ML Rodgers","year":"2019","journal-title":"Nat Chem Biol"},{"key":"pcbi.1007760.ref008","doi-asserted-by":"crossref","first-page":"305","DOI":"10.1146\/annurev.biochem.78.070507.135656","article-title":"The structural and functional diversity of metabolite-binding riboswitches","volume":"78","author":"A Roth","year":"2009","journal-title":"Annu Rev Biochem"},{"issue":"Database issue","key":"pcbi.1007760.ref009","doi-asserted-by":"crossref","first-page":"D30","DOI":"10.1093\/nar\/gku1216","article-title":"GenBank","volume":"43","author":"DA Benson","year":"2015","journal-title":"Nucleic Acids Res"},{"issue":"30","key":"pcbi.1007760.ref010","doi-asserted-by":"crossref","first-page":"10615","DOI":"10.1021\/ja502873j","article-title":"Modular riboswitch toolsets for synthetic genetic control in diverse bacterial species","volume":"136","author":"CJ Robinson","year":"2014","journal-title":"J Am Chem Soc"},{"issue":"2","key":"pcbi.1007760.ref011","doi-asserted-by":"crossref","first-page":"54","DOI":"10.1016\/j.ncrna.2018.04.003","article-title":"Bacterial riboswitches and RNA thermometers: Nature and contributions to pathogenesis","volume":"3","author":"JM Abduljalil","year":"2018","journal-title":"Noncoding RNA Res"},{"issue":"4","key":"pcbi.1007760.ref012","doi-asserted-by":"crossref","first-page":"531","DOI":"10.1007\/s13353-016-0341-x","article-title":"Emerging applications of riboswitches\u2014from antibacterial targets to molecular tools","volume":"57","author":"P Machtel","year":"2016","journal-title":"J Appl Genet"},{"issue":"6","key":"pcbi.1007760.ref013","doi-asserted-by":"crossref","first-page":"644","DOI":"10.1261\/rna.5090103","article-title":"Metabolite-binding RNA domains are present in the genes of eukaryotes","volume":"9","author":"N Sudarsan","year":"2003","journal-title":"RNA"},{"issue":"4","key":"pcbi.1007760.ref014","doi-asserted-by":"crossref","first-page":"693","DOI":"10.1111\/tpj.12540","article-title":"Small molecules that interact with RNA: riboswitch\u2010based gene control and its involvement in metabolic regulation in plants and algae","volume":"79","author":"SE Bocobza","year":"2014","journal-title":"The Plant Journal"},{"issue":"11","key":"pcbi.1007760.ref015","doi-asserted-by":"crossref","first-page":"3437","DOI":"10.1105\/tpc.107.053645","article-title":"Riboswitch control of gene expression in plants by splicing and alternative 3' end processing of mRNAs","volume":"19","author":"A Wachter","year":"2007","journal-title":"Plant Cell"},{"issue":"3","key":"pcbi.1007760.ref016","doi-asserted-by":"crossref","DOI":"10.1515\/jib-2017-0052","article-title":"Biological Big Bytes: Integrative Analysis of Large Biological Datasets","volume":"14","author":"M Chen","year":"2017","journal-title":"J Integr Bioinform"},{"key":"pcbi.1007760.ref017","article-title":"Versatile interactions and bioinformatics analysis of noncoding RNAs","author":"Q Chen","year":"2018","journal-title":"Brief Bioinform"},{"issue":"Suppl 2","key":"pcbi.1007760.ref018","doi-asserted-by":"crossref","first-page":"S4","DOI":"10.1186\/1471-2105-14-S2-S4","article-title":"An enhanced computational platform for investigating the roles of regulatory RNA and for identifying functional RNA motifs","volume":"14","author":"TH Chang","year":"2013","journal-title":"BMC Bioinformatics"},{"issue":"D1","key":"pcbi.1007760.ref019","doi-asserted-by":"crossref","first-page":"D335","DOI":"10.1093\/nar\/gkx1038","article-title":"Rfam 13.0: shifting to a genome-centric resource for non-coding RNA families","volume":"46","author":"I Kalvari","year":"2018","journal-title":"Nucleic Acids Res"},{"issue":"18","key":"pcbi.1007760.ref020","doi-asserted-by":"crossref","first-page":"3541","DOI":"10.1093\/bioinformatics\/btz093","article-title":"RiboD: a comprehensive database for prokaryotic riboswitches","volume":"35","author":"S Mukherjee","year":"2019","journal-title":"Bioinformatics"},{"issue":"Web Server issue","key":"pcbi.1007760.ref021","doi-asserted-by":"crossref","first-page":"W154","DOI":"10.1093\/nar\/gkh352","article-title":"Riboswitch finder\u2014a tool for identification of riboswitch RNAs","volume":"32","author":"P Bengert","year":"2004","journal-title":"Nucleic Acids Res"},{"issue":"Web Server issue","key":"pcbi.1007760.ref022","doi-asserted-by":"crossref","first-page":"W690","DOI":"10.1093\/nar\/gki445","article-title":"RibEx: a web server for locating riboswitches and other conserved bacterial regulatory elements","volume":"33","author":"C Abreu-Goodger","year":"2005","journal-title":"Nucleic Acids Res"},{"issue":"7","key":"pcbi.1007760.ref023","doi-asserted-by":"crossref","first-page":"1426","DOI":"10.1261\/rna.1623809","article-title":"Computational identification of riboswitches based on RNA conserved functional sequences and conformations","volume":"15","author":"TH Chang","year":"2009","journal-title":"RNA"},{"issue":"3","key":"pcbi.1007760.ref024","doi-asserted-by":"crossref","first-page":"303","DOI":"10.1016\/S0959-440X(00)00088-9","article-title":"Calculating nucleic acid secondary structure","volume":"10","author":"M Zuker","year":"2000","journal-title":"Curr Opin Struct Biol"},{"issue":"2","key":"pcbi.1007760.ref025","first-page":"99","article-title":"Application of supervised machine learning algorithms for the classification of regulatory RNA riboswitches","volume":"16","author":"S Singh","year":"2017","journal-title":"Brief Funct Genomics"},{"key":"pcbi.1007760.ref026","doi-asserted-by":"crossref","first-page":"63","DOI":"10.1016\/j.biosystems.2018.09.001","article-title":"Classification of riboswitch sequences using k-mer frequencies","volume":"174","author":"HA Guillen-Ramirez","year":"2018","journal-title":"Biosystems"},{"issue":"11","key":"pcbi.1007760.ref027","doi-asserted-by":"crossref","first-page":"987","DOI":"10.1038\/nbt.2023","article-title":"How to apply de Bruijn graphs to genome assembly","volume":"29","author":"PE Compeau","year":"2011","journal-title":"Nature biotechnology"},{"issue":"5","key":"pcbi.1007760.ref028","doi-asserted-by":"crossref","first-page":"1792","DOI":"10.1093\/nar\/gkh340","article-title":"MUSCLE: multiple sequence alignment with high accuracy and high throughput","volume":"32","author":"RC Edgar","year":"2004","journal-title":"Nucleic acids research"},{"issue":"1","key":"pcbi.1007760.ref029","doi-asserted-by":"crossref","first-page":"517","DOI":"10.1186\/1471-2164-9-517","article-title":"A new method to compute K-mer frequencies and its application to annotate large repetitive plant genomes","volume":"9","author":"S Kurtz","year":"2008","journal-title":"BMC genomics"},{"key":"pcbi.1007760.ref030","unstructured":"Singh ND, Dhall A. Clustering and learning from imbalanced data. arXiv preprint arXiv:181100972. 2018."},{"issue":"1","key":"pcbi.1007760.ref031","doi-asserted-by":"crossref","first-page":"23","DOI":"10.1111\/j.1541-0420.2011.01645.x","article-title":"Dynamic logistic regression and dynamic model averaging for binary classification","volume":"68","author":"TH McCormick","year":"2012","journal-title":"Biometrics"},{"issue":"12","key":"pcbi.1007760.ref032","doi-asserted-by":"crossref","first-page":"3358","DOI":"10.1016\/j.patcog.2007.04.009","article-title":"Cost-sensitive boosting for classification of imbalanced data","volume":"40","author":"Y Sun","year":"2007","journal-title":"Pattern Recognition"},{"issue":"Aug","key":"pcbi.1007760.ref033","first-page":"975","article-title":"Probability estimates for multi-class classification by pairwise coupling","volume":"5","author":"T-F Wu","year":"2004","journal-title":"Journal of Machine Learning Research"},{"key":"pcbi.1007760.ref034","doi-asserted-by":"crossref","first-page":"321","DOI":"10.1613\/jair.953","article-title":"SMOTE: synthetic minority over-sampling technique","volume":"16","author":"NV Chawla","year":"2002","journal-title":"Journal of artificial intelligence research"},{"key":"pcbi.1007760.ref035","article-title":"Predicting bacterial virulence factors\u2013evaluation of machine learning and negative data strategies","author":"R Rentzsch","year":"2019","journal-title":"Briefings in Bioinformatics"},{"issue":"6","key":"pcbi.1007760.ref036","doi-asserted-by":"crossref","first-page":"614","DOI":"10.1093\/bib\/bbr019","article-title":"Computational challenges of sequence classification in microbiomic data","volume":"12","author":"P Ribeca","year":"2011","journal-title":"Briefings in Bioinformatics"},{"key":"pcbi.1007760.ref037","article-title":"A comprehensive review and performance evaluation of bioinformatics tools for HLA class I peptide-binding prediction","author":"S Mei","year":"2019","journal-title":"Briefings in Bioinformatics"},{"issue":"2","key":"pcbi.1007760.ref038","doi-asserted-by":"crossref","first-page":"482","DOI":"10.1093\/bib\/bbx135","article-title":"A rank-based algorithm of differential expression analysis for small cell line data with statistical control","volume":"20","author":"X Li","year":"2017","journal-title":"Briefings in Bioinformatics"},{"key":"pcbi.1007760.ref039","unstructured":"Woolson R. Wilcoxon signednedo Y, He J, et al. A rank-based algorithm of differential"},{"issue":"1","key":"pcbi.1007760.ref040","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1186\/s12917-016-0745-1","article-title":"Redundant contribution of a Transient Receptor Potential cation channel Member 1 exon 11 single nucleotide polymorphism to equine congenital stationary night blindness","volume":"12","author":"ML Scott","year":"2016","journal-title":"BMC veterinary research"},{"issue":"12","key":"pcbi.1007760.ref041","doi-asserted-by":"crossref","first-page":"1218","DOI":"10.1038\/nsmb.1702","article-title":"Structural basis of ligand binding by a c-di-GMP riboswitch","volume":"16","author":"KD Smith","year":"2009","journal-title":"Nature structural & molecular biology"},{"issue":"6","key":"pcbi.1007760.ref042","doi-asserted-by":"crossref","first-page":"784","DOI":"10.1016\/j.molcel.2009.02.019","article-title":"Structural insights into riboswitch control of the biosynthesis of queuosine, a modified nucleotide found in the anticodon of tRNA","volume":"33","author":"M Kang","year":"2009","journal-title":"Molecular cell"},{"issue":"1","key":"pcbi.1007760.ref043","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1261\/rna.771608","article-title":"Chemical basis of glycine riboswitch cooperativity","volume":"14","author":"M Kwon","year":"2008","journal-title":"Rna"},{"issue":"3","key":"pcbi.1007760.ref044","doi-asserted-by":"crossref","first-page":"259","DOI":"10.1016\/j.str.2007.02.001","article-title":"The THI-box riboswitch, or how RNA binds thiamin pyrophosphate","volume":"15","author":"J Miranda-Rios","year":"2007","journal-title":"Structure"},{"issue":"7097","key":"pcbi.1007760.ref045","doi-asserted-by":"crossref","first-page":"1172","DOI":"10.1038\/nature04819","article-title":"Structure of the S-adenosylmethionine riboswitch regulatory mRNA element","volume":"441","author":"RK Montange","year":"2006","journal-title":"Nature"},{"issue":"5","key":"pcbi.1007760.ref046","doi-asserted-by":"crossref","first-page":"822","DOI":"10.1261\/rna.988608","article-title":"The aptamer core of SAM-IV riboswitches mimics the ligand-binding site of SAM-I riboswitches","volume":"14","author":"Z Weinberg","year":"2008","journal-title":"Rna"},{"issue":"6","key":"pcbi.1007760.ref047","doi-asserted-by":"crossref","first-page":"691","DOI":"10.1016\/j.molcel.2008.01.012","article-title":"Riboswitches that sense S-adenosylhomocysteine and activate genes involved in coenzyme recycling","volume":"29","author":"JX Wang","year":"2008","journal-title":"Molecular cell"},{"issue":"2","key":"pcbi.1007760.ref048","doi-asserted-by":"crossref","first-page":"177","DOI":"10.1038\/nsmb.1371","article-title":"Structure of the SAM-II riboswitch bound to S-adenosylmethionine","volume":"15","author":"SD Gilbert","year":"2008","journal-title":"Nature structural & molecular biology"},{"issue":"25","key":"pcbi.1007760.ref049","doi-asserted-by":"crossref","first-page":"15908","DOI":"10.1073\/pnas.212628899","article-title":"An mRNA structure that controls gene expression by binding FMN","volume":"99","author":"WC Winkler","year":"2002","journal-title":"Proceedings of the National Academy of Sciences"},{"issue":"19","key":"pcbi.1007760.ref050","doi-asserted-by":"crossref","first-page":"2753","DOI":"10.1128\/JB.00476-16","article-title":"Identification and regulation of genes for cobalamin transport in the cyanobacterium Synechococcus sp. strain PCC 7002","volume":"198","author":"AA P\u00e9rez","year":"2016","journal-title":"Journal of bacteriology"},{"issue":"4","key":"pcbi.1007760.ref051","doi-asserted-by":"crossref","first-page":"918","DOI":"10.1111\/j.1365-2958.2008.06208.x","article-title":"A widespread riboswitch candidate that controls bacterial genes involved in molybdenum cofactor and tungsten cofactor metabolism","volume":"68","author":"EE Regulski","year":"2008","journal-title":"Molecular microbiology"},{"issue":"5","key":"pcbi.1007760.ref052","doi-asserted-by":"crossref","first-page":"878","DOI":"10.1016\/j.cell.2007.06.051","article-title":"Structure and mechanism of a metal-sensing regulatory RNA","volume":"130","author":"CE Dann","year":"2007","journal-title":"Cell"},{"issue":"4","key":"pcbi.1007760.ref053","doi-asserted-by":"crossref","first-page":"685","DOI":"10.1261\/rna.937308","article-title":"Confirmation of a second natural preQ1 aptamer class in Streptococcaceae bacteria","volume":"14","author":"MM Meyer","year":"2008","journal-title":"Rna"},{"issue":"6980","key":"pcbi.1007760.ref054","doi-asserted-by":"crossref","first-page":"281","DOI":"10.1038\/nature02362","article-title":"Control of gene expression by a natural metabolite-responsive ribozyme","volume":"428","author":"WC Winkler","year":"2004","journal-title":"Nature"},{"issue":"5","key":"pcbi.1007760.ref055","doi-asserted-by":"crossref","first-page":"577","DOI":"10.1016\/S0092-8674(03)00391-X","article-title":"Riboswitches control fundamental biochemical pathways in Bacillus subtilis and other bacteria","volume":"113","author":"M Mandal","year":"2003","journal-title":"Cell"},{"key":"pcbi.1007760.ref056","doi-asserted-by":"crossref","first-page":"421","DOI":"10.1186\/1471-2105-10-421","article-title":"BLAST+: architecture and applications","volume":"10","author":"C Camacho","year":"2009","journal-title":"BMC Bioinformatics"},{"key":"pcbi.1007760.ref057","article-title":"Protein functional annotation of simultaneously improved stability, accuracy and false discovery rate achieved by a sequence-based deep learning","author":"J Hong","year":"2019","journal-title":"Briefings in bioinformatics"},{"issue":"8","key":"pcbi.1007760.ref058","doi-asserted-by":"crossref","first-page":"e0155290","DOI":"10.1371\/journal.pone.0155290","article-title":"SVM-Prot 2016: a web-server for machine learning prediction of protein functional families from sequence irrespective of similarity","volume":"11","author":"YH Li","year":"2016","journal-title":"PloS one"},{"key":"pcbi.1007760.ref059","article-title":"SubMito-XGBoost: predicting protein submitochondrial localization by fusing multiple feature information and eXtreme gradient boosting","author":"B Yu","year":"2019","journal-title":"Bioinformatics"},{"issue":"1","key":"pcbi.1007760.ref060","doi-asserted-by":"crossref","first-page":"183","DOI":"10.3390\/ijms19010183","article-title":"Assessing the performances of protein function prediction algorithms from the perspectives of identification accuracy and false discovery rate","volume":"19","author":"C Yu","year":"2018","journal-title":"International journal of molecular sciences"},{"issue":"6","key":"pcbi.1007760.ref061","doi-asserted-by":"crossref","first-page":"481","DOI":"10.1111\/tpj.13180","article-title":"A naive Bayesian classifier for identifying plant microRNAs","volume":"86","author":"S Douglass","year":"2016","journal-title":"Plant J"},{"issue":"9","key":"pcbi.1007760.ref062","doi-asserted-by":"crossref","first-page":"1263","DOI":"10.1109\/TKDE.2008.239","article-title":"Learning from imbalanced data","volume":"21","author":"H He","year":"2009","journal-title":"IEEE Transactions on knowledge and data engineering"},{"issue":"21","key":"pcbi.1007760.ref063","doi-asserted-by":"crossref","first-page":"44","DOI":"10.5120\/16919-6729","article-title":"Comparison of nearest neighbor (ibk), regression by discretization and isotonic regression classification algorithms for precipitation classes prediction","volume":"96","author":"SM Mwagha","year":"2014","journal-title":"International Journal of Computer Applications"},{"issue":"5","key":"pcbi.1007760.ref064","doi-asserted-by":"crossref","first-page":"839","DOI":"10.1093\/bib\/bbt012","article-title":"Data construction for phosphorylation site prediction","volume":"15","author":"H Gong","year":"2014","journal-title":"Brief Bioinform"},{"issue":"5","key":"pcbi.1007760.ref065","doi-asserted-by":"crossref","first-page":"429","DOI":"10.3233\/IDA-2002-6504","article-title":"The class imbalance problem: A systematic study","volume":"6","author":"N Japkowicz","year":"2002","journal-title":"Intelligent data analysis"},{"key":"pcbi.1007760.ref066","volume-title":"Data Mining: Practical machine learning tools and techniques","author":"IH Witten","year":"2016"},{"key":"pcbi.1007760.ref067","first-page":"83","article-title":"Data mining concepts and techniques third edition","author":"J Han","year":"2011","journal-title":"The Morgan Kaufmann Series in Data Management Systems"},{"issue":"17","key":"pcbi.1007760.ref068","doi-asserted-by":"crossref","first-page":"2308","DOI":"10.1093\/bioinformatics\/btg299","article-title":"PDB file parser and structure class implemented in Python","volume":"19","author":"T Hamelryck","year":"2003","journal-title":"Bioinformatics"},{"issue":"1","key":"pcbi.1007760.ref069","doi-asserted-by":"crossref","first-page":"380","DOI":"10.1093\/nar\/gkh180","article-title":"Local homology recognition and distance measures in linear time using compressed amino acid alphabets","volume":"32","author":"RC Edgar","year":"2004","journal-title":"Nucleic Acids Research"},{"key":"pcbi.1007760.ref070","article-title":"A critical review of five machine learning-based algorithms for predicting protein stability changes upon mutation","author":"J Fang","year":"2019","journal-title":"Briefings in bioinformatics"},{"key":"pcbi.1007760.ref071","doi-asserted-by":"crossref","first-page":"177","DOI":"10.1016\/bs.mie.2019.05.026","article-title":"Using Rosetta for RNA homology modeling","volume":"623","author":"AM Watkins","year":"2019","journal-title":"Methods in enzymology"},{"key":"pcbi.1007760.ref072","doi-asserted-by":"crossref","unstructured":"Saghir H, Megherbi DB, editors. An efficient comparative machine learning-based metagenomics binning technique via using Random forest. 2013 IEEE International Conference on Computational Intelligence and Virtual Environments for Measurement Systems and Applications (CIVEMSA); 2013: IEEE.","DOI":"10.1109\/CIVEMSA.2013.6617419"},{"key":"pcbi.1007760.ref073","doi-asserted-by":"crossref","first-page":"358","DOI":"10.1186\/s12859-015-0793-8","article-title":"Fizzy: feature subset selection for metagenomics","volume":"16","author":"G Ditzler","year":"2015","journal-title":"BMC Bioinformatics"},{"issue":"24","key":"pcbi.1007760.ref074","doi-asserted-by":"crossref","first-page":"3745","DOI":"10.1093\/bioinformatics\/btw560","article-title":"Imbalanced multi-label learning for identifying antimicrobial peptides and their functional types","volume":"32","author":"W Lin","year":"2016","journal-title":"Bioinformatics"},{"key":"pcbi.1007760.ref075","doi-asserted-by":"crossref","unstructured":"Paper D, Paper D. Scikit-Learn Classifier Tuning from Complex Training Sets. Hands-on Scikit-Learn for Machine Learning Applications: Data Science Fundamentals with Python. 165-88.","DOI":"10.1007\/978-1-4842-5373-1_6"},{"key":"pcbi.1007760.ref076","doi-asserted-by":"crossref","unstructured":"He H, Garcia EA. Learning from Imbalanced Data IEEE Transactions on Knowledge and Data Engineering v. 21 n. 9. September; 2009.","DOI":"10.1109\/TKDE.2008.239"},{"issue":"Mar","key":"pcbi.1007760.ref077","first-page":"1157","article-title":"An introduction to variable and feature selection","volume":"3","author":"I Guyon","year":"2003","journal-title":"Journal of machine learning research"},{"issue":"1","key":"pcbi.1007760.ref078","first-page":"148","article-title":"Comprehensive assessment and performance improvement of effector protein predictors for bacterial secretion systems III, IV and VI","volume":"19","author":"Y An","year":"2018","journal-title":"Brief Bioinform"},{"key":"pcbi.1007760.ref079","doi-asserted-by":"crossref","first-page":"125","DOI":"10.1016\/j.jtbi.2018.01.023","article-title":"PREvaIL, an integrative approach for inferring catalytic residues using sequence, structural, and network features in a machine-learning framework","volume":"443","author":"J Song","year":"2018","journal-title":"Journal of theoretical biology"},{"issue":"1\u20133","key":"pcbi.1007760.ref080","doi-asserted-by":"crossref","first-page":"351","DOI":"10.1023\/A:1012431217818","article-title":"Convergence of a generalized SMO algorithm for SVM classifier design","volume":"46","author":"SS Keerthi","year":"2002","journal-title":"Machine Learning"},{"key":"pcbi.1007760.ref081","first-page":"1189","article-title":"Greedy function approximation: a gradient boosting machine","author":"JH Friedman","year":"2001","journal-title":"Annals of statistics"},{"key":"pcbi.1007760.ref082","volume-title":"Hybrid Methods for Feature Selection","author":"I Cheng","year":"2013"},{"issue":"4","key":"pcbi.1007760.ref083","doi-asserted-by":"crossref","first-page":"451","DOI":"10.1109\/5326.897072","article-title":"Neural networks for classification: a survey","volume":"30","author":"GP Zhang","year":"2000","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics, Part C (Applications and Reviews)"},{"issue":"4","key":"pcbi.1007760.ref084","doi-asserted-by":"crossref","first-page":"472","DOI":"10.1093\/bioinformatics\/btt709","article-title":"Combining evolutionary information extracted from frequency profiles with sequence-based kernels for protein remote homology detection","volume":"30","author":"B Liu","year":"2014","journal-title":"Bioinformatics"},{"issue":"1","key":"pcbi.1007760.ref085","doi-asserted-by":"crossref","first-page":"127","DOI":"10.1186\/1471-2164-15-127","article-title":"Prediction and classification of ncRNAs using structural information","volume":"15","author":"B Panwar","year":"2014","journal-title":"BMC genomics"},{"issue":"suppl_2","key":"pcbi.1007760.ref086","doi-asserted-by":"crossref","first-page":"W345","DOI":"10.1093\/nar\/gkm391","article-title":"CPC: assess the protein-coding potential of transcripts using sequence features and support vector machine","volume":"35","author":"L Kong","year":"2007","journal-title":"Nucleic acids research"},{"issue":"4","key":"pcbi.1007760.ref087","doi-asserted-by":"crossref","first-page":"427","DOI":"10.1016\/j.ipm.2009.03.002","article-title":"A systematic analysis of performance measures for classification tasks","volume":"45","author":"M Sokolova","year":"2009","journal-title":"Information processing & management"}],"updated-by":[{"DOI":"10.1371\/journal.pcbi.1007760","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2020,7,30]],"date-time":"2020-07-30T00:00:00Z","timestamp":1596067200000}}],"container-title":["PLOS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1007760","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,7,30]],"date-time":"2020-07-30T19:38:31Z","timestamp":1596137911000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1007760"}},"subtitle":[],"editor":[{"given":"Ilya","family":"Ioshikhes","sequence":"first","affiliation":[],"role":[{"role":"editor","vocabulary":"crossref"}]}],"short-title":[],"issued":{"date-parts":[[2020,7,20]]},"references-count":87,"journal-issue":{"issue":"7","published-online":{"date-parts":[[2020,7,20]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1007760","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2020.03.02.972778","asserted-by":"object"}]},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,7,20]]}}}