{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,27]],"date-time":"2026-02-27T06:11:35Z","timestamp":1772172695324,"version":"3.50.1"},"reference-count":44,"publisher":"Public Library of Science (PLoS)","issue":"10","license":[{"start":{"date-parts":[[2020,10,1]],"date-time":"2020-10-01T00:00:00Z","timestamp":1601510400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1008174","type":"journal-article","created":{"date-parts":[[2020,10,1]],"date-time":"2020-10-01T13:27:54Z","timestamp":1601558874000},"page":"e1008174","update-policy":"https:\/\/doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":11,"title":["Metabolic pathway inference using multi-label classification with rich pathway features"],"prefix":"10.1371","volume":"16","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3407-1187","authenticated-orcid":true,"given":"Abdur Rahman","family":"M. A. Basher","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7047-6790","authenticated-orcid":true,"given":"Ryan J.","family":"McLaughlin","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4889-6876","authenticated-orcid":true,"given":"Steven J.","family":"Hallam","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2020,10,1]]},"reference":[{"issue":"5594","key":"pcbi.1008174.ref001","doi-asserted-by":"crossref","first-page":"763","DOI":"10.1126\/science.1078563","article-title":"Life\u2019s complexity pyramid","volume":"298","author":"ZN Oltvai","year":"2002","journal-title":"Science"},{"key":"pcbi.1008174.ref002","doi-asserted-by":"crossref","first-page":"209","DOI":"10.1016\/j.mib.2016.04.014","article-title":"The information science of microbial ecology","volume":"31","author":"AS Hahn","year":"2016","journal-title":"Current opinion in microbiology"},{"issue":"1","key":"pcbi.1008174.ref003","doi-asserted-by":"crossref","first-page":"214","DOI":"10.1038\/s42003-019-0440-4","article-title":"Combined network analysis and machine learning allows the prediction of metabolic pathways from tomato metabolomics data","volume":"2","author":"D Toubiana","year":"2019","journal-title":"Communications Biology"},{"issue":"4","key":"pcbi.1008174.ref004","doi-asserted-by":"crossref","first-page":"195","DOI":"10.1016\/j.nbt.2008.12.009","article-title":"Next-generation DNA sequencing techniques","volume":"25","author":"WJ Ansorge","year":"2009","journal-title":"New biotechnology"},{"issue":"D1","key":"pcbi.1008174.ref005","doi-asserted-by":"crossref","first-page":"D353","DOI":"10.1093\/nar\/gkw1092","article-title":"KEGG: new perspectives on genomes, pathways, diseases and drugs","volume":"45","author":"M Kanehisa","year":"2017","journal-title":"Nucleic Acids Research"},{"issue":"D1","key":"pcbi.1008174.ref006","doi-asserted-by":"crossref","first-page":"D649","DOI":"10.1093\/nar\/gkx1132","article-title":"The reactome pathway knowledgebase","volume":"46","author":"A Fabregat","year":"2017","journal-title":"Nucleic acids research"},{"key":"pcbi.1008174.ref007","doi-asserted-by":"crossref","unstructured":"Caspi R, Billington R, Keseler IM, Kothari A, Krummenacker M, Midford PE, et al. The MetaCyc database of metabolic pathways and enzymes-a 2019 update. Nucleic acids research. 2019.","DOI":"10.1093\/nar\/gkz862"},{"issue":"4","key":"pcbi.1008174.ref008","doi-asserted-by":"crossref","first-page":"1085","DOI":"10.1093\/bib\/bbx085","article-title":"The BioCyc collection of microbial genomes and metabolic pathways","volume":"20","author":"PD Karp","year":"2017","journal-title":"Briefings in Bioinformatics"},{"issue":"suppl_1","key":"pcbi.1008174.ref009","doi-asserted-by":"crossref","first-page":"S225","DOI":"10.1093\/bioinformatics\/18.suppl_1.S225","article-title":"The pathway tools software","volume":"18","author":"PD Karp","year":"2002","journal-title":"Bioinformatics"},{"issue":"5","key":"pcbi.1008174.ref010","doi-asserted-by":"crossref","first-page":"877","DOI":"10.1093\/bib\/bbv079","article-title":"Pathway Tools version 19.0 update: software for pathway\/genome informatics and systems biology","volume":"17","author":"PD Karp","year":"2016","journal-title":"Briefings in bioinformatics"},{"issue":"1","key":"pcbi.1008174.ref011","article-title":"The EcoCyc Database","volume":"8","author":"PD Karp","year":"2018","journal-title":"EcoSal Plus"},{"issue":"1 Supplement","key":"pcbi.1008174.ref012","first-page":"lb192","article-title":"BioCyc: Online Resource for Genome and Metabolic Pathway Analysis","volume":"30","author":"R Caspi","year":"2016","journal-title":"The FASEB Journal"},{"issue":"1","key":"pcbi.1008174.ref013","doi-asserted-by":"crossref","first-page":"202","DOI":"10.1186\/1471-2105-14-202","article-title":"MetaPathways: a modular pipeline for constructing pathway\/genome databases from environmental sequence information","volume":"14","author":"KM Konwar","year":"2013","journal-title":"BMC bioinformatics"},{"issue":"1","key":"pcbi.1008174.ref014","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1186\/1471-2164-15-619","article-title":"Metabolic pathways for the whole community","volume":"15","author":"NW Hanson","year":"2014","journal-title":"BMC genomics"},{"issue":"20","key":"pcbi.1008174.ref015","doi-asserted-by":"crossref","first-page":"3345","DOI":"10.1093\/bioinformatics\/btv361","article-title":"MetaPathways v2. 5: quantitative functional, taxonomic and usability improvements","volume":"31","author":"KM Konwar","year":"2015","journal-title":"Bioinformatics"},{"key":"pcbi.1008174.ref016","article-title":"A geographically-diverse collection of 418 human gut microbiome pathway genome databases","volume":"4","author":"AS Hahn","year":"2017","journal-title":"Scientific Data"},{"issue":"8","key":"pcbi.1008174.ref017","doi-asserted-by":"crossref","first-page":"e1000465","DOI":"10.1371\/journal.pcbi.1000465","article-title":"A parsimony approach to biological pathway reconstruction\/inference for genomes and metagenomes","volume":"5","author":"Y Ye","year":"2009","journal-title":"PLoS Comput Biol"},{"issue":"1","key":"pcbi.1008174.ref018","first-page":"1","article-title":"Machine learning methods for metabolic pathway prediction","volume":"11","author":"JM Dale","year":"2010","journal-title":"BMC bioinformatics"},{"issue":"12","key":"pcbi.1008174.ref019","doi-asserted-by":"crossref","first-page":"2153","DOI":"10.1093\/bioinformatics\/bty065","article-title":"Selenzyme: Enzyme selection tool for pathway design","volume":"34","author":"P Carbonell","year":"2018","journal-title":"Bioinformatics"},{"key":"pcbi.1008174.ref020","doi-asserted-by":"crossref","first-page":"158","DOI":"10.1016\/j.ymben.2017.12.002","article-title":"RetroPath2. 0: A retrosynthesis workflow for metabolic engineers","volume":"45","author":"B Del\u00e9pine","year":"2018","journal-title":"Metabolic engineering"},{"issue":"12","key":"pcbi.1008174.ref021","doi-asserted-by":"crossref","first-page":"i278","DOI":"10.1093\/bioinformatics\/btw260","article-title":"Simultaneous prediction of enzyme orthologs from chemical transformation patterns for de novo metabolic pathway reconstruction","volume":"32","author":"Y Tabei","year":"2016","journal-title":"Bioinformatics"},{"issue":"11","key":"pcbi.1008174.ref022","doi-asserted-by":"crossref","first-page":"e1003918","DOI":"10.1371\/journal.pcbi.1003918","article-title":"BiomeNet: A Bayesian model for inference of metabolic divergence among microbial communities","volume":"10","author":"M Shafiei","year":"2014","journal-title":"PLoS Comput Biol"},{"issue":"3","key":"pcbi.1008174.ref023","doi-asserted-by":"crossref","first-page":"e1002981","DOI":"10.1371\/journal.pcbi.1002981","article-title":"Probabilistic inference of biochemical reactions in microbial communities from metagenomic sequences","volume":"9","author":"D Jiao","year":"2013","journal-title":"PLoS Comput Biol"},{"issue":"16","key":"pcbi.1008174.ref024","doi-asserted-by":"crossref","first-page":"1366","DOI":"10.1016\/j.cub.2011.06.051","article-title":"An interdependent metabolic patchwork in the nested symbiosis of mealybugs","volume":"21","author":"JP McCutcheon","year":"2011","journal-title":"Current Biology"},{"issue":"11","key":"pcbi.1008174.ref025","doi-asserted-by":"crossref","first-page":"1063","DOI":"10.1038\/nmeth.4458","article-title":"Critical assessment of metagenome interpretation\u2014a benchmark of metagenomics software","volume":"14","author":"A Sczyrba","year":"2017","journal-title":"Nature methods"},{"issue":"3","key":"pcbi.1008174.ref026","doi-asserted-by":"crossref","first-page":"R26","DOI":"10.1186\/gb-2011-12-3-r26","article-title":"Community transcriptomics reveals universal patterns of protein sequence conservation in natural microbial communities","volume":"12","author":"FJ Stewart","year":"2011","journal-title":"Genome biology"},{"key":"pcbi.1008174.ref027","first-page":"2825","article-title":"Scikit-learn: Machine Learning in Python","volume":"12","author":"F Pedregosa","year":"2011","journal-title":"Journal of Machine Learning Research"},{"issue":"2","key":"pcbi.1008174.ref028","doi-asserted-by":"crossref","first-page":"22","DOI":"10.1109\/MCSE.2011.37","article-title":"The NumPy array: a structure for efficient numerical computation","volume":"13","author":"Svd Walt","year":"2011","journal-title":"Computing in Science & Engineering"},{"key":"pcbi.1008174.ref029","unstructured":"Hagberg A, Swart P, S Chult D. Exploring network structure, dynamics, and function using NetworkX. Los Alamos National Lab.(LANL), Los Alamos, NM (United States); 2008."},{"key":"pcbi.1008174.ref030","doi-asserted-by":"crossref","unstructured":"Virtanen P, Gommers R, Oliphant TE, Haberland M, Reddy T, Cournapeau D, et al. SciPy 1.0\u2013Fundamental Algorithms for Scientific Computing in Python. arXiv e-prints. 2019; p. arXiv:1907.10121.","DOI":"10.1038\/s41592-019-0686-2"},{"issue":"1","key":"pcbi.1008174.ref031","doi-asserted-by":"crossref","first-page":"304","DOI":"10.1093\/nar\/28.1.304","article-title":"The ENZYME database in 2000","volume":"28","author":"A Bairoch","year":"2000","journal-title":"Nucleic acids research"},{"issue":"9","key":"pcbi.1008174.ref032","doi-asserted-by":"crossref","first-page":"3084","DOI":"10.1016\/j.patcog.2012.03.004","article-title":"An extensive experimental comparison of methods for multi-label learning","volume":"45","author":"G Madjarov","year":"2012","journal-title":"Pattern Recognition"},{"issue":"8","key":"pcbi.1008174.ref033","doi-asserted-by":"crossref","first-page":"1819","DOI":"10.1109\/TKDE.2013.39","article-title":"A review on multi-label learning algorithms","volume":"26","author":"ML Zhang","year":"2014","journal-title":"IEEE transactions on knowledge and data engineering"},{"key":"pcbi.1008174.ref034","doi-asserted-by":"crossref","first-page":"14","DOI":"10.1016\/j.ab.2014.10.014","article-title":"mPLR-Loc: An adaptive decision multi-label classifier based on penalized logistic regression for protein subcellular localization prediction","volume":"473","author":"S Wan","year":"2015","journal-title":"Analytical biochemistry"},{"issue":"2","key":"pcbi.1008174.ref035","doi-asserted-by":"crossref","first-page":"301","DOI":"10.1111\/j.1467-9868.2005.00503.x","article-title":"Regularization and variable selection via the elastic net","volume":"67","author":"H Zou","year":"2005","journal-title":"Journal of the Royal Statistical Society: Series B (Statistical Methodology)"},{"issue":"Mar","key":"pcbi.1008174.ref036","first-page":"1333","article-title":"Grafting: Fast, incremental feature selection by gradient descent in function space","volume":"3","author":"S Perkins","year":"2003","journal-title":"Journal of machine learning research"},{"key":"pcbi.1008174.ref037","unstructured":"Lee JD, Panageas I, Piliouras G, Simchowitz M, Jordan MI, Recht B. First-order Methods Almost Always Avoid Saddle Points. arXiv preprint arXiv:171007406. 2017."},{"key":"pcbi.1008174.ref038","volume-title":"Introduction to linear optimization","author":"D Bertsimas","year":"1997"},{"key":"pcbi.1008174.ref039","first-page":"145","article-title":"On the stratification of multi-label data","author":"K Sechidis","year":"2011","journal-title":"Machine Learning and Knowledge Discovery in Databases"},{"key":"pcbi.1008174.ref040","unstructured":"Wu XZ, Zhou ZH. A Unified View of Multi-Label Performance Measures. arXiv preprint arXiv:160900288. 2016."},{"key":"pcbi.1008174.ref041","doi-asserted-by":"crossref","DOI":"10.1007\/978-0-387-84858-7","volume-title":"The elements of statistical learning: data mining, inference and prediction","author":"T Hastie","year":"2009"},{"issue":"C","key":"pcbi.1008174.ref042","doi-asserted-by":"crossref","first-page":"26","DOI":"10.1016\/j.neucom.2014.11.086","article-title":"Evaluating the Classifier Behavior with Noisy Data Considering Performance and Robustness","volume":"176","author":"JA S\u00e1ez","year":"2016","journal-title":"Neurocomput"},{"issue":"8","key":"pcbi.1008174.ref043","doi-asserted-by":"crossref","first-page":"1798","DOI":"10.1109\/TPAMI.2013.50","article-title":"Representation Learning: A Review and New Perspectives","volume":"35","author":"Y Bengio","year":"2013","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"1","key":"pcbi.1008174.ref044","doi-asserted-by":"crossref","first-page":"17","DOI":"10.1109\/TKDE.2016.2598561","article-title":"A survey of heterogeneous information network analysis","volume":"29","author":"C Shi","year":"2017","journal-title":"IEEE Transactions on Knowledge and Data Engineering"}],"container-title":["PLOS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1008174","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,10,1]],"date-time":"2020-10-01T13:29:27Z","timestamp":1601558967000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1008174"}},"subtitle":[],"editor":[{"given":"William","family":"Cannon","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2020,10,1]]},"references-count":44,"journal-issue":{"issue":"10","published-online":{"date-parts":[[2020,10,1]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1008174","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2020.02.02.919944","asserted-by":"object"}]},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,10,1]]}}}