{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,16]],"date-time":"2026-04-16T03:33:02Z","timestamp":1776310382453,"version":"3.50.1"},"reference-count":18,"publisher":"Oxford University Press (OUP)","issue":"12","license":[{"start":{"date-parts":[[2024,11,25]],"date-time":"2024-11-25T00:00:00Z","timestamp":1732492800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"National Cancer Institute of the National Institutes of Health","award":["R01CA230551"],"award-info":[{"award-number":["R01CA230551"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,11,28]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Summary<\/jats:title>\n                  <jats:p>LEfSe is a widely used Python package and Galaxy module for metagenomic biomarker discovery and visualization, utilizing the Kruskal\u2013Wallis test, Wilcoxon Rank-Sum test, and Linear Discriminant Analysis. R\/Bioconductor provides a large collection of tools for metagenomic data analysis but has lacked an implementation of this widely used algorithm, hindering benchmarking against other tools and incorporation into R workflows. We present the lefser package to provide comparable functionality within the R\/Bioconductor ecosystem of statistical analysis tools, with improvements to the original algorithm for performance, accuracy, and reproducibility. We benchmark the performance of lefser against the original algorithm using human and mouse metagenomic datasets.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and implementation<\/jats:title>\n                  <jats:p>Our software, lefser, is distributed through the Bioconductor project (https:\/\/www.bioconductor.org\/packages\/release\/bioc\/html\/lefser.html), and all the source code is available in the GitHub repository https:\/\/github.com\/waldronlab\/lefser.<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btae707","type":"journal-article","created":{"date-parts":[[2024,11,25]],"date-time":"2024-11-25T16:40:51Z","timestamp":1732552851000},"source":"Crossref","is-referenced-by-count":38,"title":["<i>lefser<\/i>: implementation of metagenomic biomarker discovery tool, <i>LEfSe<\/i>, in R"],"prefix":"10.1093","volume":"40","author":[{"given":"Asya","family":"Khleborodova","sequence":"first","affiliation":[{"name":"Institute for Implementation Science in Population Health, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]},{"name":"Department of Epidemiology and Biostatistics, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]}]},{"given":"Samuel D","family":"Gamboa-Tuz","sequence":"additional","affiliation":[{"name":"Institute for Implementation Science in Population Health, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]},{"name":"Department of Epidemiology and Biostatistics, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3242-0582","authenticated-orcid":false,"given":"Marcel","family":"Ramos","sequence":"additional","affiliation":[{"name":"Institute for Implementation Science in Population Health, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]},{"name":"Department of Epidemiology and Biostatistics, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]}]},{"given":"Nicola","family":"Segata","sequence":"additional","affiliation":[{"name":"Cellular, Computational and Integrative Biology, University of Trento , Trento, Provo 38123,","place":["Italy"]},{"name":"European Institute of Oncology, Istituto di Ricovero e Cura a Carattere Scientifico , Milan 20139,","place":["Italy"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2725-0694","authenticated-orcid":false,"given":"Levi","family":"Waldron","sequence":"additional","affiliation":[{"name":"Institute for Implementation Science in Population Health, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]},{"name":"Department of Epidemiology and Biostatistics, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9490-3061","authenticated-orcid":false,"given":"Sehyun","family":"Oh","sequence":"additional","affiliation":[{"name":"Institute for Implementation Science in Population Health, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]},{"name":"Department of Epidemiology and Biostatistics, City University of New York School of Public Health , New York, NY 10027,","place":["United States"]}]}],"member":"286","published-online":{"date-parts":[[2024,11,25]]},"reference":[{"key":"2024122317384807000_btae707-B1","doi-asserted-by":"publisher","DOI":"10.7554\/eLife.65088","article-title":"Integrating taxonomic, functional, and strain-level profiling of diverse microbial communities with bioBakery 3","volume":"10","author":"Beghini","year":"2021","journal-title":"Elife"},{"key":"2024122317384807000_btae707-B2","doi-asserted-by":"publisher","author":"Bolar","year":"2019","DOI":"10.32614\/cran.package.stat"},{"key":"2024122317384807000_btae707-B3","doi-asserted-by":"crossref","first-page":"btac778","DOI":"10.1093\/bioinformatics\/btac778","article-title":"Benchdamic: benchmarking of differential abundance methods for microbiome data","volume":"39","author":"Calgaro","year":"2023","journal-title":"Bioinformatics"},{"key":"2024122317384807000_btae707-B4","doi-asserted-by":"crossref","first-page":"191","DOI":"10.1186\/s13059-020-02104-1","article-title":"Assessment of statistical methods from single cell, bulk RNA-Seq, and metagenomics applied to microbiome data","volume":"21","author":"Calgaro","year":"2020","journal-title":"Genome Biol"},{"key":"2024122317384807000_btae707-B5","doi-asserted-by":"crossref","first-page":"4027","DOI":"10.1093\/bioinformatics\/btac438","article-title":"microbiomeMarker: an R\/bioconductor package for microbiome marker identification and visualization","volume":"38","author":"Cao","year":"2022","journal-title":"Bioinformatics"},{"key":"2024122317384807000_btae707-B6","doi-asserted-by":"crossref","first-page":"292","DOI":"10.1016\/j.chom.2010.08.004","article-title":"Enterobacteriaceae act in concert with the gut microbiota to induce spontaneous and maternally transmitted colitis","volume":"8","author":"Garrett","year":"2010","journal-title":"Cell Host Microbe"},{"key":"2024122317384807000_btae707-B7","doi-asserted-by":"publisher","first-page":"790","DOI":"10.1038\/s41587-023-01872-y","article-title":"BugSigDB captures patterns of differential abundance across a broad range of host-associated microbial signatures","volume":"42","author":"Geistlinger","year":"2024","journal-title":"Nat Biotechnol"},{"key":"2024122317384807000_btae707-B8","doi-asserted-by":"crossref","first-page":"R80","DOI":"10.1186\/gb-2004-5-10-r80","article-title":"Bioconductor: open software development for computational biology and bioinformatics","volume":"5","author":"Gentleman","year":"2004","journal-title":"Genome Biol"},{"key":"2024122317384807000_btae707-B9","doi-asserted-by":"crossref","first-page":"1","DOI":"10.18637\/jss.v028.i08","article-title":"Implementing a class of permutation tests: the coin package","volume":"28","author":"Hothorn","year":"2008","journal-title":"J Stat Soft"},{"key":"2024122317384807000_btae707-B10","doi-asserted-by":"crossref","first-page":"143","DOI":"10.1016\/j.copbio.2016.01.017","article-title":"Functional metagenomics of extreme environments","volume":"38","author":"Mirete","year":"2016","journal-title":"Curr Opin Biotechnol"},{"key":"2024122317384807000_btae707-B11","doi-asserted-by":"crossref","first-page":"342","DOI":"10.1038\/s41467-022-28034-z","article-title":"Microbiome differential abundance methods produce different results across 38 datasets","volume":"13","author":"Nearing","year":"2022","journal-title":"Nat Commun"},{"key":"2024122317384807000_btae707-B12","doi-asserted-by":"publisher","author":"Ramos","year":"2022","DOI":"10.18129\/B9.BIOC.MICROBIOMEBENCHMARKDATA"},{"key":"2024122317384807000_btae707-B13","doi-asserted-by":"crossref","first-page":"R60","DOI":"10.1186\/gb-2011-12-6-r60","article-title":"Metagenomic biomarker discovery and explanation","volume":"12","author":"Segata","year":"2011","journal-title":"Genome Biol"},{"key":"2024122317384807000_btae707-B14","doi-asserted-by":"crossref","first-page":"494","DOI":"10.3389\/fmicb.2017.00494","article-title":"Comparative evaluation of four bacteria-specific primer pairs for 16S rRNA gene surveys","volume":"8","author":"Thijs","year":"2017","journal-title":"Front Microbiol"},{"key":"2024122317384807000_btae707-B15","doi-asserted-by":"crossref","first-page":"18132","DOI":"10.1073\/pnas.1011737107","article-title":"Bifidobacterium animalis subsp. lactis fermented milk product reduces inflammation by altering a niche for colitogenic microbes","volume":"107","author":"Veiga","year":"2010","journal-title":"Proc Natl Acad Sci USA"},{"key":"2024122317384807000_btae707-B16","volume-title":"Modern Applied Statistics with S. PDF","author":"Venables","year":"2003","edition":"4th ed"},{"key":"2024122317384807000_btae707-B17","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1080\/00031305.2019.1583913","article-title":"Moving to a world beyond \u2018p &lt; 0.05\u2019","volume":"73","author":"Wasserstein","year":"2019","journal-title":"Am Stat"},{"key":"2024122317384807000_btae707-B18","doi-asserted-by":"crossref","first-page":"766","DOI":"10.15252\/msb.20145645","article-title":"Potential of fecal microbiota for early-stage detection of colorectal cancer","volume":"10","author":"Zeller","year":"2014","journal-title":"Mol Syst Biol"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btae707\/60811200\/btae707.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/12\/btae707\/60811200\/btae707.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/12\/btae707\/60811200\/btae707.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,23]],"date-time":"2024-12-23T17:41:31Z","timestamp":1734975691000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btae707\/7908399"}},"subtitle":[],"editor":[{"given":"Peter","family":"Robinson","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2024,11,25]]},"references-count":18,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2024,11,28]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btae707","relation":{},"ISSN":["1367-4811"],"issn-type":[{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2024,12]]},"published":{"date-parts":[[2024,11,25]]},"article-number":"btae707"}}