{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T20:34:21Z","timestamp":1772138061787,"version":"3.50.1"},"reference-count":16,"publisher":"Oxford University Press (OUP)","issue":"5","license":[{"start":{"date-parts":[[2023,5,17]],"date-time":"2023-05-17T00:00:00Z","timestamp":1684281600000},"content-version":"vor","delay-in-days":16,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"LOEWE"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,5,4]]},"abstract":"<jats:title>Abstract<\/jats:title>\n                  <jats:sec>\n                    <jats:title>Motivation<\/jats:title>\n                    <jats:p>Identifying organellar DNA, such as mitochondrial or plastid sequences, inside a whole genome assembly, remains challenging and requires biological background knowledge. To address this, we developed ODNA based on genome annotation and machine learning to fulfill.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Results<\/jats:title>\n                    <jats:p>ODNA is a software that classifies organellar DNA sequences within a genome assembly by machine learning based on a predefined genome annotation workflow. We trained our model with 829\u200a769 DNA sequences from 405 genome assemblies and achieved high predictive performance (e.g. matthew's correlation coefficient of 0.61 for mitochondria and 0.73 for chloroplasts) on independent validation data, thus outperforming existing approaches significantly.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Availability and implementation<\/jats:title>\n                    <jats:p>Our software ODNA is freely accessible as a web service at https:\/\/odna.mathematik.uni-marburg.de and can also be run in a docker container. The source code can be found at https:\/\/gitlab.com\/mosga\/odna and the processed data at Zenodo (DOI: 10.5281\/zenodo.7506483).<\/jats:p>\n                  <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btad326","type":"journal-article","created":{"date-parts":[[2023,5,17]],"date-time":"2023-05-17T11:06:14Z","timestamp":1684321574000},"source":"Crossref","is-referenced-by-count":2,"title":["ODNA: identification of organellar DNA by machine learning"],"prefix":"10.1093","volume":"39","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7678-7856","authenticated-orcid":false,"given":"Roman","family":"Martin","sequence":"first","affiliation":[{"name":"Department of Mathematics and Computer Science, Philipps University of Marburg , Hans-Meerwein-Str. 6 , Marburg 35043, Germany"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2690-2718","authenticated-orcid":false,"given":"Minh Kien","family":"Nguyen","sequence":"additional","affiliation":[{"name":"Department of Mathematics and Computer Science, Philipps University of Marburg , Hans-Meerwein-Str. 6 , Marburg 35043, Germany"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0113-2542","authenticated-orcid":false,"given":"Nick","family":"Lowack","sequence":"additional","affiliation":[{"name":"Department of Mathematics and Computer Science, Philipps University of Marburg , Hans-Meerwein-Str. 6 , Marburg 35043, Germany"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3108-8311","authenticated-orcid":false,"given":"Dominik","family":"Heider","sequence":"additional","affiliation":[{"name":"Department of Mathematics and Computer Science, Philipps University of Marburg , Hans-Meerwein-Str. 6 , Marburg 35043, Germany"},{"name":"Center for Synthetic Microbiology (SYNMIKRO), Philipps University of Marburg , Karl-von-Frisch-Str. 14 , Marburg 35043, Germany"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2023,5,17]]},"reference":[{"key":"2023053101314779600_btad326-B1","doi-asserted-by":"crossref","first-page":"892","DOI":"10.1111\/1755-0998.13160","article-title":"Mitofinder: efficient automated large-scale extraction of mitogenomic data in target enrichment phylogenomics","volume":"20","author":"Allio","year":"2020","journal-title":"Mol Ecol Resour"},{"key":"2023053101314779600_btad326-B2","doi-asserted-by":"crossref","first-page":"464","DOI":"10.21105\/joss.00464","article-title":"Chloroextractor: extraction and assembly of the chloroplast genome from whole genome shotgun data","volume":"3","author":"Ankenbrand","year":"2018","journal-title":"J Open Source Softw"},{"key":"2023053101314779600_btad326-B3","doi-asserted-by":"crossref","first-page":"59","DOI":"10.1038\/nmeth.3176","article-title":"Fast and sensitive protein alignment using diamond","volume":"12","author":"Buchfink","year":"2014","journal-title":"Nat Methods"},{"key":"2023053101314779600_btad326-B4","doi-asserted-by":"crossref","first-page":"9077","DOI":"10.1093\/nar\/gkab688","article-title":"tRNAscan-SE 2.0: improved detection and functional classification of transfer RNA genes","volume":"49","author":"Chan","year":"2021","journal-title":"Nucleic Acids Res"},{"key":"2023053101314779600_btad326-B5","doi-asserted-by":"crossref","first-page":"19","DOI":"10.1186\/s12859-015-0654-5","article-title":"Red: an intelligent, rapid, accurate tool for detecting repeats de-novo on the genomic scale","volume":"16","author":"Girgis","year":"2015","journal-title":"BMC Bioinformatics"},{"key":"2023053101314779600_btad326-B6","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1038\/s41597-020-0363-4","article-title":"Four high-quality draft genome assemblies of the marine heterotrophic nanoflagellate cafeteria roenbergensis","volume":"7","author":"Hackl","year":"2020","journal-title":"Sci Data"},{"key":"2023053101314779600_btad326-B7","doi-asserted-by":"crossref","first-page":"313","DOI":"10.1098\/rspb.2002.2218","article-title":"Biological identifications through DNA barcodes","volume":"270","author":"Hebert","year":"2003","journal-title":"Proc Biol Sci"},{"key":"2023053101314779600_btad326-B8","doi-asserted-by":"crossref","first-page":"1274","DOI":"10.1016\/j.cub.2016.03.053","article-title":"A eukaryote without a mitochondrial organelle","volume":"26","author":"Karnkowska","year":"2016","journal-title":"Curr Biol"},{"key":"2023053101314779600_btad326-B9","doi-asserted-by":"crossref","first-page":"345","DOI":"10.1186\/s13059-021-02567-w","article-title":"The economics of organellar gene loss and endosymbiotic gene transfer","volume":"22","author":"Kelly","year":"2021","journal-title":"Genome Biol"},{"key":"2023053101314779600_btad326-B10","doi-asserted-by":"crossref","first-page":"2520","DOI":"10.1093\/bioinformatics\/bts480","article-title":"Snakemake\u2014a scalable bioinformatics workflow engine","volume":"28","author":"K\u00f6ster","year":"2012","journal-title":"Bioinformatics"},{"key":"2023053101314779600_btad326-B11","doi-asserted-by":"crossref","first-page":"54","DOI":"10.1186\/1472-6750-11-54","article-title":"Isolation and analysis of high quality nuclear DNA with reduced organellar DNA for plant genome sequencing and resequencing","volume":"11","author":"Lutz","year":"2011","journal-title":"BMC Biotechnol"},{"key":"2023053101314779600_btad326-B12","doi-asserted-by":"crossref","first-page":"5514","DOI":"10.1093\/bioinformatics\/btaa1003","article-title":"Mosga: modular open-source genome annotator","volume":"36","author":"Martin","year":"2020","journal-title":"Bioinformatics"},{"key":"2023053101314779600_btad326-B13","doi-asserted-by":"crossref","first-page":"5504","DOI":"10.1016\/j.csbj.2021.09.024","article-title":"Mosga 2: comparative genomics and validation tools","volume":"19","author":"Martin","year":"2021","journal-title":"Comput Struct Biotechnol J"},{"key":"2023053101314779600_btad326-B14","doi-asserted-by":"crossref","first-page":"276","DOI":"10.1016\/S0168-9525(00)02024-2","article-title":"Emboss: the European molecular biology open software suite","volume":"16","author":"Rice","year":"2000","journal-title":"Trends Genet"},{"key":"2023053101314779600_btad326-B15","doi-asserted-by":"crossref","first-page":"952","DOI":"10.1080\/10635150500234674","article-title":"Between two extremes: mitochondrial DNA is neither the panacea nor the nemesis of phylogenetic and taxonomic inference","volume":"54","author":"Rubinoff","year":"2005","journal-title":"Syst Biol"},{"key":"2023053101314779600_btad326-B16","doi-asserted-by":"crossref","first-page":"270","DOI":"10.12688\/f1000research.21490.1","article-title":"Recent advances in understanding mitochondrial genome diversity","volume":"9","author":"Zardoya","year":"2020","journal-title":"F1000Res"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btad326\/50374125\/btad326.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/39\/5\/btad326\/50492409\/btad326.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/39\/5\/btad326\/50492409\/btad326.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,31]],"date-time":"2023-05-31T01:12:02Z","timestamp":1685495522000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btad326\/7169158"}},"subtitle":[],"editor":[{"given":"Inanc","family":"Birol","sequence":"additional","affiliation":[],"role":[{"role":"editor","vocabulary":"crossref"}]}],"short-title":[],"issued":{"date-parts":[[2023,5,1]]},"references-count":16,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2023,5,4]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btad326","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2023.01.10.523051","asserted-by":"object"}]},"ISSN":["1367-4811"],"issn-type":[{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2023,5,1]]},"published":{"date-parts":[[2023,5,1]]},"article-number":"btad326"}}