{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T16:13:36Z","timestamp":1775664816127,"version":"3.50.1"},"reference-count":27,"publisher":"Oxford University Press (OUP)","issue":"12","license":[{"start":{"date-parts":[[2024,11,14]],"date-time":"2024-11-14T00:00:00Z","timestamp":1731542400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100009708","name":"Novo Nordisk Foundation","doi-asserted-by":"publisher","award":["NNF20OC0062606"],"award-info":[{"award-number":["NNF20OC0062606"]}],"id":[{"id":"10.13039\/501100009708","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,11,28]]},"abstract":"<jats:title>Abstract<\/jats:title>\n                  <jats:sec>\n                    <jats:title>Motivation<\/jats:title>\n                    <jats:p>Protein subcellular location prediction is a widely explored task in bioinformatics because of its importance in proteomics research. We propose DeepLocPro, an extension to the popular method DeepLoc, tailored specifically to archaeal and bacterial organisms.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Results<\/jats:title>\n                    <jats:p>DeepLocPro is a multiclass subcellular location prediction tool for prokaryotic proteins, trained on experimentally verified data curated from UniProt and PSORTdb. DeepLocPro compares favorably to the PSORTb 3.0 ensemble method, surpassing its performance across multiple metrics in our benchmark experiment.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Availability and implementation<\/jats:title>\n                    <jats:p>The DeepLocPro prediction tool is available online at https:\/\/ku.biolib.com\/deeplocpro and https:\/\/services.healthtech.dtu.dk\/services\/DeepLocPro-1.0\/.<\/jats:p>\n                  <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btae677","type":"journal-article","created":{"date-parts":[[2024,11,12]],"date-time":"2024-11-12T07:20:23Z","timestamp":1731396023000},"source":"Crossref","is-referenced-by-count":43,"title":["Predicting the subcellular location of prokaryotic proteins with DeepLocPro"],"prefix":"10.1093","volume":"40","author":[{"given":"Jaime","family":"Moreno","sequence":"first","affiliation":[{"name":"Department of Biology, University of Copenhagen , 2200 Copenhagen,","place":["Denmark"]},{"name":"AI & Digital Research, Novo Nordisk A\/S , 2760 M\u00e5l\u00f8v,","place":["Denmark"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9412-9643","authenticated-orcid":false,"given":"Henrik","family":"Nielsen","sequence":"additional","affiliation":[{"name":"Department of Health Technology, Technical University of Denmark , 2800 Lyngby,","place":["Denmark"]}]},{"given":"Ole","family":"Winther","sequence":"additional","affiliation":[{"name":"Department of Biology, University of Copenhagen , 2200 Copenhagen,","place":["Denmark"]},{"name":"Department of Applied Mathematics and Computer Science, Technical University of Denmark , 2800 Lyngby,","place":["Denmark"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1275-8065","authenticated-orcid":false,"given":"Felix","family":"Teufel","sequence":"additional","affiliation":[{"name":"Department of Biology, University of Copenhagen , 2200 Copenhagen,","place":["Denmark"]},{"name":"AI & Digital Research, Novo Nordisk A\/S , 2760 M\u00e5l\u00f8v,","place":["Denmark"]}]}],"member":"286","published-online":{"date-parts":[[2024,11,14]]},"reference":[{"key":"2024121400205174200_btae677-B1","doi-asserted-by":"publisher","first-page":"414","DOI":"10.1038\/nrmicro2576","article-title":"The archaeal cell envelope","volume":"9","author":"Albers","year":"2011","journal-title":"Nat Rev Microbiol"},{"key":"2024121400205174200_btae677-B2","doi-asserted-by":"publisher","first-page":"1315","DOI":"10.1038\/s41592-019-0598-1","article-title":"Unified rational protein engineering with sequence-based deep representation learning","volume":"16","author":"Alley","year":"2019","journal-title":"Nat Methods"},{"key":"2024121400205174200_btae677-B3","doi-asserted-by":"publisher","first-page":"3387","DOI":"10.1093\/bioinformatics\/btx431","article-title":"DeepLoc: prediction of protein subcellular localization using deep learning","volume":"33","author":"Almagro Armenteros","year":"2017","journal-title":"Bioinformatics"},{"key":"2024121400205174200_btae677-B4","doi-asserted-by":"publisher","first-page":"108114","DOI":"10.1016\/j.compbiomed.2024.108114","article-title":"mtx-COBRA: subcellular localization prediction for bacterial proteins","volume":"171","author":"Arora","year":"2024","journal-title":"Comput Biol Med"},{"key":"2024121400205174200_btae677-B5","doi-asserted-by":"publisher","first-page":"274","DOI":"10.1186\/1471-2105-10-274","article-title":"MultiLoc2: integrating phylogeny and gene ontology terms improves subcellular protein localization prediction","volume":"10","author":"Blum","year":"2009","journal-title":"BMC Bioinformatics"},{"key":"2024121400205174200_btae677-B6","doi-asserted-by":"publisher","first-page":"5363","DOI":"10.1021\/pr900665y","article-title":"SherLoc2: a high-accuracy hybrid method for predicting subcellular localization of proteins","volume":"8","author":"Briesemeister","year":"2009","journal-title":"J Proteome Res"},{"key":"2024121400205174200_btae677-B7","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4419-7692-5","volume-title":"Prokaryotic Antimicrobial Peptides: From Genes to Applications","author":"Drider","year":"2011"},{"key":"2024121400205174200_btae677-B8","doi-asserted-by":"publisher","first-page":"7112","DOI":"10.1109\/TPAMI.2021.3095381","article-title":"ProtTrans: toward understanding the language of life through self-supervised learning","volume":"44","author":"Elnaggar","year":"2022","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"2024121400205174200_btae677-B9","doi-asserted-by":"publisher","first-page":"i458","DOI":"10.1093\/bioinformatics\/bts390","article-title":"LocTree2 predicts localization for all domains of life","volume":"28","author":"Goldberg","year":"2012","journal-title":"Bioinformatics"},{"key":"2024121400205174200_btae677-B10","doi-asserted-by":"publisher","first-page":"367","DOI":"10.1016\/j.compbiolchem.2004.09.006","article-title":"Comparing two K-category assignments by a K-category correlation coefficient","volume":"28","author":"Gorodkin","year":"2004","journal-title":"Comput Biol Chem"},{"key":"2024121400205174200_btae677-B11","doi-asserted-by":"publisher","first-page":"bbaa302","DOI":"10.1093\/bib\/bbaa302","article-title":"GP4: an integrated Gram-positive protein prediction pipeline for subcellular localization mimicking bacterial sorting","volume":"22","author":"Grasso","year":"2021","journal-title":"Brief Bioinform"},{"key":"2024121400205174200_btae677-B12","doi-asserted-by":"publisher","first-page":"D803","DOI":"10.1093\/nar\/gkaa1095","article-title":"PSORTdb 4.0: expanded and redesigned bacterial and archaeal protein subcellular localization database incorporating new secondary localizations","volume":"49","author":"Lau","year":"2021","journal-title":"Nucleic Acids Res"},{"key":"2024121400205174200_btae677-B13","doi-asserted-by":"publisher","first-page":"1123","DOI":"10.1126\/science.ade2574","article-title":"Evolutionary-scale prediction of atomic-level protein structure with a language model","volume":"379","author":"Lin","year":"2023","journal-title":"Science"},{"key":"2024121400205174200_btae677-B14","doi-asserted-by":"publisher","first-page":"1425","DOI":"10.1016\/j.bbapap.2012.05.018","article-title":"MetaLocGramN: a meta-predictor of protein subcellular localization for gram-negative bacteria","volume":"1824","author":"Magnus","year":"2012","journal-title":"Biochim Biophys Acta"},{"key":"2024121400205174200_btae677-B15","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1111\/j.1574-6968.1990.tb04876.x","article-title":"Applications for biotechnology: present and future improvements in lactic acid bacteria","volume":"7","author":"McKay","year":"1990","journal-title":"FEMS Microbiol Rev"},{"key":"2024121400205174200_btae677-B16","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1007\/978-1-0716-3445-5_2","volume-title":"Bacterial Secretion Systems: Methods and Protocols","author":"Nielsen","year":"2024"},{"key":"2024121400205174200_btae677-B0970994","doi-asserted-by":"publisher","first-page":"3043","DOI":"10.1093\/bioinformatics\/btaa136","article-title":"PSORTm: A bacterial and archaeal protein subcellular localization prediction tool for metagenomics data","volume":"36","author":"Peabody","year":"2020","journal-title":"Bioinformatics"},{"key":"2024121400205174200_btae677-B17","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1155\/2002\/436561","article-title":"Perspectives on biotechnological applications of archaea","volume":"1","author":"Schiraldi","year":"2002","journal-title":"Archaea"},{"key":"2024121400205174200_btae677-B18","doi-asserted-by":"publisher","DOI":"10.1101\/2022.12.16.520742","article-title":"Protein language model for prediction of subcellular localization of protein sequences from gram-negative bacteria (ProtLM.SCL)","author":"Singh","year":"2022"},{"key":"2024121400205174200_btae677-B19","doi-asserted-by":"publisher","first-page":"vbab035","DOI":"10.1093\/bioadv\/vbab035","article-title":"Light attention predicts protein location from the language of life","volume":"1","author":"St\u00e4rk","year":"2021","journal-title":"Bioinform Adv"},{"key":"2024121400205174200_btae677-B20","doi-asserted-by":"publisher","first-page":"1023","DOI":"10.1038\/s41587-021-01156-3","article-title":"SignalP 6.0 predicts all five types of signal peptides using protein language models","volume":"40","author":"Teufel","year":"2022","journal-title":"Nat Biotechnol"},{"key":"2024121400205174200_btae677-B21","doi-asserted-by":"publisher","first-page":"lqad088","DOI":"10.1093\/nargab\/lqad088","article-title":"GraphPart: homology partitioning for biological sequence analysis","volume":"5","author":"Teufel","year":"2023","journal-title":"NAR Genom Bioinform"},{"key":"2024121400205174200_btae677-B22","doi-asserted-by":"publisher","first-page":"D523","DOI":"10.1093\/nar\/gkac1052","article-title":"UniProt: the universal protein knowledgebase in 2023","volume":"51","author":"The UniProt Consortium","year":"2023","journal-title":"Nucl Acids Res"},{"key":"2024121400205174200_btae677-B23","doi-asserted-by":"publisher","first-page":"W228","DOI":"10.1093\/nar\/gkac278","article-title":"DeepLoc 2.0: multi-label subcellular localization prediction using protein language models","volume":"50","author":"Thumuluri","year":"2022","journal-title":"Nucleic Acids Res"},{"key":"2024121400205174200_btae677-B24","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.chemolab.2016.12.014","article-title":"Gram-LocEN: interpretable prediction of subcellular multi-localization of Gram-positive and Gram-negative bacterial proteins","volume":"162","author":"Wan","year":"2017","journal-title":"Chemom Intell Lab Syst"},{"key":"2024121400205174200_btae677-B25","doi-asserted-by":"publisher","first-page":"1402","DOI":"10.1110\/ps.03479604","article-title":"Predicting subcellular localization of proteins for Gram-negative bacteria by support vector machines based on n-peptide compositions","volume":"13","author":"Yu","year":"2004","journal-title":"Protein Sci A Publ Protein Soc"},{"key":"2024121400205174200_btae677-B26","doi-asserted-by":"publisher","first-page":"1608","DOI":"10.1093\/bioinformatics\/btq249","article-title":"PSORTb 3.0: improved protein subcellular localization prediction with refined localization subcategories and predictive capabilities for all prokaryotes","volume":"26","author":"Yu","year":"2010","journal-title":"Bioinformatics"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btae677\/60675515\/btae677.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/12\/btae677\/60924512\/btae677.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/12\/btae677\/60924512\/btae677.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,13]],"date-time":"2024-12-13T19:20:59Z","timestamp":1734117659000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btae677\/7900293"}},"subtitle":[],"editor":[{"given":"Lenore","family":"Cowen","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2024,11,14]]},"references-count":27,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2024,11,28]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btae677","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2024.01.04.574157","asserted-by":"object"}]},"ISSN":["1367-4811"],"issn-type":[{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2024,12]]},"published":{"date-parts":[[2024,11,14]]},"article-number":"btae677"}}