{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,20]],"date-time":"2026-02-20T00:55:41Z","timestamp":1771548941477,"version":"3.50.1"},"reference-count":36,"publisher":"Oxford University Press (OUP)","issue":"10","license":[{"start":{"date-parts":[[2025,9,24]],"date-time":"2025-09-24T00:00:00Z","timestamp":1758672000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"Fonds de recherche du Qu\u00e9bec secteur Nature et technologies","award":["325947"],"award-info":[{"award-number":["325947"]}]},{"name":"CREATE Responsible Health and Healthcare Data Science"},{"DOI":"10.13039\/501100000038","name":"Natural Sciences and Engineering Research Council of Canada","doi-asserted-by":"crossref","id":[{"id":"10.13039\/501100000038","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Mitacs Globalink Research program","award":["IT41138"],"award-info":[{"award-number":["IT41138"]}]},{"name":"Research Scholars\u2014Junior 1"},{"name":"Fonds de recherche du Qu\u00e9bec secteur Sant\u00e9","award":["307935"],"award-info":[{"award-number":["307935"]}]},{"name":"Bijzonder Onderzoeksfonds","award":["01P10022"],"award-info":[{"award-number":["01P10022"]}]},{"name":"2024 from the European Society of Clinical Microbiology and Infectious Diseases"},{"name":"Research Foundation\u2014Flanders","award":["1S15424N"],"award-info":[{"award-number":["1S15424N"]}]},{"name":"Compute Ontario"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,2]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Summary<\/jats:title>\n                  <jats:p>SPAED is an accessible tool for the accurate segmentation of protein domains that leverages information contained in the predicted aligned error (PAE) matrix obtained from AlphaFold to better identify domain-linker boundaries and detect terminal disordered regions. On a dataset of 376 bacteriophage endolysins (proteins that degrade the bacterial cell wall), SPAED achieves a mean intersect-over-union score of 96% and a domain-boundary-distance score of 89% compared to 94% and 70%, respectively, for the state-of-the-art tool Chainsaw.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and implementation<\/jats:title>\n                  <jats:p>Implemented in Python, SPAED is accessible on the web (https:\/\/spaed.ca) and available for download from https:\/\/github.com\/Rousseau-Team\/spaed or https:\/\/pypi.org\/project\/spaed. The data used to test SPAED can be found at https:\/\/doi.org\/10.5281\/zenodo.15285860.<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btaf531","type":"journal-article","created":{"date-parts":[[2025,9,24]],"date-time":"2025-09-24T15:51:02Z","timestamp":1758729062000},"source":"Crossref","is-referenced-by-count":2,"title":["SPAED: harnessing AlphaFold output for accurate segmentation of phage endolysin domains"],"prefix":"10.1093","volume":"41","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-5796-8598","authenticated-orcid":false,"given":"Alexandre","family":"Boulay","sequence":"first","affiliation":[{"name":"Department of Biotechnology, Ghent University , Ghent B-9000,","place":["Belgium"]},{"name":"D\u00e9partement de biochimie, de microbiologie et de bio-informatique, Universit\u00e9 Laval , Qu\u00e9bec, QC, G1V 0A6,","place":["Canada"]},{"name":"Centre Nutrition, Sant\u00e9 et Soci\u00e9t\u00e9 (NUTRISS), Institute of Nutrition and Functional Foods (INAF), Universit\u00e9 Laval , Qu\u00e9bec, QC, G1V 0A6,","place":["Canada"]}]},{"given":"Emma","family":"Cremelie","sequence":"additional","affiliation":[{"name":"Department of Biotechnology, Ghent University , Ghent B-9000,","place":["Belgium"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0560-6023","authenticated-orcid":false,"given":"Clovis","family":"Galiez","sequence":"additional","affiliation":[{"name":"Univ. Grenoble Alpes, CNRS, Grenoble INP, LJK , Grenoble 38000,","place":["France"]}]},{"given":"Yves","family":"Briers","sequence":"additional","affiliation":[{"name":"Department of Biotechnology, Ghent University , Ghent B-9000,","place":["Belgium"]}]},{"given":"Elsa","family":"Rousseau","sequence":"additional","affiliation":[{"name":"Centre Nutrition, Sant\u00e9 et Soci\u00e9t\u00e9 (NUTRISS), Institute of Nutrition and Functional Foods (INAF), Universit\u00e9 Laval , Qu\u00e9bec, QC, G1V 0A6,","place":["Canada"]},{"name":"D\u00e9partement d\u2019informatique et de g\u00e9nie logiciel, Universit\u00e9 Laval , Qu\u00e9bec, QC, G1V 0A6,","place":["Canada"]},{"name":"Centre de Recherche en Donn\u00e9es Massives (CRDM), Universit\u00e9 Laval , Qu\u00e9bec, QC, G1V OA6,","place":["Canada"]},{"name":"Institut Intelligence et Donn\u00e9es (IID), Universit\u00e9 Laval , Qu\u00e9bec, QC, G1V 0A6,","place":["Canada"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7919-552X","authenticated-orcid":false,"given":"Roberto","family":"V\u00e1zquez","sequence":"additional","affiliation":[{"name":"Department of Biotechnology, Ghent University , Ghent B-9000,","place":["Belgium"]},{"name":"Centro de Investigaci\u00f3n Biom\u00e9dica en Red de Enfermedades Respiratorias (CIBERES) , Madrid 28029,","place":["Spain"]}]}],"member":"286","published-online":{"date-parts":[[2025,9,24]]},"reference":[{"key":"2025101607414973100_btaf531-B1","doi-asserted-by":"crossref","first-page":"493","DOI":"10.1038\/s41586-024-07487-w","article-title":"Accurate structure prediction of biomolecular interactions with AlphaFold 3","volume":"630","author":"Abramson","year":"2024","journal-title":"Nature"},{"key":"2025101607414973100_btaf531-B2","first-page":"33","volume-title":"Advances in Virus Research","author":"Cahill","year":"2019"},{"key":"2025101607414973100_btaf531-B3","doi-asserted-by":"crossref","first-page":"W732","DOI":"10.1093\/nar\/gkac370","article-title":"SWORD2: hierarchical analysis of protein 3D structures","volume":"50","author":"Cretin","year":"2022","journal-title":"Nucleic Acids Res"},{"key":"2025101607414973100_btaf531-B4","doi-asserted-by":"crossref","first-page":"1240","DOI":"10.3390\/v13071240","article-title":"PhaLP: a database for the study of phage lytic proteins and their evolution","volume":"13","author":"Criel","year":"2021","journal-title":"Viruses"},{"key":"2025101607414973100_btaf531-B5","doi-asserted-by":"crossref","first-page":"125","DOI":"10.1038\/s41579-019-0311-5","article-title":"Phage diversity, genomics and phylogeny","volume":"18","author":"Dion","year":"2020","journal-title":"Nat Rev Microbiol"},{"key":"2025101607414973100_btaf531-B6","doi-asserted-by":"crossref","first-page":"1740","DOI":"10.1093\/bioinformatics\/btz650","article-title":"Multi-scale structural analysis of proteins by deep semantic segmentation","volume":"36","author":"Eguchi","year":"2020","journal-title":"Bioinformatics"},{"key":"2025101607414973100_btaf531-B7","doi-asserted-by":"crossref","first-page":"624","DOI":"10.1016\/j.biotechadv.2017.12.009","article-title":"Synthetic biology of modular endolysins","volume":"36","author":"Gerstmans","year":"2018","journal-title":"Biotechnol Adv"},{"key":"2025101607414973100_btaf531-B8","doi-asserted-by":"crossref","first-page":"eaaz1136","DOI":"10.1126\/sciadv.aaz1136","article-title":"A VersaTile-driven platform for rapid hit-to-lead development of engineered lysins","volume":"6","author":"Gerstmans","year":"2020","journal-title":"Sci Adv"},{"key":"2025101607414973100_btaf531-B9","doi-asserted-by":"crossref","first-page":"2714","DOI":"10.1002\/elps.1150181505","article-title":"SWISS-MODEL and the Swiss-Pdb viewer: an environment for comparative protein modeling","volume":"18","author":"Guex","year":"1997","journal-title":"Electrophoresis"},{"key":"2025101607414973100_btaf531-B10","doi-asserted-by":"crossref","first-page":"10696","DOI":"10.1038\/s41598-022-14382-9","article-title":"AlphaFold2 models indicate that protein sequence determines both structure and dynamics","volume":"12","author":"Guo","year":"2022","journal-title":"Sci Rep"},{"key":"2025101607414973100_btaf531-B11","doi-asserted-by":"crossref","first-page":"583","DOI":"10.1038\/s41586-021-03819-2","article-title":"Highly accurate protein structure prediction with AlphaFold","volume":"596","author":"Jumper","year":"2021","journal-title":"Nature"},{"key":"2025101607414973100_btaf531-B12","doi-asserted-by":"crossref","first-page":"317","DOI":"10.1038\/nrmicro2315","article-title":"Bacteriophage resistance mechanisms","volume":"8","author":"Labrie","year":"2010","journal-title":"Nat Rev Microbiol"},{"key":"2025101607414973100_btaf531-B13","doi-asserted-by":"crossref","first-page":"8445","DOI":"10.1038\/s41467-023-43934-4","article-title":"Merizo: a rapid and accurate protein domain segmentation method using invariant point attention","volume":"14","author":"Lau","year":"2023","journal-title":"Nat Commun"},{"key":"2025101607414973100_btaf531-B14","doi-asserted-by":"publisher","first-page":"1395450","DOI":"10.3389\/fmolb.2024.1395450","article-title":"A pangenome analysis of ESKAPE bacteriophages: the underrepresentation may impact machine learning models","volume":"11","author":"Lee","year":"2024","journal-title":"Front Mol Biosci"},{"key":"2025101607414973100_btaf531-B15","doi-asserted-by":"crossref","first-page":"9851","DOI":"10.1073\/pnas.1207382109","article-title":"Hydrophobic forces and the length limit of foldable protein domains","volume":"109","author":"Lin","year":"2012","journal-title":"Proc Natl Acad Sci USA"},{"key":"2025101607414973100_btaf531-B16","doi-asserted-by":"crossref","first-page":"679","DOI":"10.1038\/s41592-022-01488-1","article-title":"ColabFold: making protein folding accessible to all","volume":"19","author":"Mirdita","year":"2022","journal-title":"Nat Methods"},{"key":"2025101607414973100_btaf531-B17","doi-asserted-by":"crossref","first-page":"7","DOI":"10.1002\/prot.25415","article-title":"Critical assessment of methods of protein structure prediction (CASP)\u2014Round XII","volume":"86","author":"Moult","year":"2018","journal-title":"Proteins"},{"key":"2025101607414973100_btaf531-B18","doi-asserted-by":"crossref","first-page":"76","DOI":"10.1007\/s00253-023-12839-z","article-title":"New bacteriophage-derived lysins, LysJ and LysF, with the potential to control Bacillus anthracis","volume":"108","author":"Nakonieczna","year":"2024","journal-title":"Appl Microbiol Biotechnol"},{"key":"2025101607414973100_btaf531-B19","doi-asserted-by":"crossref","first-page":"e3001740","DOI":"10.1371\/journal.pbio.3001740","article-title":"Phage endolysins are adapted to specific hosts and are evolutionarily dynamic","volume":"20","author":"Oechslin","year":"2022","journal-title":"PLoS Biol"},{"key":"2025101607414973100_btaf531-B20","doi-asserted-by":"crossref","first-page":"4558","DOI":"10.1128\/JVI.03277-12","article-title":"Molecular aspects and comparative genomics of bacteriophage endolysins","volume":"87","author":"Oliveira","year":"2013","journal-title":"J Virol"},{"key":"2025101607414973100_btaf531-B21","doi-asserted-by":"crossref","first-page":"e232","DOI":"10.1371\/journal.pcbi.0030232","article-title":"CATHEDRAL: a fast and effective algorithm to predict folds and domain boundaries from multidomain protein structures","volume":"3","author":"Redfern","year":"2007","journal-title":"PLoS Comput Biol"},{"key":"2025101607414973100_btaf531-B22","doi-asserted-by":"crossref","first-page":"5823","DOI":"10.1128\/JB.182.20.5823-5831.2000","article-title":"The N-Terminal region of the oenococcus oeniBacteriophage fOg44 lysin behaves as a bona fide signal peptide in Escherichia coli and as a cis-Inhibitory element, preventing lytic activity on oenococcal cells","volume":"182","author":"S\u00e3o-Jos\u00e9","year":"2000","journal-title":"J Bacteriol"},{"key":"2025101607414973100_btaf531-B23","doi-asserted-by":"crossref","first-page":"1147","DOI":"10.2217\/fmb.12.97","article-title":"Bacteriophage endolysins as novel antimicrobials","volume":"7","author":"Schmelcher","year":"2012","journal-title":"Future Microbiol"},{"key":"2025101607414973100_btaf531-B25","doi-asserted-by":"crossref","first-page":"183","DOI":"10.1002\/prot.20736","article-title":"Evaluation of domain prediction in CASP6","volume":"61","author":"Tai","year":"2005","journal-title":"Proteins"},{"key":"2025101607414973100_btaf531-B26","doi-asserted-by":"crossref","first-page":"137","DOI":"10.1002\/prot.21675","article-title":"Assessment of predictions submitted for the CASP7 domain prediction category","volume":"69","author":"Tress","year":"2007","journal-title":"Proteins"},{"key":"2025101607414973100_btaf531-B27","doi-asserted-by":"crossref","first-page":"5495","DOI":"10.1007\/s00253-022-12072-0","article-title":"Conversion of the free Cellvibrio japonicus xyloglucan degradation system to the cellulosomal mode","volume":"106","author":"Vanderstraeten","year":"2022","journal-title":"Appl Microbiol Biotechnol"},{"key":"2025101607414973100_btaf531-B28","doi-asserted-by":"crossref","first-page":"e00321-21","DOI":"10.1128\/JVI.00321-21","article-title":"Sequence-function relationships in phage-encoded bacterial cell wall lytic enzymes and their implications for Phage-Derived product design","volume":"95","author":"V\u00e1zquez","year":"2021","journal-title":"J Virol"},{"key":"2025101607414973100_btaf531-B29","doi-asserted-by":"publisher","DOI":"10.1007\/s12602-024-10309-0","article-title":"The new SH3b_T domain increases the structural and functional variability among SH3b-Like CBDs from staphylococcal phage endolysins","author":"V\u00e1zquez","year":"2024","journal-title":"Probiotics Antimicro Prot"},{"key":"2025101607414973100_btaf531-B30","doi-asserted-by":"crossref","first-page":"143093","DOI":"10.1016\/j.ijbiomac.2025.143093","article-title":"Diversity, structure-function relationships and evolution of cell wall-binding domains of staphylococcal phage endolysins","volume":"310","author":"V\u00e1zquez","year":"2025","journal-title":"Int J Biol Macromol"},{"key":"2025101607414973100_btaf531-B31","doi-asserted-by":"crossref","first-page":"1145","DOI":"10.1016\/j.csbj.2021.01.041","article-title":"Protein domain identification methods and online resources","volume":"19","author":"Wang","year":"2021","journal-title":"Comput Struct Biotechnol J"},{"key":"2025101607414973100_btaf531-B32","doi-asserted-by":"crossref","first-page":"1089","DOI":"10.1038\/s41586-023-06415-8","article-title":"De novo design of protein structure and function with RFdiffusion","volume":"620","author":"Watson","year":"2023","journal-title":"Nature"},{"key":"2025101607414973100_btaf531-B33","doi-asserted-by":"crossref","first-page":"btae296","DOI":"10.1093\/bioinformatics\/btae296","article-title":"Chainsaw: protein domain segmentation with fully convolutional neural networks","volume":"40","author":"Wells","year":"2024","journal-title":"Bioinformatics"},{"key":"2025101607414973100_btaf531-B34","doi-asserted-by":"crossref","first-page":"e0141541","DOI":"10.1371\/journal.pone.0141541","article-title":"Extending protein domain boundary predictors to detect discontinuous domains","volume":"10","author":"Xue","year":"2015","journal-title":"PLoS One"},{"key":"2025101607414973100_btaf531-B35","doi-asserted-by":"crossref","first-page":"e4548","DOI":"10.1002\/pro.4548","article-title":"DPAM: a domain parser for AlphaFold models","volume":"32","author":"Zhang","year":"2023","journal-title":"Protein Sci"},{"key":"2025101607414973100_btaf531-B36","doi-asserted-by":"crossref","first-page":"15930","DOI":"10.1073\/pnas.1905068116","article-title":"Assembling multidomain protein structures through analogous global structural alignments","volume":"116","author":"Zhou","year":"2019","journal-title":"Proc Natl Acad Sci USA"},{"key":"2025101607414973100_btaf531-B37","doi-asserted-by":"crossref","first-page":"btad070","DOI":"10.1093\/bioinformatics\/btad070","article-title":"A unified approach to protein domain parsing with inter-residue distance matrix","volume":"39","author":"Zhu","year":"2023","journal-title":"Bioinformatics"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btaf531\/64373687\/btaf531.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/41\/10\/btaf531\/64373687\/btaf531.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/41\/10\/btaf531\/64373687\/btaf531.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,16]],"date-time":"2025-10-16T11:42:00Z","timestamp":1760614920000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btaf531\/8262958"}},"subtitle":[],"editor":[{"given":"Arne","family":"Elofsson","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2025,9,24]]},"references-count":36,"journal-issue":{"issue":"10","published-print":{"date-parts":[[2025,10,2]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btaf531","relation":{},"ISSN":["1367-4803","1367-4811"],"issn-type":[{"value":"1367-4803","type":"print"},{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2025,10]]},"published":{"date-parts":[[2025,9,24]]},"article-number":"btaf531"}}