{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,29]],"date-time":"2025-10-29T13:28:07Z","timestamp":1761744487755,"version":"3.37.3"},"reference-count":10,"publisher":"Oxford University Press (OUP)","issue":"12","license":[{"start":{"date-parts":[[2017,2,10]],"date-time":"2017-02-10T00:00:00Z","timestamp":1486684800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/academic.oup.com\/journals\/pages\/about_us\/legal\/notices"}],"funder":[{"DOI":"10.13039\/501100004586","name":"Funda\u00e7\u00e3o de Amparo \u00e0 Pesquisa do Estado do Rio de Janeiro","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004586","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,6,15]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Motivation<\/jats:title>\n                  <jats:p>Around 75% of all mass spectra remain unidentified by widely adopted proteomic strategies. We present DiagnoProt, an integrated computational environment that can efficiently cluster millions of spectra and use machine learning to shortlist high-quality unidentified mass spectra that are discriminative of different biological conditions.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Results<\/jats:title>\n                  <jats:p>We exemplify the use of DiagnoProt by shortlisting 4366 high-quality unidentified tandem mass spectra that are discriminative of different types of the Aspergillus fungus.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and Implementation<\/jats:title>\n                  <jats:p>DiagnoProt, a demonstration video and a user tutorial are available at http:\/\/patternlabforproteomics.org\/diagnoprot.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Supplementary information<\/jats:title>\n                  <jats:p>Supplementary data are available at Bioinformatics online.<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btx093","type":"journal-article","created":{"date-parts":[[2017,2,10]],"date-time":"2017-02-10T12:31:30Z","timestamp":1486729890000},"page":"1883-1885","source":"Crossref","is-referenced-by-count":6,"title":["DiagnoProt: a tool for discovery of new molecules by mass spectrometry"],"prefix":"10.1093","volume":"33","author":[{"given":"Andr\u00e9 R.F","family":"Silva","sequence":"first","affiliation":[{"name":"Systems Engineering and Computer Science Program, Federal University of Rio de Janeiro, Rio de Janeiro, Brazil"}]},{"given":"Diogo B","family":"Lima","sequence":"additional","affiliation":[{"name":"Institut Pasteur, Structural Mass Spectrometry and Proteomics Unit, Paris, France"}]},{"given":"Alejandro","family":"Leyva","sequence":"additional","affiliation":[{"name":"Analytical Biochemistry and Proteomics Unit, Institut Pasteur de Montevideo\/IIBCE, Montevideo, Uruguay"}]},{"given":"Rosario","family":"Duran","sequence":"additional","affiliation":[{"name":"Analytical Biochemistry and Proteomics Unit, Institut Pasteur de Montevideo\/IIBCE, Montevideo, Uruguay"}]},{"given":"Carlos","family":"Batthyany","sequence":"additional","affiliation":[{"name":"Analytical Biochemistry and Proteomics Unit, Institut Pasteur de Montevideo\/IIBCE, Montevideo, Uruguay"}]},{"given":"Priscila F","family":"Aquino","sequence":"additional","affiliation":[{"name":"Le\u00f4nidas and Maria Deane Institute, Fiocruz, Amazonas, Brazil"}]},{"given":"Juliana C","family":"Leal","sequence":"additional","affiliation":[{"name":"Le\u00f4nidas and Maria Deane Institute, Fiocruz, Amazonas, Brazil"}]},{"given":"Jimmy E","family":"Rodriguez","sequence":"additional","affiliation":[{"name":"Proteomics Unit, Chemistry Institute, Federal University of Rio de Janeiro, Rio de Janeiro, Brazil"}]},{"given":"Gilberto B","family":"Domont","sequence":"additional","affiliation":[{"name":"Proteomics Unit, Chemistry Institute, Federal University of Rio de Janeiro, Rio de Janeiro, Brazil"}]},{"given":"Marlon D.M","family":"Santos","sequence":"additional","affiliation":[{"name":"Carlos Chagas Institute, Computational Mass Spectrometry & Proteomics Group, Fiocruz, Paran\u00e1, Brazil"}]},{"given":"Julia","family":"Chamot-Rooke","sequence":"additional","affiliation":[{"name":"Institut Pasteur, Structural Mass Spectrometry and Proteomics Unit, Paris, France"}]},{"given":"Valmir C","family":"Barbosa","sequence":"additional","affiliation":[{"name":"Systems Engineering and Computer Science Program, Federal University of Rio de Janeiro, Rio de Janeiro, Brazil"}]},{"given":"Paulo C","family":"Carvalho","sequence":"additional","affiliation":[{"name":"Carlos Chagas Institute, Computational Mass Spectrometry & Proteomics Group, Fiocruz, Paran\u00e1, Brazil"},{"name":"Laboratory for Toxinology, Fiocruz, Rio de Janeiro, Brazil"}]}],"member":"286","published-online":{"date-parts":[[2017,2,10]]},"reference":[{"key":"2023020205492043700_btx093-B1","doi-asserted-by":"crossref","first-page":"5836","DOI":"10.1021\/pr300612x","article-title":"Are gastric cancer resection margin proteomic profiles more similar to those from controls or tumors?","volume":"11","author":"Aquino","year":"2012","journal-title":"J. Proteome Res"},{"key":"2023020205492043700_btx093-B2","doi-asserted-by":"crossref","first-page":"102","DOI":"10.1038\/nprot.2015.133","article-title":"Integrated analysis of shotgun proteomic data with PatternLab for proteomics 4.0","volume":"11","author":"Carvalho","year":"2015","journal-title":"Nat. Protoc"},{"key":"2023020205492043700_btx093-B3","doi-asserted-by":"crossref","first-page":"1865","DOI":"10.1007\/s13361-015-1179-x","article-title":"A deeper look into Comet\u2013implementation and features","volume":"26","author":"Eng","year":"2015","journal-title":"J. Am. Soc. Mass Spectrom"},{"key":"2023020205492043700_btx093-B4","doi-asserted-by":"crossref","first-page":"976","DOI":"10.1016\/1044-0305(94)80016-2","article-title":"An approach to correlate tandem mass spectral data of peptides with amino acid sequences in a protein database","volume":"5","author":"Eng","year":"1994","journal-title":"J. Am. Soc. Mass Spectrom"},{"key":"2023020205492043700_btx093-B5","doi-asserted-by":"crossref","first-page":"651","DOI":"10.1038\/nmeth.3902","article-title":"Recognizing millions of consistently unidentified spectra across hundreds of shotgun proteomics datasets","volume":"13","author":"Griss","year":"2016","journal-title":"Nat. Methods"},{"key":"2023020205492043700_btx093-B6","doi-asserted-by":"crossref","first-page":"2480","DOI":"10.1074\/mcp.M113.037002","article-title":"PepExplorer: a similarity-driven tool for analyzing de novo sequencing results","volume":"13","author":"Leprevost","year":"2014","journal-title":"Mol. Cell. Proteomics MCP"},{"key":"2023020205492043700_btx093-B7","doi-asserted-by":"crossref","first-page":"3241","DOI":"10.1021\/pr0603248","article-title":"Quality assessment of tandem mass spectra based on cumulative intensity normalization","volume":"5","author":"Na","year":"2006","journal-title":"J. Proteome Res"},{"key":"2023020205492043700_btx093-B8","doi-asserted-by":"crossref","first-page":"634","DOI":"10.1002\/pmic.200900459","article-title":"De novo sequencing of peptides by MS\/MS","volume":"10","author":"Seidler","year":"2010","journal-title":"Proteomics"},{"key":"2023020205492043700_btx093-B9","doi-asserted-by":"crossref","first-page":"828","DOI":"10.1038\/nbt.3597","article-title":"Sharing and community curation of mass spectrometry data with Global Natural Products Social Molecular Networking","volume":"34","author":"Wang","year":"2016","journal-title":"Nat. Biotechnol"},{"key":"2023020205492043700_btx093-B10","doi-asserted-by":"crossref","first-page":"1650","DOI":"10.1021\/ac015704l","article-title":"Analysis of quantitative proteomic data generated via multidimensional protein identification technology","volume":"74","author":"Washburn","year":"2002","journal-title":"Anal. Chem"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/33\/12\/1883\/49040085\/bioinformatics_33_12_1883.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/33\/12\/1883\/49040085\/bioinformatics_33_12_1883.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,2,2]],"date-time":"2023-02-02T05:52:37Z","timestamp":1675317157000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/33\/12\/1883\/2982301"}},"subtitle":[],"editor":[{"given":"John","family":"Hancock","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2017,2,10]]},"references-count":10,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2017,6,15]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btx093","relation":{},"ISSN":["1367-4803","1367-4811"],"issn-type":[{"type":"print","value":"1367-4803"},{"type":"electronic","value":"1367-4811"}],"subject":[],"published-other":{"date-parts":[[2017,6,15]]},"published":{"date-parts":[[2017,2,10]]}}}