{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T21:09:07Z","timestamp":1774904947194,"version":"3.50.1"},"reference-count":27,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2015,6,19]],"date-time":"2015-06-19T00:00:00Z","timestamp":1434672000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"published-print":{"date-parts":[[2015,12]]},"DOI":"10.1186\/s13321-015-0072-8","type":"journal-article","created":{"date-parts":[[2015,6,18]],"date-time":"2015-06-18T10:44:06Z","timestamp":1434624246000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":23,"title":["The Chemical Validation and Standardization Platform (CVSP): large-scale automated validation of chemical structure datasets"],"prefix":"10.1186","volume":"7","author":[{"given":"Karen","family":"Karapetyan","sequence":"first","affiliation":[]},{"given":"Colin","family":"Batchelor","sequence":"additional","affiliation":[]},{"given":"David","family":"Sharpe","sequence":"additional","affiliation":[]},{"given":"Valery","family":"Tkachenko","sequence":"additional","affiliation":[]},{"given":"Antony J","family":"Williams","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,6,19]]},"reference":[{"key":"72_CR1","unstructured":"The Molfile Format. [\n                    http:\/\/goldbook.iupac.org\/MT06966.html\n                    \n                  ]"},{"key":"72_CR2","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1021\/ci00057a005","volume":"28","author":"D Weininger","year":"1988","unstructured":"Weininger D. SMILES 1, Introduction and encoding rules. J Chem Inf Comput Sci. 1988;28:31.","journal-title":"J Chem Inf Comput Sci"},{"key":"72_CR3","unstructured":"The IUPAC International Chemical Identifier (InChI). [\n                    http:\/\/www.iupac.org\/inchi\/\n                    \n                  ]"},{"key":"72_CR4","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1186\/1758-2946-5-7","volume":"5","author":"S Heller","year":"2013","unstructured":"Heller S, McNaught A, Stein S, Tchekhovskoi D, Pletnev I. InChI - the worldwide chemical structure identifier standard. J Cheminf. 2013;5:7.","journal-title":"J Cheminf"},{"key":"72_CR5","unstructured":"Accelrys Draw. [\n                    http:\/\/accelrys.com\/products\/informatics\/cheminformatics\/draw\/\n                    \n                  ]"},{"key":"72_CR6","doi-asserted-by":"crossref","unstructured":"Williams AJ, Ekins S, Tkachenko V. Towards a Gold Standard: regarding quality in public domain chemistry databases and approaches to improving the situation. Drug Discov Today. 2012;13\u201314:685\u2013701.","DOI":"10.1016\/j.drudis.2012.02.013"},{"key":"72_CR7","doi-asserted-by":"publisher","first-page":"747","DOI":"10.1016\/j.drudis.2011.07.007","volume":"16","author":"AJ Williams","year":"2011","unstructured":"Williams AJ, Ekins S. A quality alert and call for improved curation of public chemistry databases. Drug Disc Today. 2011;16:747\u201350.","journal-title":"Drug Disc Today"},{"key":"72_CR8","doi-asserted-by":"publisher","first-page":"1123","DOI":"10.1021\/ed100697w","volume":"87","author":"H Pence","year":"2010","unstructured":"Pence H, Williams AJ. ChemSpider: An Online Chemical Information Resource. J Chem Educ. 2010;87:1123\u20134.","journal-title":"J Chem Educ"},{"key":"72_CR9","doi-asserted-by":"crossref","unstructured":"Williams AJ: ChemSpider: Integrating Structure-Based Resources Distributed Across the Internet. Enhancing Learning with Online Resources, Social Networking, and Digital Libraries. ACS Symposium Series. 1060: 2: 23-29.","DOI":"10.1021\/bk-2010-1060.ch002"},{"key":"72_CR10","doi-asserted-by":"publisher","first-page":"363","DOI":"10.1002\/9781118026038.ch22","volume-title":"Collaborative Computational Technologies for Biomedical Research","author":"AJ Williams","year":"2011","unstructured":"Williams AJ. Chemspider: A Platform for Crowdsourced Collaboration to Curate Data Derived From Public Compound Databases. In: Collaborative Computational Technologies for Biomedical Research. 2011. p. 363\u201386."},{"key":"72_CR11","doi-asserted-by":"publisher","first-page":"1188","DOI":"10.1016\/j.drudis.2012.05.016","volume":"17","author":"AJ Williams","year":"2012","unstructured":"Williams AJ, Harland L, Groth P, Pettifer S, Chichester C, Willighagen EL, et al. Open PHACTS: semantic interoperability for drug discovery. Drug Discov Today. 2012;17:1188\u201398.","journal-title":"Drug Discov Today"},{"key":"72_CR12","doi-asserted-by":"publisher","first-page":"843","DOI":"10.1016\/j.drudis.2013.05.008","volume":"18","author":"K Azzaoui","year":"2013","unstructured":"Azzaoui K, Jacoby E, Senger S, Rodriguez EC, Loza M, Zdrazil B, et al. Scientific competency questions as the basis for semantically enriched open pharmacological space development. Drug Discov Today. 2013;18:843\u201352.","journal-title":"Drug Discov Today"},{"key":"72_CR13","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1186\/1758-2946-5-23","volume":"5","author":"EL Willighagen","year":"2013","unstructured":"Willighagen EL, Waagmeester A, Spjuth O, Ansell P, Williams AJ, Tkachenko V, et al. The ChEMBL database as linked open data. J Cheminform. 2013;5:23.","journal-title":"J Cheminform"},{"key":"72_CR14","doi-asserted-by":"publisher","first-page":"D1100","DOI":"10.1093\/nar\/gkr777","volume":"40","author":"A Gaulton","year":"2012","unstructured":"Gaulton A, Bellis LJ, Bento AP, Chambers J, Davies M, Hersey A, et al. ChEMBL: a large-scale bioactivity database for drug discovery. Nucleic Acids Res. 2012;40:D1100\u20137.","journal-title":"Nucleic Acids Res"},{"key":"72_CR15","doi-asserted-by":"publisher","first-page":"D344","DOI":"10.1093\/nar\/gkm791","volume":"36","author":"K Degtyarenko","year":"2008","unstructured":"Degtyarenko K, de Matos P, Ennis M, Hastings J, Zbinden M, McNaught A, et al. ChEBI: a database and ontology for chemical entities of biological interest. Nucleic Acids Res. 2008;36:D344\u201350.","journal-title":"Nucleic Acids Res"},{"key":"72_CR16","doi-asserted-by":"publisher","first-page":"D668","DOI":"10.1093\/nar\/gkj067","volume":"34","author":"DS Wishart","year":"2006","unstructured":"Wishart DS, Knox C, Guo AC, Shrivastava S, Hassanali M, Stothard P, et al. DrugBank: a comprehensive resource for in silico drug discovery and exploration. Nucleic Acids Res. 2006;34:D668\u201372.","journal-title":"Nucleic Acids Res"},{"key":"72_CR17","doi-asserted-by":"publisher","first-page":"D901","DOI":"10.1093\/nar\/gkm958","volume":"36","author":"DS Wishart","year":"2008","unstructured":"Wishart DS, Knox C, Guo AC, Cheng D, Shrivastava S, Tzur D, et al. DrugBank: a knowledgebase for drugs, drug actions and drug targets. Nucleic Acids Res. 2008;36:D901\u20136.","journal-title":"Nucleic Acids Res"},{"issue":"Suppl. 1","key":"72_CR18","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1186\/1758-2946-3-S1-P4","volume":"3","author":"D Pavlov","year":"2011","unstructured":"Pavlov D, Rybalkin M, Karulin B, Kozhevnikov M, Savelyev A, Churinov A. Indigo: universal cheminformatics API. J Cheminf. 2011;3 Suppl 1:4.","journal-title":"J Cheminf"},{"key":"72_CR19","unstructured":"Open Eye ChemInformatics toolkit OEChem. [\n                    http:\/\/www.eyesopen.com\/oechem-tk\n                    \n                  ]"},{"key":"72_CR20","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1186\/1758-2946-3-33","volume":"3","author":"NM O\u2019Boyle","year":"2011","unstructured":"O\u2019Boyle NM, Banck M, James CA, Morley C, Vandermeersch T, Hutchison GR. Open Babel: An open chemical toolbox. J Cheminf. 2011;3:33.","journal-title":"J Cheminf"},{"key":"72_CR21","volume-title":"Open Source Software in Life Science Research","author":"A Day","year":"2012","unstructured":"Day A, Williams A, Batchelor C, Kidd R, Tkachenko V. Utilizing open source software to facilitate communication of chemistry at RSC. In: Harland L, Forster M, editors. Open Source Software in Life Science Research. Oxford: Woodhead Publishing; 2012."},{"key":"72_CR22","unstructured":"FDA Substance Registration System User\u2019s Guide Version 5c [\n                    http:\/\/www.fda.gov\/downloads\/ForIndustry\/DataStandards\/SubstanceRegistrationSystem-UniqueIngredientIdentifierUNII\/ucm127743.pdf\n                    \n                  ]"},{"key":"72_CR23","doi-asserted-by":"publisher","first-page":"D1035","DOI":"10.1093\/nar\/gkq1126","volume":"39","author":"C Knox","year":"2011","unstructured":"Knox C, Law V, Jewison T, Liu P, Ly S, Frolkis A, et al. DrugBank 3.0: a comprehensive resource for \u2018omics\u2019 research on drugs. Nucleic Acids Res. 2011;39:D1035.","journal-title":"Nucleic Acids Res"},{"key":"72_CR24","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1007\/s11030-006-9041-5","volume":"10","author":"M Hassan","year":"2006","unstructured":"Hassan M, Brown RD, Varma-O'brien S, Rogers D. Cheminformatics analysis and learning in a data pipelining environment. Mol Divers. 2006;10:283\u201399.","journal-title":"Mol Divers"},{"key":"72_CR25","unstructured":"SciTegic Pipeline Pilot, version Version 7.5.2; 2009. [\n                    http:\/\/accelrys.com\/products\/scitegic\/\n                    \n                  ]"},{"key":"72_CR26","doi-asserted-by":"crossref","unstructured":"Berthold M, Cebron N, Dill F, Gabriel T, K\u00f6tter T, Meinl T, et al. In Data Analysis, Machine Learning and Applications. Edited by Preisach C, Burkhardt H, Schmidt-Thieme L, Decker R: Springer Berlin Heidelberg; 2008: 319\u2013326: Studies in Classification, Data Analysis, and Knowledge Organization.","DOI":"10.1007\/978-3-540-78246-9_38"},{"key":"72_CR27","unstructured":"PharmaSea. [\n                    http:\/\/www.pharma-sea.eu\/\n                    \n                  ]"}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-015-0072-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13321-015-0072-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-015-0072-8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-015-0072-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,24]],"date-time":"2019-06-24T10:05:16Z","timestamp":1561370716000},"score":1,"resource":{"primary":{"URL":"https:\/\/jcheminf.biomedcentral.com\/articles\/10.1186\/s13321-015-0072-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,6,19]]},"references-count":27,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2015,12]]}},"alternative-id":["72"],"URL":"https:\/\/doi.org\/10.1186\/s13321-015-0072-8","relation":{},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,6,19]]},"assertion":[{"value":"28 October 2014","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 April 2015","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 June 2015","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"30"}}