{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T05:33:20Z","timestamp":1774330400579,"version":"3.50.1"},"reference-count":93,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2017,6,6]],"date-time":"2017-06-06T00:00:00Z","timestamp":1496707200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1186\/s13321-017-0220-4","type":"journal-article","created":{"date-parts":[[2017,6,6]],"date-time":"2017-06-06T12:21:22Z","timestamp":1496751682000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":342,"title":["The Chemistry Development Kit (CDK) v2.0: atom typing, depiction, molecular formulas, and substructure searching"],"prefix":"10.1186","volume":"9","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7542-0286","authenticated-orcid":false,"given":"Egon L.","family":"Willighagen","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7730-2646","authenticated-orcid":false,"given":"John W.","family":"Mayfield","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8682-7206","authenticated-orcid":false,"given":"Jonathan","family":"Alvarsson","sequence":"additional","affiliation":[]},{"given":"Arvid","family":"Berg","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9491-4134","authenticated-orcid":false,"given":"Lars","family":"Carlsson","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4322-6179","authenticated-orcid":false,"given":"Nina","family":"Jeliazkova","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5990-4157","authenticated-orcid":false,"given":"Stefan","family":"Kuhn","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6940-3006","authenticated-orcid":false,"given":"Tom\u00e1\u0161","family":"Pluskal","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4659-1446","authenticated-orcid":false,"given":"Miquel","family":"Rojas-Chert\u00f3","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8083-2864","authenticated-orcid":false,"given":"Ola","family":"Spjuth","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8368-6954","authenticated-orcid":false,"given":"Gilleain","family":"Torrance","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5301-3142","authenticated-orcid":false,"given":"Chris T.","family":"Evelo","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7403-8819","authenticated-orcid":false,"given":"Rajarshi","family":"Guha","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6966-0814","authenticated-orcid":false,"given":"Christoph","family":"Steinbeck","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,6,6]]},"reference":[{"issue":"1","key":"220_CR1","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1186\/1758-2946-3-37","volume":"3","author":"N O\u2019Boyle","year":"2011","unstructured":"O\u2019Boyle N, Guha R, Willighagen E, Adams S, Alvarsson J, Bradley JC et al (2011) Open Data, Open Source and Open Standards in chemistry: The Blue Obelisk five years on. J Cheminform 3(1):37","journal-title":"J Cheminform"},{"issue":"3","key":"220_CR2","doi-asserted-by":"publisher","first-page":"991","DOI":"10.1021\/ci050400b","volume":"46","author":"R Guha","year":"2006","unstructured":"Guha R, Howard MT, Hutchison GR, Murray-Rust P, Rzepa H, Steinbeck C et al (2006) The Blue Obelisk\u2014interoperability in chemical informatics. J Chem Inf Model 46(3):991\u2013998","journal-title":"J Chem Inf Model"},{"issue":"2","key":"220_CR3","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1021\/ci025584y","volume":"43","author":"C Steinbeck","year":"2003","unstructured":"Steinbeck C, Han Y, Kuhn S, Horlacher O, Luttmann E, Willighagen E (2003) The Chemistry Development Kit (CDK): an open-source Java library for Chemo- and Bioinformatics. J Chem Inf Comput Sci 43(2):493\u2013500","journal-title":"J Chem Inf Comput Sci"},{"issue":"17","key":"220_CR4","doi-asserted-by":"publisher","first-page":"2111","DOI":"10.2174\/138161206777585274","volume":"12","author":"C Steinbeck","year":"2006","unstructured":"Steinbeck C, Hoppe C, Kuhn S, Floris M, Guha R, Willighagen EL (2006) Recent developments of the Chemistry Development Kit (CDK)\u2014an open-source java library for chemo- and bioinformatics. Curr Pharm Des 12(17):2111\u20132120","journal-title":"Curr Pharm Des"},{"key":"220_CR5","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1186\/1752-153X-2-24","volume":"2","author":"NM O\u2019Boyle","year":"2008","unstructured":"O\u2019Boyle NM, Hutchison GR (2008) Cinfony\u2013combining Open Source cheminformatics toolkits behind a common interface. Chem Cent J 2:24","journal-title":"Chem Cent J"},{"issue":"5","key":"220_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.18637\/jss.v018.i05","volume":"18","author":"R Guha","year":"2007","unstructured":"Guha R (2007) Chemical informatics functionality in R. J Stat Softw 18(5):1\u201316","journal-title":"J Stat Softw"},{"issue":"1","key":"220_CR7","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1758-2946-3-54","volume":"3","author":"A Truszkowski","year":"2011","unstructured":"Truszkowski A, Jayaseelan KV, Neumann S, Willighagen EL, Zielesny A, Steinbeck C (2011) New developments on the cheminformatics open workflow environment CDK-Taverna. J Cheminform 3(1):1\u201310","journal-title":"J Cheminform"},{"issue":"1","key":"220_CR8","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1186\/1471-2105-14-257","volume":"14","author":"S Beisken","year":"2013","unstructured":"Beisken S, Meinl T, Wiswedel B, de Figueiredo L, Berthold M, Steinbeck C (2013) KNIME-CDK: workflow-driven cheminformatics. BMC Bioinform 14(1):257","journal-title":"BMC Bioinform"},{"key":"220_CR9","unstructured":"ChemViz2: Cheminformatics App for Cytoscape; 2016. http:\/\/www.rbvi.ucsf.edu\/cytoscape\/chemViz2\/"},{"issue":"1","key":"220_CR10","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/1758-2946-4-3","volume":"4","author":"KR Lawson","year":"2012","unstructured":"Lawson KR, Lawson J (2012) LICSS\u2014a chemical spreadsheet in microsoft excel. J Cheminform 4(1):3","journal-title":"J Cheminform"},{"issue":"1","key":"220_CR11","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/1758-2946-3-3","volume":"3","author":"G Hinselmann","year":"2011","unstructured":"Hinselmann G, Rosenbaum L, Jahn A, Fechner N, Zell A (2011) jCompoundMapper: an open source Java library and command-line tool for chemical fingerprints. J Cheminform 3(1):3","journal-title":"J Cheminform"},{"issue":"8","key":"220_CR12","doi-asserted-by":"publisher","first-page":"581","DOI":"10.1038\/nchembio.187","volume":"5","author":"S Wetzel","year":"2009","unstructured":"Wetzel S, Klein K, Renner S, Rauh D, Oprea TI, Mutzel P et al (2009) Interactive exploration of chemical space with Scaffold Hunter. Nat Chem Biol 5(8):581\u2013583","journal-title":"Nat Chem Biol"},{"issue":"11\u201312","key":"220_CR13","doi-asserted-by":"publisher","first-page":"964","DOI":"10.1002\/minf.201300087","volume":"32","author":"K Klein","year":"2013","unstructured":"Klein K, Koch O, Kriege N, Mutzel P, Sch\u00e4fer T (2013) Visual analysis of biological activity data with Scaffold Hunter. Mol Inform 32(11\u201312):964\u2013975","journal-title":"Mol Inform"},{"issue":"1","key":"220_CR14","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1758-2946-4-21","volume":"4","author":"JE Peironcely","year":"2012","unstructured":"Peironcely JE, Rojas-Chert\u00f3 M, Fichera D, Reijmers T, Coulier L, Faulon JL et al (2012) OMG: open molecule generator. J Cheminform 4(1):1\u201313","journal-title":"J Cheminform"},{"issue":"7","key":"220_CR15","doi-asserted-by":"publisher","first-page":"1466","DOI":"10.1002\/jcc.21707","volume":"32","author":"CW Yap","year":"2011","unstructured":"Yap CW (2011) PaDEL-descriptor: an open source software to calculate molecular descriptors and fingerprints. J Comput Chem 32(7):1466\u20131474","journal-title":"J Comput Chem"},{"issue":"1","key":"220_CR16","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1186\/s13321-015-0109-z","volume":"7","author":"J Dong","year":"2015","unstructured":"Dong J, Cao DS, Miao HY, Liu S, Deng BC, Yun YH et al (2015) ChemDes: an integrated web-based platform for molecular descriptor and fingerprint computation. J Cheminform 7(1):60","journal-title":"J Cheminform"},{"key":"220_CR17","doi-asserted-by":"crossref","first-page":"3522","DOI":"10.1093\/bioinformatics\/btw491","volume":"32","author":"TV Sivakumar","year":"2016","unstructured":"Sivakumar TV, Giri V, Park JH, Kim TY, Bhaduri A (2016) ReactPRED: a tool to predict and analyze biochemical reactions. Bioinformatics 32:3522\u20133524","journal-title":"Bioinformatics"},{"issue":"1","key":"220_CR18","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1186\/1758-2946-1-12","volume":"1","author":"SA Rahman","year":"2009","unstructured":"Rahman SA, Bashton M, Holliday GL, Schrader R, Thornton JM (2009) Small Molecule Subgraph Detector (SMSD) toolkit. J Cheminform 1(1):12","journal-title":"J Cheminform"},{"issue":"2","key":"220_CR19","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1038\/nmeth.2803","volume":"11","author":"SA Rahman","year":"2014","unstructured":"Rahman SA, Cuesta SM, Furnham N, Holliday GL, Thornton JM (2014) EC-BLAST: a tool to automatically search and compare enzyme reactions. Nat Methods 11(2):171\u2013174","journal-title":"Nat Methods"},{"issue":"13","key":"220_CR20","doi-asserted-by":"publisher","first-page":"2065","DOI":"10.1093\/bioinformatics\/btw096","volume":"32","author":"SA Rahman","year":"2016","unstructured":"Rahman SA, Torrance G, Baldacci L, Cuesta SM, Fenninger F, Gopal N et al (2016) Reaction Decoder Tool (RDT): extracting features from chemical reactions. Bioinformatics 32(13):2065\u20132066","journal-title":"Bioinformatics"},{"issue":"16","key":"220_CR21","doi-asserted-by":"publisher","first-page":"2051","DOI":"10.1093\/bioinformatics\/btt325","volume":"29","author":"M Rostkowski","year":"2013","unstructured":"Rostkowski M, Spjuth O, Rydberg P (2013) WhichCyp: prediction of cytochromes P450 inhibition. Bioinformatics 29(16):2051\u20132052","journal-title":"Bioinformatics"},{"issue":"1","key":"220_CR22","doi-asserted-by":"publisher","first-page":"362","DOI":"10.1186\/1471-2105-11-362","volume":"11","author":"L Carlsson","year":"2010","unstructured":"Carlsson L, Spjuth O, Adams S, Glen RC, Boyer S (2010) Use of historic metabolic biotransformation data as a means of anticipating metabolic sites using MetaPrint2D and Bioclipse. BMC Bioinform 11(1):362","journal-title":"BMC Bioinform"},{"issue":"1","key":"220_CR23","doi-asserted-by":"publisher","first-page":"148","DOI":"10.1186\/1471-2105-11-148","volume":"11","author":"S Wolf","year":"2010","unstructured":"Wolf S, Schmidt S, M\u00fcller-Hannemann M, Neumann S (2010) In silico fragmentation for computer assisted identification of metabolite mass spectra. BMC Bioinform 11(1):148","journal-title":"BMC Bioinform"},{"issue":"D1","key":"220_CR24","doi-asserted-by":"publisher","first-page":"D1054","DOI":"10.1093\/nar\/gkv1037","volume":"44","author":"C Southan","year":"2016","unstructured":"Southan C, Sharman JL, Benson HE, Faccenda E, Pawson AJ, Alexander SPH et al (2016) The IUPHAR\/BPS Guide to PHARMACOLOGY in 2016: towards curated quantitative interactions between 1300 protein targets and 6000 ligands. Nucleic Acids Res 44(D1):D1054\u2013D1068","journal-title":"Nucleic Acids Res"},{"issue":"D1","key":"220_CR25","doi-asserted-by":"publisher","first-page":"D380","DOI":"10.1093\/nar\/gkw952","volume":"45","author":"S Placzek","year":"2017","unstructured":"Placzek S, Schomburg I, Chang A, Jeske L, Ulbrich M, Tillack J et al (2017) BRENDA in 2017: new perspectives and new tools in BRENDA. Nucleic Acids Res 45(D1):D380\u2013D388","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"220_CR26","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1186\/s13321-015-0082-6","volume":"7","author":"V Ruusmann","year":"2015","unstructured":"Ruusmann V, Sild S, Maran U (2015) QSAR DataBank repository: open and linked qualitative and quantitative structure activity relationship models. J Cheminform 7(1):35","journal-title":"J Cheminform"},{"issue":"1","key":"220_CR27","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1186\/1471-2105-8-59","volume":"8","author":"O Spjuth","year":"2007","unstructured":"Spjuth O, Helmus T, Willighagen EL, Kuhn S, Eklund M, Wagener J et al (2007) Bioclipse: an open source workbench for chemo- and bioinformatics. BMC Bioinform 8(1):59","journal-title":"BMC Bioinform"},{"issue":"1","key":"220_CR28","doi-asserted-by":"publisher","first-page":"397","DOI":"10.1186\/1471-2105-10-397","volume":"10","author":"O Spjuth","year":"2009","unstructured":"Spjuth O, Alvarsson J, Berg A, Eklund M, Kuhn S, M\u00e4sak C et al (2009) Bioclipse 2: a scriptable integration platform for the life sciences. BMC Bioinform 10(1):397","journal-title":"BMC Bioinform"},{"issue":"1","key":"220_CR29","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1758-2946-3-18","volume":"3","author":"N Jeliazkova","year":"2011","unstructured":"Jeliazkova N, Jeliazkov V (2011) AMBIT RESTful web services: an implementation of the OpenTox application programming interface. J Cheminform 3(1):1\u201318","journal-title":"J Cheminform"},{"issue":"8","key":"220_CR30","doi-asserted-by":"crossref","first-page":"707","DOI":"10.1002\/minf.201100028","volume":"30","author":"N Jeliazkova","year":"2011","unstructured":"Jeliazkova N, Kochev N (2011) AMBIT-SMARTS: efficient searching of chemical structures and fragments. Mol Inform 30(8):707\u2013720","journal-title":"Mol Inform"},{"issue":"5\u20136","key":"220_CR31","doi-asserted-by":"publisher","first-page":"481","DOI":"10.1002\/minf.201200133","volume":"32","author":"NT Kochev","year":"2013","unstructured":"Kochev NT, Paskaleva VH, Jeliazkova N (2013) Ambit-Tautomer: an open source tool for tautomer generation. Mol Inform 32(5\u20136):481\u2013504","journal-title":"Mol Inform"},{"issue":"7583","key":"220_CR32","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1038\/nature16440","volume":"528","author":"CJ Marth","year":"2015","unstructured":"Marth CJ, Gallego GM, Lee JC, Lebold TP, Kulyk S, Kou KGM et al (2015) Network-analysis-guided synthesis of weisaconitine D and liljestrandinine. Nature 528(7583):493\u2013498","journal-title":"Nature"},{"key":"220_CR33","doi-asserted-by":"publisher","first-page":"6118","DOI":"10.1002\/chem.201604556","volume":"23","author":"MHS Segler","year":"2017","unstructured":"Segler MHS, Waller MP (2017) Modelling chemical reasoning to predict and invent reactions. Chem. Eur. J. 23:6118\u20136128","journal-title":"Chem Eur J"},{"issue":"1","key":"220_CR34","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1186\/s13321-016-0151-5","volume":"8","author":"J Alvarsson","year":"2016","unstructured":"Alvarsson J, Lampa S, Schaal W, Andersson C, Wikberg JES, Spjuth O (2016) Large-scale ligand-based predictive modelling using support vector machines. J Cheminform. 8(1):39","journal-title":"J Cheminform."},{"issue":"1","key":"220_CR35","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1186\/s13321-014-0038-2","volume":"6","author":"A Clark","year":"2014","unstructured":"Clark A, Sarker M, Ekins S (2014) New target prediction and visualization tools incorporating open source molecular fingerprints for TB Mobile 2.0. J Cheminform 6(1):38","journal-title":"J Cheminform"},{"key":"220_CR36","first-page":"173","volume-title":"Computational life sciences II. vol. 4216 of Lecture Notes in Computer Science","author":"E Cannon","year":"2006","unstructured":"Cannon E, Mitchell JBO (2006) Classifying the World Anti-Doping Agency\u2019s 2005 prohibited list using the Chemistry Development Kit fingerprint. In: Berthold MR, Glen R, Fischer I (eds) Computational life sciences II. vol. 4216 of Lecture Notes in Computer Science. Springer, Berlin, pp 173\u2013182"},{"issue":"1","key":"220_CR37","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1186\/1758-2946-5-14","volume":"5","author":"O Spjuth","year":"2013","unstructured":"Spjuth O, Berg A, Adams S, Willighagen EL (2013) Applications of the InChI in cheminformatics with the CDK and Bioclipse. J Cheminform 5(1):14","journal-title":"J Cheminform"},{"issue":"1","key":"220_CR38","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/1758-2946-6-3","volume":"6","author":"JW May","year":"2014","unstructured":"May JW, Steinbeck C (2014) Efficient ring perception for the Chemistry Development Kit. J Cheminform 6(1):3","journal-title":"J Cheminform"},{"key":"220_CR39","unstructured":"May JW (2014) Mischievous SMARTS Queries. http:\/\/efficientbits.blogspot.co.uk\/2014_03_01_archive.html"},{"key":"220_CR40","unstructured":"May JW (2015) Cheminformatics for genome-scale metabolic reconstructions. University of Cambridge. https:\/\/www.repository.cam.ac.uk\/handle\/1810\/246652"},{"key":"220_CR41","first-page":"30","volume":"7","author":"K Karapetyan","year":"2015","unstructured":"Karapetyan K, Batchelor C, Sharpe D, Tkachenko V, Williams A (2015) The Chemical Validation and Standardization Platform (CVSP): large-scale automated validation of chemical structure datasets. J Stat Softw 7:30","journal-title":"J Stat Softw"},{"issue":"3","key":"220_CR42","doi-asserted-by":"publisher","first-page":"707","DOI":"10.1021\/ci020345w","volume":"43","author":"JL Faulon","year":"2003","unstructured":"Faulon JL, Visco J, Donald P, Pophale RS (2003) The signature molecular descriptor. 1. Using extended valence sequences in QSAR and QSPR studies. J Chem Inf Comput Sci 43(3):707\u2013720","journal-title":"J Chem Inf Comput Sci"},{"issue":"2","key":"220_CR43","doi-asserted-by":"publisher","first-page":"427","DOI":"10.1021\/ci0341823","volume":"44","author":"JL Faulon","year":"2004","unstructured":"Faulon JL, Collins MJ, Carr RD (2004) The signature molecular descriptor. 4. Canonizing molecules using extended valence sequences. J Chem Inf Comput Sci 44(2):427\u2013436","journal-title":"J Chem Inf Comput Sci"},{"issue":"10","key":"220_CR44","doi-asserted-by":"publisher","first-page":"2647","DOI":"10.1021\/ci500361u","volume":"54","author":"J Alvarsson","year":"2014","unstructured":"Alvarsson J, Eklund M, Engkvist O, Spjuth O, Carlsson L, Wikberg JES et al (2014) Ligand-Based target prediction with signature fingerprints. J Chem Inf Model 54(10):2647\u20132653","journal-title":"J Chem Inf Model"},{"issue":"8","key":"220_CR45","doi-asserted-by":"publisher","first-page":"18407","DOI":"10.1021\/ci200242c","volume":"51","author":"O Spjuth","year":"2011","unstructured":"Spjuth O, Eklund M, Ahlberg Helgee E, Boyer S, Carlsson L (2011) Integrated decision support for assessing chemical liabilities. J Chem Inf Model 51(8):18407","journal-title":"J Chem Inf Model"},{"issue":"1","key":"220_CR46","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1021\/ci500580y","volume":"55","author":"BT Moghadam","year":"2015","unstructured":"Moghadam BT, Alvarsson J, Holm M, Eklund M, Carlsson L, Spjuth O (2015) Scaling predictive modeling in drug development with cloud computing. J Chem Inf Model 55(1):19\u201325","journal-title":"J Chem Inf Model"},{"issue":"11","key":"220_CR47","doi-asserted-by":"publisher","first-page":"32117","DOI":"10.1021\/ci500344v","volume":"54","author":"J Alvarsson","year":"2014","unstructured":"Alvarsson J, Eklund M, Andersson C, Carlsson L, Spjuth O, Wikberg JES (2014) Benchmarking study of parameter variation when using signature fingerprints together with support vector machines. J Chem Inf Model 54(11):32117","journal-title":"J Chem Inf Model"},{"issue":"18","key":"220_CR48","doi-asserted-by":"publisher","first-page":"1980","DOI":"10.2174\/156802612804910287","volume":"12","author":"O Spjuth","year":"2012","unstructured":"Spjuth O, Carlsson L, Alvarsson J, Georgiev V, Willighagen E, Eklund M (2012) Open source drug discovery with bioclipse. Curr Top Med Chem 12(18):1980\u20131986","journal-title":"Curr Top Med Chem"},{"issue":"1","key":"220_CR49","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1016\/j.bmcl.2012.10.102","volume":"23","author":"U Norinder","year":"2013","unstructured":"Norinder U, Ek ME (2013) QSAR investigation of NaV1.7 active compounds using the SVM\/signature approach and the bioclipse modeling platform. Bioorg Med Chem Lett 23(1):261\u2013263","journal-title":"Bioorg Med Chem Lett"},{"issue":"1","key":"220_CR50","doi-asserted-by":"publisher","first-page":"8","DOI":"10.1186\/1758-2946-2-8","volume":"2","author":"AM Clark","year":"2010","unstructured":"Clark AM (2010) Basic primitives for molecular diagram sketching. J Cheminform 2(1):8","journal-title":"J Cheminform"},{"issue":"3","key":"220_CR51","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1002\/minf.201200171","volume":"32","author":"AM Clark","year":"2013","unstructured":"Clark AM (2013) Rendering molecular sketches for publication quality output. Mol Inform 32(3):291\u2013301","journal-title":"Mol Inform"},{"key":"220_CR52","volume-title":"Structure diagram generation","author":"HE Helson","year":"2007","unstructured":"Helson HE (2007) Structure diagram generation. Wiley, Oxford"},{"issue":"17","key":"220_CR53","doi-asserted-by":"publisher","first-page":"2376","DOI":"10.1093\/bioinformatics\/btr409","volume":"27","author":"M Rojas-Chert\u00f3","year":"2011","unstructured":"Rojas-Chert\u00f3 M, Kasper PT, Willighagen EL, Vreeken RJ, Hankemeier T, Reijmers TH (2011) Elemental composition determination based on MSn. Bioinformatics 27(17):2376\u20132383","journal-title":"Bioinformatics"},{"issue":"10","key":"220_CR54","doi-asserted-by":"publisher","first-page":"4396","DOI":"10.1021\/ac3000418","volume":"84","author":"T Pluskal","year":"2012","unstructured":"Pluskal T, Uehara T, Yanagida M (2012) Highly accurate chemical formula prediction tool utilizing high-resolution mass spectra, MS\/MS fragmentation, heuristic rules, and isotope pattern matching. Anal Chem 84(10):4396\u20134403","journal-title":"Anal Chem"},{"issue":"1","key":"220_CR55","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1471-2105-11-395","volume":"11","author":"T Pluskal","year":"2010","unstructured":"Pluskal T, Castillo S, Villar-Briones A, Ore\u0161i\u010d M (2010) MZmine 2: modular framework for processing, visualizing, and analyzing mass spectrometry-based molecular profile data. BMC Bioinform 11(1):1\u201311","journal-title":"BMC Bioinform"},{"issue":"41","key":"220_CR56","doi-asserted-by":"publisher","first-page":"12580","DOI":"10.1073\/pnas.1509788112","volume":"112","author":"K D\u00fchrkop","year":"2015","unstructured":"D\u00fchrkop K, Shen H, Meusel M, Rousu J, B\u00f6cker S (2015) Searching molecular structure databases with tandem mass spectra using CSI:FingerID. Proc Natl Acad Sci 112(41):12580\u201312585","journal-title":"Proc Natl Acad Sci"},{"issue":"2","key":"220_CR57","doi-asserted-by":"publisher","first-page":"218","DOI":"10.1093\/bioinformatics\/btn603","volume":"25","author":"S B\u00f6cker","year":"2009","unstructured":"B\u00f6cker S, Letzel MC, Lipt\u00e1k Z, Pervukhin A (2009) SIRIUS: decomposing isotope patterns for metabolite identification. Bioinformatics 25(2):218\u2013224","journal-title":"Bioinformatics"},{"key":"220_CR58","volume-title":"Knapsack problems: algorithms and computer implementations","author":"S Martello","year":"1990","unstructured":"Martello S, Toth P (1990) Knapsack problems: algorithms and computer implementations. Wiley, New York"},{"key":"220_CR59","doi-asserted-by":"crossref","unstructured":"D\u00fchrkop K, Ludwig M, Meusel M, B\u00f6cker S (2013) Faster mass decomposition. In: Proceedings of workshop on algorithms in bioinformatics (WABI 2013). Springer, pp 45\u201358. http:\/\/arxiv.org\/abs\/1307.7805","DOI":"10.1007\/978-3-642-40453-5_5"},{"issue":"4","key":"220_CR60","doi-asserted-by":"publisher","first-page":"591","DOI":"10.1093\/bioinformatics\/btm631","volume":"24","author":"S B\u00f6cker","year":"2008","unstructured":"B\u00f6cker S, Lipt\u00e1k Z, Martin M, Pervukhin A, Sudek H (2008) DECOMP from interpreting mass spectrometry peaks to solving the money changing problem. Bioinformatics 24(4):591\u2013593","journal-title":"Bioinformatics"},{"key":"220_CR61","doi-asserted-by":"crossref","unstructured":"B\u00f6cker S, Lipt\u00e1k Z (2005) Efficient mass decomposition. In: Proceedings of the 2005 ACM symposium on applied computing. ACM, pp 151\u2013157","DOI":"10.1145\/1066677.1066715"},{"issue":"1","key":"220_CR62","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1471-2105-8-105","volume":"8","author":"T Kind","year":"2007","unstructured":"Kind T, Fiehn O (2007) Seven golden rules for heuristic filtering of molecular formulas obtained by accurate mass spectrometry. BMC Bioinform 8(1):1\u201320","journal-title":"BMC Bioinform"},{"key":"220_CR63","doi-asserted-by":"publisher","first-page":"106","DOI":"10.1016\/j.chemolab.2016.03.002","volume":"153","author":"M Zhang","year":"2016","unstructured":"Zhang M, Zhang Z, Chen C, Lu H, Liang Y (2016) Parallel formula generator based on branch-and-bound algorithm for elucidating high resolution mass spectra. Chemometr Intell Lab Syst 153:106\u2013109","journal-title":"Chemometr Intell Lab Syst"},{"issue":"8","key":"220_CR64","doi-asserted-by":"publisher","first-page":"828","DOI":"10.1038\/nbt.3597","volume":"34","author":"M Wang","year":"2016","unstructured":"Wang M, Carver JJ, Phelan VV, Sanchez LM, Garg N, Peng Y et al (2016) Sharing and community curation of mass spectrometry data with Global Natural Products Social Molecular Networking. Nat Biotechnol 34(8):828\u2013837","journal-title":"Nat Biotechnol"},{"issue":"1","key":"220_CR65","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1021\/ci00057a005","volume":"28","author":"D Weininger","year":"1988","unstructured":"Weininger D (1988) SMILES, a chemical language and information system. 1. Introduction to methodology and encoding rules. J Chem Inf Comput Sci 28(1):31\u201336","journal-title":"J Chem Inf Comput Sci"},{"key":"220_CR66","unstructured":"May JW (2013) Beam. GitHub . https:\/\/github.com\/johnmay\/beam"},{"key":"220_CR67","unstructured":"ChemAxon Extended SMILES. http:\/\/onlinelibrarystatic.wiley.com\/marvin\/help\/formats\/cxsmiles-doc.html"},{"key":"220_CR68","unstructured":"May JW (2013) All the small things. http:\/\/efficientbits.blogspot.co.uk\/2013\/10\/all-small-things.html"},{"key":"220_CR69","unstructured":"May JW (2013) Improved substructure matching. http:\/\/efficientbits.blogspot.co.uk\/2013\/11\/improved-substructure-matching.html"},{"issue":"2","key":"220_CR70","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1021\/ci030405d","volume":"44","author":"F Berger","year":"2004","unstructured":"Berger F, Flamm C, Gleiss PM, Leydold J, Stadler PF (2004) Counterexamples in chemical ring perception. J Chem Inf Comput Sci 44(2):323\u2013331","journal-title":"J Chem Inf Comput Sci"},{"issue":"5","key":"220_CR71","doi-asserted-by":"publisher","first-page":"986","DOI":"10.1021\/ci960013p","volume":"36","author":"J Figueras","year":"1996","unstructured":"Figueras J (1996) Ring perception using breadth-first search. J Chem Inf Comput Sci 36(5):986\u2013991","journal-title":"J Chem Inf Comput Sci"},{"key":"220_CR72","unstructured":"Daylight Chemical Information Systems Inc. http:\/\/www.daylight.com"},{"issue":"3","key":"220_CR73","doi-asserted-by":"publisher","first-page":"244","DOI":"10.1021\/ci00007a012","volume":"32","author":"A Dalby","year":"1992","unstructured":"Dalby A, Nourse JG, Hounshell WD, Gushurst AKI, Grier DL, Leland BA et al (1992) Description of several chemical structure file formats used by computer programs developed at Molecular Design Limited. J Chem Inf Comput Sci 32(3):244\u2013255","journal-title":"J Chem Inf Comput Sci"},{"key":"220_CR74","unstructured":"CTfile Formats. http:\/\/accelrys.com\/products\/collaborative-science\/biovia-draw\/ctfile-no-fee.html"},{"issue":"4","key":"220_CR75","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1021\/ci00004a003","volume":"31","author":"AJ Gushurst","year":"1991","unstructured":"Gushurst AJ, Nourse JG, Hounshell WD, Leland BA, Raich DG (1991) The substance module: the representation, storage, and searching of complex structures. J Chem Inf Comput Sci 31(4):447\u2013454","journal-title":"J Chem Inf Comput Sci"},{"issue":"1","key":"220_CR76","doi-asserted-by":"publisher","first-page":"93","DOI":"10.3390\/50100093","volume":"5","author":"S Krause","year":"2000","unstructured":"Krause S, Willighagen E, Steinbeck C (2000) JChemPaint\u2014using the collaborative forces of the internet to develop a free editor for 2D chemical structures. Molecules 5(1):93\u201398","journal-title":"Molecules"},{"key":"220_CR77","doi-asserted-by":"publisher","unstructured":"Willighagen E, Howard M (2007) Fast and scriptable molecular graphics in web browsers without Java3D. Nature Precedings. doi: 10.1038\/npre.2007.50.1","DOI":"10.1038\/npre.2007.50.1"},{"key":"220_CR78","doi-asserted-by":"publisher","first-page":"1250","DOI":"10.1107\/S0021889810030256","volume":"43","author":"RM Hanson","year":"2010","unstructured":"Hanson RM (2010) Jmol\u2014a paradigm shift in crystallographic visualization. J Appl Crystallogr 43:1250\u20131260","journal-title":"J Appl Crystallogr"},{"key":"220_CR79","unstructured":"Linux kernel, Version numbering. https:\/\/en.wikipedia.org\/wiki\/Linux_kernel#Version_numbering"},{"key":"220_CR80","unstructured":"Willighagen EL (2011) Groovy Cheminformatics with the Chemistry Development Kit. 1.4.1-0 ed. Figshare. https:\/\/doi.org\/10.6084\/m9.figshare.2057790.v1"},{"issue":"D1","key":"220_CR81","doi-asserted-by":"publisher","first-page":"D456","DOI":"10.1093\/nar\/gks1146","volume":"41","author":"J Hastings","year":"2013","unstructured":"Hastings J, de Matos P, Dekker A, Ennis M, Harsha B, Kale N et al (2013) The ChEBI reference database and ontology for biologically relevant chemistry: enhancements for 2013. Nucleic Acids Res 41(D1):D456.","journal-title":"Nucleic Acids Res"},{"issue":"D1","key":"220_CR82","doi-asserted-by":"publisher","first-page":"D1083","DOI":"10.1093\/nar\/gkt1031","volume":"42","author":"AP Bento","year":"2014","unstructured":"Bento AP, Gaulton A, Hersey A, Bellis LJ, Chambers J, Davies M et al (2014) The ChEMBL bioactivity database: an update. Nucleic Acids Res 42(D1):D1083.","journal-title":"Nucleic Acids Res"},{"issue":"1","key":"220_CR83","doi-asserted-by":"publisher","first-page":"P36","DOI":"10.1186\/1758-2946-5-S1-P36","volume":"5","author":"A Dalke","year":"2013","unstructured":"Dalke A (2013) The FPS fingerprint format and chemfp toolkit. J Cheminform 5(1):P36.","journal-title":"J Cheminform"},{"issue":"1","key":"220_CR84","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1186\/s13321-016-0148-0","volume":"8","author":"NM O\u2019Boyle","year":"2016","unstructured":"O\u2019Boyle NM, Sayle RA (2016) Comparing structural fingerprints using a literature-based similarity benchmark. J Cheminform 8(1):36.","journal-title":"J Cheminform"},{"key":"220_CR85","unstructured":"Authors (2015) https:\/\/github.com\/cdk\/cdk\/blob\/master\/pom.xml"},{"issue":"5","key":"220_CR86","doi-asserted-by":"publisher","first-page":"742","DOI":"10.1021\/ci100050t","volume":"50","author":"D Rogers","year":"2010","unstructured":"Rogers D, Hahn M (2010) Extended-connectivity fingerprints. J Chem Inf Model 50(5):742\u2013754","journal-title":"J Chem Inf Model"},{"key":"220_CR87","doi-asserted-by":"publisher","first-page":"1039","DOI":"10.1021\/ci00028a014","volume":"35","author":"LH Hall","year":"1995","unstructured":"Hall LH, Kier LB (1995) Electrotopological state indices for atom types: a novel combination of electronic, topological, and valence state information. J Chem Inf Model 35:1039\u20131045","journal-title":"J Chem Inf Model"},{"issue":"21","key":"220_CR88","doi-asserted-by":"publisher","first-page":"251825","DOI":"10.1093\/bioinformatics\/btn479","volume":"24","author":"J Klekota","year":"2008","unstructured":"Klekota J, Roth FP (2008) Chemical substructures that enrich for biological activity. Bioinformatics 24(21):251825","journal-title":"Bioinformatics"},{"issue":"2","key":"220_CR89","doi-asserted-by":"publisher","first-page":"386","DOI":"10.1021\/ci0496797","volume":"45","author":"D Vidal","year":"2005","unstructured":"Vidal D, Thormann M, Pons M (2005) LINGO, an efficient holographic text based method to calculate biophysical properties and intermolecular similarities. J Chem Inf Model 45(2):386\u2013393","journal-title":"J Chem Inf Model"},{"key":"220_CR90","unstructured":"PubChem Substructure Fingerprint v1.3. ftp:\/\/ftp.ncbi.nlm.nih.gov\/pubchem\/specifications\/pubchem_fingerprints.txt [cited Friday 4 July 2014]"},{"issue":"1","key":"220_CR91","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1186\/1758-2946-3-44","volume":"3","author":"P Murray-Rust","year":"2011","unstructured":"Murray-Rust P, Rzepa HS (2011) CML: Evolution and design. J Cheminform 3(1):44","journal-title":"J Cheminform"},{"issue":"8","key":"220_CR92","doi-asserted-by":"publisher","first-page":"793","DOI":"10.1002\/jcc.540150802","volume":"15","author":"WD Ihlenfeldt","year":"1994","unstructured":"Ihlenfeldt WD, Gasteiger J (1994) Hash codes for the identification and classification of molecular structure elements. J Comput Chem 15(8):793\u2013813","journal-title":"J Comput Chem"},{"key":"220_CR93","unstructured":"Hicklin J, Moler C, Webb P, Boisvert RF, Miller B, Pozo R et\u00a0al (2012) JAMA: a Java Matrix Package. http:\/\/math.nist.gov\/javanumerics\/jama\/"}],"updated-by":[{"DOI":"10.1186\/s13321-017-0231-1","type":"erratum","label":"Erratum","source":"publisher","updated":{"date-parts":[[2017,9,20]],"date-time":"2017-09-20T00:00:00Z","timestamp":1505865600000}}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-017-0220-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13321-017-0220-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-017-0220-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:30:49Z","timestamp":1750293049000},"score":1,"resource":{"primary":{"URL":"https:\/\/jcheminf.biomedcentral.com\/articles\/10.1186\/s13321-017-0220-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,6,6]]},"references-count":93,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["220"],"URL":"https:\/\/doi.org\/10.1186\/s13321-017-0220-4","relation":{},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,6,6]]},"assertion":[{"value":"25 October 2016","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 May 2017","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 June 2017","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 September 2017","order":4,"name":"change_date","label":"Change Date","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Erratum","order":5,"name":"change_type","label":"Change Type","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"An erratum to this article has been published.","order":6,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"33"}}