{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,17]],"date-time":"2026-06-17T04:32:53Z","timestamp":1781670773632,"version":"3.54.5"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2011,10,14]],"date-time":"2011-10-14T00:00:00Z","timestamp":1318550400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/2.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"published-print":{"date-parts":[[2011,12]]},"DOI":"10.1186\/1758-2946-3-41","type":"journal-article","created":{"date-parts":[[2011,11,1]],"date-time":"2011-11-01T20:17:01Z","timestamp":1320178621000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":166,"title":["OSCAR4: a flexible architecture for chemical text-mining"],"prefix":"10.1186","volume":"3","author":[{"given":"David M","family":"Jessop","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Sam E","family":"Adams","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Egon L","family":"Willighagen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Lezan","family":"Hawizy","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Peter","family":"Murray-Rust","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2011,10,14]]},"reference":[{"key":"222_CR1","doi-asserted-by":"publisher","first-page":"544","DOI":"10.1021\/ci980324v","volume":"38","author":"N Kemp","year":"1998","unstructured":"Kemp N, Lynch M: Extraction of Information from the Text of Chemical Patents. 1. Identification of Specific Chemical Names. J Chem Inf Comput Sci. 1998, 38: 544-551. 10.1021\/ci980324v.","journal-title":"J Chem Inf Comput Sci"},{"key":"222_CR2","first-page":"176","volume-title":"Proc AMIA Symp","author":"WJ Wilbur","year":"1999","unstructured":"Wilbur WJ, Hazard JF, Divita G, Mork JG, Aronson AR, Browne AC: Analysis of Biomedical Text for Chemical Names: A Comparison of Three Methods. Proc AMIA Symp. 1999, 176-180."},{"issue":"Suppl. 2","key":"222_CR3","doi-asserted-by":"publisher","first-page":"S3","DOI":"10.1186\/1471-2105-7-S2-S3","volume":"7","author":"JF Wren","year":"2006","unstructured":"Wren JF: A scalable machine-learning approach to recognize chemical names within large text databases. BMC Bioinformatics. 2006, 7 (Suppl. 2): S3-","journal-title":"BMC Bioinformatics"},{"key":"222_CR4","doi-asserted-by":"publisher","first-page":"268","DOI":"10.1093\/bioinformatics\/btn181","volume":"24","author":"R Klinger","year":"2008","unstructured":"Klinger R, Kol\u00e1\u0159ik C, Fluck J, Hofmann-Apitius M, Friedrich CM: Detection of IUPAC and IUPAC-like chemical names. Bioinformatics. 2008, 24: 268-276. 10.1093\/bioinformatics\/btn181.","journal-title":"Bioinformatics"},{"key":"222_CR5","doi-asserted-by":"publisher","first-page":"2983","DOI":"10.1093\/bioinformatics\/btp535","volume":"25","author":"KM Hettne","year":"2009","unstructured":"Hettne KM, Stierum RH, Schuemie MJ, Hendriksen PJM, Schijvenaars BJA, van Mulligen EM, Kleinjans J, Kors JA: A dictionary to identify small molecules and drugs in free text. Bioinformatics. 2009, 25: 2983-2991. 10.1093\/bioinformatics\/btp535.","journal-title":"Bioinformatics"},{"key":"222_CR6","doi-asserted-by":"publisher","first-page":"263","DOI":"10.1021\/ci800332w","volume":"49","author":"D Jiao","year":"2009","unstructured":"Jiao D, Wild DJ: Extraction of CYP Chemical Interactions from Biomedical Literature Using Natural Language Processing Methods. J Chem Inf Comput Sci. 2009, 49: 263-269. 10.1021\/ci800332w.","journal-title":"J Chem Inf Comput Sci"},{"key":"222_CR7","first-page":"51","volume-title":"Proceedings of the Workshop on building and evaluating resources for biomedical text mining (6th edition of the Language Resources and Evaluation Conference","author":"C Kol\u00e1\u0159ik","year":"2008","unstructured":"Kol\u00e1\u0159ik C, Klinger R, Friedrich CM, Hofmann-Apitius M, Fluck J: Chemical Names: Terminological Resources and Corpora Annotation. Proceedings of the Workshop on building and evaluating resources for biomedical text mining (6th edition of the Language Resources and Evaluation Conference. 2008, Marrakech, Marokko, 51-58."},{"key":"222_CR8","doi-asserted-by":"publisher","first-page":"942","DOI":"10.1007\/978-3-642-02481-8_144","volume-title":"Distributed Computing, Artificial Intelligence, Bioinformatics, Soft Computing, and Ambient Assisted Living","author":"T Grego","year":"2009","unstructured":"Grego T, Pezik P, Couto FM, Rebholz-Chuhmann D: Identification of Chemical Entities in Patent Documents. Distributed Computing, Artificial Intelligence, Bioinformatics, Soft Computing, and Ambient Assisted Living. 2009, Berlin, Germany. Springer-Verlag, 942-949."},{"key":"222_CR9","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1186\/1758-2946-2-3","volume":"2","author":"KM Hettne","year":"2010","unstructured":"Hettne KM, Williams AJ, van Mulligen EM, Kleinjans J, Tkachenko V, Kors JA: Automatic vs manual curation of a multi-source chemical dictionary: the impact on text mining. Journal of Cheminformatics. 2010, 2: 3-10.1186\/1758-2946-2-3.","journal-title":"Journal of Cheminformatics"},{"key":"222_CR10","first-page":"152","volume-title":"Advances in Multidisciplinary Retrieval","author":"B M\u00fcller","year":"2006","unstructured":"M\u00fcller B, Klinger R, Gurulingappa H, Mevissen H, Hofmann-Apitius M, Fluck J, Friedrich CM: Abstracts versus Full Texts and Patents: A Quantitative Analysis of Biomedical Entities. Advances in Multidisciplinary Retrieval. 2006, Springer-Verlag, 152-165."},{"key":"222_CR11","doi-asserted-by":"publisher","first-page":"Article 12","DOI":"10.1145\/1961209.1961215","volume":"29","author":"B Sun","year":"2011","unstructured":"Sun B, Mitra P, Giles CL, Mueller KT: Identifying, Indexing and Ranking Chemical Formulae and Chemical Names in Digital Documents. ACM Trans. Inf. Syst. 2011, 29: Article 12-","journal-title":"ACM Trans. Inf. Syst"},{"key":"222_CR12","doi-asserted-by":"publisher","first-page":"739","DOI":"10.1021\/ci100384d","volume":"51","author":"DM Lowe","year":"2011","unstructured":"Lowe DM, Corbett PT, Murray-Rust P, Glen RC: Chemical name to structure: OPSIN, an open source solution. J Chem Inf Model. 2011, 51: 739-753. 10.1021\/ci100384d.","journal-title":"J Chem Inf Model"},{"key":"222_CR13","unstructured":"OPSIN, Open Parser for Systematic IUPAC Nomenclature. Accessed 2011-06-15, [http:\/\/opsin.ch.cam.ac.uk\/]"},{"key":"222_CR14","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1186\/1758-2946-3-17","volume":"3","author":"L Hawizy","year":"2011","unstructured":"Hawizy L, Jessop DM, Adams N, Murray-Rust P: ChemicalTagger: A tool for semantic text-mining in chemistry. J Cheminf. 2011, 3: 17-10.1186\/1758-2946-3-17.","journal-title":"J Cheminf"},{"key":"222_CR15","unstructured":"ChemicalTagger. Accessed 2011-06-15, [http:\/\/chemicaltagger.ch.cam.ac.uk\/]"},{"key":"222_CR16","doi-asserted-by":"publisher","first-page":"3067","DOI":"10.1039\/b411699m","volume":"2","author":"SE Adams","year":"2004","unstructured":"Adams SE, Goodman JM, Kidd RJ, McNaught AD, Murray-Rust P, Norton FR, Townsend JA, Waudby CA: Experimental data checker: better information for organic chemists. Org Biomol Chem. 2004, 2: 3067-3070. 10.1039\/b411699m.","journal-title":"Org Biomol Chem"},{"key":"222_CR17","unstructured":"RSC Experimental Data Checker. Accessed 2011-06-15, [http:\/\/www.rsc.org\/Publishing\/Journals\/guidelines\/AuthorGuidelines\/AuthoringTools\/ExperimentalDataChecker\/index.asp]"},{"key":"222_CR18","first-page":"107","volume-title":"Computational Life Sciences II, Second International Symposium, CompLife 2006 Cambridge, UK, September 27-29, 2006, Proceedings. Lecture Notes in Computer Science","author":"P Corbett","year":"2006","unstructured":"Corbett P, Murray-Rust P: High-Throughput Identification of Chemistry in Life Science Texts. Computational Life Sciences II, Second International Symposium, CompLife 2006 Cambridge, UK, September 27-29, 2006, Proceedings. Lecture Notes in Computer Science. Edited by: Berthold MR, Glen RC, Fischer I. 2006, Heidelberg: Springer, 107-118."},{"issue":"Suppl 11","key":"222_CR19","doi-asserted-by":"publisher","first-page":"S4","DOI":"10.1186\/1471-2105-9-S11-S4","volume":"9","author":"P Corbett","year":"2008","unstructured":"Corbett P, Copestake A: Cascaded classifiers for confidence-based chemical named entity recognition. BMC Bioinformatics. 2008, 9 (Suppl 11): S4-10.1186\/1471-2105-9-S11-S4.","journal-title":"BMC Bioinformatics"},{"key":"222_CR20","unstructured":"UIMA. Accessed 2011-06-15, [http:\/\/uima.apache.org\/]"},{"key":"222_CR21","unstructured":"U-Compare. Accessed 2011-06-15, [http:\/\/u-compare.org\/]"},{"key":"222_CR22","doi-asserted-by":"publisher","first-page":"1997","DOI":"10.1093\/bioinformatics\/btp289","volume":"25","author":"Y Kano","year":"2009","unstructured":"Kano Y, Baumgartner W, McCrohon L, Ananiadou S, Cohen KB, Hunter L, Tsujii J: U-compare: Share and compare text mining tools with UIMA. Bioinformatics. 2009, 25: 1997-1998. 10.1093\/bioinformatics\/btp289.","journal-title":"Bioinformatics"},{"key":"222_CR23","doi-asserted-by":"publisher","first-page":"e20181","DOI":"10.1371\/journal.pone.0020181","volume":"6","author":"B Kolluru","year":"2011","unstructured":"Kolluru B, Hawizy L, Murray-Rust P, Tsuji J, Ananiadou S: Using workflows to explore and optimise named entity recognition for chemistry. PLoS ONE. 2011, 6: e20181-10.1371\/journal.pone.0020181.","journal-title":"PLoS ONE"},{"key":"222_CR24","volume-title":"PhD thesis","author":"DM Jessop","year":"2011","unstructured":"Jessop DM: Information extraction from chemical patents. PhD thesis. 2011, University of Cambridge: Cambridge, UK"},{"key":"222_CR25","doi-asserted-by":"publisher","first-page":"40","DOI":"10.1186\/1758-2946-3-40","volume":"3","author":"DM Jessop","year":"2011","unstructured":"Jessop DM, Adams SE, Murray-Rust P: Mining chemical information from Open patents. J Cheminf. 2011, 3: 40-10.1186\/1758-2946-3-S1-P40.","journal-title":"J Cheminf"},{"key":"222_CR26","first-page":"12","volume-title":"Chemistry International","author":"A McNaught","year":"2006","unstructured":"McNaught A: The IUPAC International Chemical Identifier. Chemistry International. 2006, 12-14. November-December"},{"key":"222_CR27","unstructured":"IUPAC International Chemical Indentifier. Accessed 2011-06-15, [http:\/\/www.iupac.org\/inchi\/]"},{"key":"222_CR28","doi-asserted-by":"crossref","unstructured":"Hearst MA: Automatic acquisition of hyponyms from large text corpora. COLING '92 Proceedings of the 14th conference on Computational linguistics-Volume. 2: 539-545.","DOI":"10.3115\/992133.992154"},{"key":"222_CR29","unstructured":"YourKit java profiler. Accessed 2011-06-15, [http:\/\/www.yourkit.com\/]"},{"key":"222_CR30","unstructured":"OSCAR3 alpha 5. Accessed 2011-06-15, [http:\/\/sourceforge.net\/projects\/oscar3-chem\/]"},{"key":"222_CR31","first-page":"57","volume-title":"Proceedings of BioNLP 2007: Biological, translational, and clinical language processing (ACL 2007 workshop)","author":"P Corbett","year":"2007","unstructured":"Corbett P, Batchelor C, Teufel S: Annotation of Chemical Named Entities. Proceedings of BioNLP 2007: Biological, translational, and clinical language processing (ACL 2007 workshop). 2007, 57-64."},{"key":"222_CR32","doi-asserted-by":"crossref","unstructured":"Taverna. Accessed 2011-06-15, [http:\/\/www.taverna.org.uk\/]","DOI":"10.1590\/S1413-85572011000200018"},{"key":"222_CR33","unstructured":"Bioclipse. Accessed 2011-06-15, [http:\/\/www.bioclipse.net\/]"},{"key":"222_CR34","unstructured":"OSCAR4 Launch. Accessed 2011-06-15, [http:\/\/sms.cam.ac.uk\/collection\/1130934]"},{"key":"222_CR35","doi-asserted-by":"publisher","first-page":"2111","DOI":"10.2174\/138161206777585274","volume":"12","author":"C Steinbeck","year":"2006","unstructured":"Steinbeck C, Hoppe C, Kuhn S, Floris M, Guha R, Willighagen EL: Recent Developments of the Chemistry Development Kit (CDK)-An Open-Source Java Library for Chemo- and Bioinformatics. Curr Pharm Des. 2006, 12: 2111-2120. 10.2174\/138161206777585274.","journal-title":"Curr Pharm Des"},{"key":"222_CR36","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1021\/ci025584y","volume":"43","author":"C Steinbeck","year":"2003","unstructured":"Steinbeck C, Han Y, Kuhn S, Horlacher O, Luttman E, Willighagen E: The Chemistry Development Kit (CDK): An Open-Source Java Library for Chemo- and Bioinformatics. J Chem Inf Comput Sci. 2003, 43: 493-500. 10.1021\/ci025584y.","journal-title":"J Chem Inf Comput Sci"},{"key":"222_CR37","unstructured":"Chemical Development Kit (CDK). Accessed 2011-06-15, [http:\/\/sourceforge.net\/projects\/cdk\/]"},{"issue":"Suppl. 1","key":"222_CR38","first-page":"D344","volume":"36","author":"K Degtyarenko","year":"2008","unstructured":"Degtyarenko K, de Matos P, Ennis M, Hastings J, Zbinden M, McNaught A, Alcantara R, Darsow M, Guedj M, Ashburner M: ChEBI: a database and ontology for chemical entities of biological interest. Nucl Acids Res. 2008, 36 (Suppl. 1): D344-D350.","journal-title":"Nucl Acids Res"},{"issue":"Suppl. 1","key":"222_CR39","first-page":"D249","volume":"38","author":"P de Matos","year":"2009","unstructured":"de Matos P, Alc\u00e1ntara R, Dekker A, Ennis M, Hastings J, Haug K, Spiteri I, Turner S, Steinbeck C: Chemical Entities of Biological Interest: an update. Nucl Acids Res. 2009, 38 (Suppl. 1): D249-D254.","journal-title":"Nucl Acids Res"},{"key":"222_CR40","unstructured":"ChEBI. Accessed 2011-06-15, [http:\/\/www.ebi.ac.uk\/chebi\/]"},{"key":"222_CR41","unstructured":"FIX ontology. Accessed 2011-06-15, [http:\/\/www.berkeleybop.org\/ontologies\/owl\/FIX]"},{"key":"222_CR42","unstructured":"REX ontology. Accessed 2011-06-15, [http:\/\/www.berkeleybop.org\/ontologies\/owl\/REX]"},{"key":"222_CR43","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1021\/ci00057a005","volume":"28","author":"D Weininger","year":"1988","unstructured":"Weininger D: SMILES, a chemical language and information system. 1. Introduction to methodology and encoding rules. J Chem Inf Comput Sci. 1988, 28: 31-36. 10.1021\/ci00057a005.","journal-title":"J Chem Inf Comput Sci"},{"key":"222_CR44","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1021\/ci00062a008","volume":"29","author":"D Weininger","year":"1989","unstructured":"Weininger D, Weininger A, Weininger JL: SMILES. 2. Algorithm for generation of unique SMILES notation. J Chem Inf Comput Sci. 1989, 29: 97-101. 10.1021\/ci00062a008.","journal-title":"J Chem Inf Comput Sci"},{"key":"222_CR45","doi-asserted-by":"publisher","first-page":"928","DOI":"10.1021\/ci990052b","volume":"39","author":"P Murray-Rust","year":"1999","unstructured":"Murray-Rust P, Rzepa HS: Chemical Markup, XML and the Worldwide Web. 1. Basic Principles. J Chem Inf Comput Sci. 1999, 39: 928-942. 10.1021\/ci990052b.","journal-title":"J Chem Inf Comput Sci"}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/1758-2946-3-41.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/1758-2946-3-41\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/1758-2946-3-41.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,13]],"date-time":"2025-03-13T15:14:59Z","timestamp":1741878899000},"score":1,"resource":{"primary":{"URL":"https:\/\/jcheminf.biomedcentral.com\/articles\/10.1186\/1758-2946-3-41"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,10,14]]},"references-count":45,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2011,12]]}},"alternative-id":["222"],"URL":"https:\/\/doi.org\/10.1186\/1758-2946-3-41","relation":{},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2011,10,14]]},"assertion":[{"value":"23 June 2011","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 October 2011","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 October 2011","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"41"}}