{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,28]],"date-time":"2026-03-28T07:25:17Z","timestamp":1774682717994,"version":"3.50.1"},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T00:00:00Z","timestamp":1770854400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T00:00:00Z","timestamp":1770854400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/100010269","name":"Wellcome Trust","doi-asserted-by":"publisher","award":["104104\/A\/14\/Z"],"award-info":[{"award-number":["104104\/A\/14\/Z"]}],"id":[{"id":"10.13039\/100010269","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100010269","name":"Wellcome Trust","doi-asserted-by":"publisher","award":["228142\/Z\/23\/Z"],"award-info":[{"award-number":["228142\/Z\/23\/Z"]}],"id":[{"id":"10.13039\/100010269","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100010767","name":"Innovative Medicines Initiative","doi-asserted-by":"publisher","award":["875510"],"award-info":[{"award-number":["875510"]}],"id":[{"id":"10.13039\/501100010767","id-type":"DOI","asserted-by":"publisher"}]},{"name":"EMBL\u00b4s European Bioinformatics Institute (EMBL-EBI)"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"DOI":"10.1186\/s13321-026-01165-x","type":"journal-article","created":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T16:27:51Z","timestamp":1770913671000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Integrating artificial intelligence and manual curation to enhance 
bioassay annotations in ChEMBL"],"prefix":"10.1186","volume":"18","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-1772-6487","authenticated-orcid":false,"given":"Ines","family":"Smit","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2217-4629","authenticated-orcid":false,"given":"Melissa F.","family":"Adasme","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7875-1259","authenticated-orcid":false,"given":"Emma","family":"Manners","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1242-1481","authenticated-orcid":false,"given":"Sybilla","family":"Corbett","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3562-1328","authenticated-orcid":false,"given":"Nicolas","family":"Bosc","sequence":"additional","affiliation":[]},{"given":"Hoang-My-Anh","family":"Do","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8178-0253","authenticated-orcid":false,"given":"Andrew R.","family":"Leach","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4879-2003","authenticated-orcid":false,"given":"Noel M.","family":"O\u2019Boyle","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9395-1515","authenticated-orcid":false,"given":"Barbara","family":"Zdrazil","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,2,12]]},"reference":[{"key":"1165_CR1","doi-asserted-by":"publisher","first-page":"D1180","DOI":"10.1093\/nar\/gkad1004","volume":"52","author":"B Zdrazil","year":"2024","unstructured":"Zdrazil B, Felix E, Hunter F et al (2024) The ChEMBL database in 2023: a drug discovery platform spanning multiple bioactivity data types and time periods. Nucleic Acids Res 52:D1180\u2013D1192. 
https:\/\/doi.org\/10.1093\/nar\/gkad1004","journal-title":"Nucleic Acids Res"},{"key":"1165_CR2","doi-asserted-by":"publisher","DOI":"10.1038\/sdata.2016.18","volume":"3","author":"MD Wilkinson","year":"2016","unstructured":"Wilkinson MD, Dumontier M, Aalbersberg IjJ et al (2016) The FAIR guiding principles for scientific data management and stewardship. Sci Data 3:160018. https:\/\/doi.org\/10.1038\/sdata.2016.18","journal-title":"Sci Data"},{"key":"1165_CR3","doi-asserted-by":"publisher","first-page":"661","DOI":"10.1038\/nrd3503","volume":"10","author":"S Orchard","year":"2011","unstructured":"Orchard S, Al-Lazikani B, Bryant S et al (2011) Minimum information about a bioactive entity (MIABE). Nat Rev Drug Discov 10:661\u2013669. https:\/\/doi.org\/10.1038\/nrd3503","journal-title":"Nat Rev Drug Discov"},{"key":"1165_CR4","doi-asserted-by":"publisher","first-page":"D1373","DOI":"10.1093\/nar\/gkac956","volume":"51","author":"S Kim","year":"2023","unstructured":"Kim S, Chen J, Cheng T et al (2023) PubChem 2023 update. Nucleic Acids Res 51:D1373\u2013D1380. https:\/\/doi.org\/10.1093\/nar\/gkac956","journal-title":"Nucleic Acids Res"},{"key":"1165_CR5","doi-asserted-by":"publisher","DOI":"10.1186\/1471-2105-12-257","volume":"12","author":"U Visser","year":"2011","unstructured":"Visser U, Abeyruwan S, Vempati U et al (2011) BioAssay ontology (BAO): a semantic description of bioassays and high-throughput screening results. BMC Bioinformatics 12:257. https:\/\/doi.org\/10.1186\/1471-2105-12-257","journal-title":"BMC Bioinformatics"},{"key":"1165_CR6","unstructured":"The BioAssay Ontology (BAO). http:\/\/bioassayontology.org\/. Accessed 16 Jan 2025"},{"key":"1165_CR7","doi-asserted-by":"publisher","DOI":"10.1186\/2041-1480-5-S1-S5","volume":"5","author":"S Abeyruwan","year":"2014","unstructured":"Abeyruwan S, Vempati UD, K\u00fc\u00e7\u00fck-McGinty H et al (2014) Evolving BioAssay ontology (BAO): modularization, integration and applications. J Biomed Semantics 5:S5. 
https:\/\/doi.org\/10.1186\/2041-1480-5-S1-S5","journal-title":"J Biomed Semantics"},{"key":"1165_CR8","doi-asserted-by":"publisher","first-page":"1188","DOI":"10.1016\/j.drudis.2012.05.016","volume":"17","author":"AJ Williams","year":"2012","unstructured":"Williams AJ, Harland L, Groth P et al (2012) Open PHACTS: semantic interoperability for drug discovery. Drug Discov Today 17:1188\u20131198. https:\/\/doi.org\/10.1016\/j.drudis.2012.05.016","journal-title":"Drug Discov Today"},{"key":"1165_CR9","unstructured":"Pistoia Alliance DataFAIRy Bioassay Pilot\u2014PubChem Data Source. https:\/\/pubchem.ncbi.nlm.nih.gov\/source\/24682. Accessed 20 Jan 2026"},{"key":"1165_CR10","doi-asserted-by":"publisher","first-page":"224","DOI":"10.1016\/j.chembiol.2017.11.009","volume":"25","author":"J Tang","year":"2018","unstructured":"Tang J, Tanoli Z-R, Ravikumar B et al (2018) Drug Target Commons: A Community Effort to Build a Consensus Knowledge Base for Drug-Target Interactions. Cell Chem Biol 25:224-229.e2. https:\/\/doi.org\/10.1016\/j.chembiol.2017.11.009","journal-title":"Cell Chem Biol"},{"key":"1165_CR11","doi-asserted-by":"publisher","DOI":"10.1093\/bib\/bbab350","volume":"23","author":"Z Tanoli","year":"2022","unstructured":"Tanoli Z, Aldahdooh J, Alam F et al (2022) Minimal information for chemosensitivity assays (MICHA): a next-generation pipeline to enable the FAIRification of drug screening experiments. Brief Bioinform 23:bbab350. https:\/\/doi.org\/10.1093\/bib\/bbab350","journal-title":"Brief Bioinform"},{"key":"1165_CR12","doi-asserted-by":"publisher","DOI":"10.7717\/peerj.524","volume":"2","author":"AM Clark","year":"2014","unstructured":"Clark AM, Bunin BA, Litterman NK et al (2014) Fast and accurate semantic annotation of bioassays exploiting a hybrid of machine learning and user confirmation. PeerJ 2:e524. 
https:\/\/doi.org\/10.7717\/peerj.524","journal-title":"PeerJ"},{"key":"1165_CR13","unstructured":"cdd\/bioassay-express: BioAssay Express by Collaborative Drug Discovery. https:\/\/github.com\/cdd\/bioassay-express. Accessed 25 July 2025"},{"key":"1165_CR14","doi-asserted-by":"publisher","first-page":"7013","DOI":"10.1021\/acs.jcim.5c00603","volume":"65","author":"L Schoenmaker","year":"2025","unstructured":"Schoenmaker L, Sastrokarijo EG, Heitman LH et al (2025) Toward assay-aware bioactivity model(er)s: getting a grip on biological context. J Chem Inf Model 65:7013\u20137023. https:\/\/doi.org\/10.1021\/acs.jcim.5c00603","journal-title":"J Chem Inf Model"},{"key":"1165_CR15","doi-asserted-by":"publisher","first-page":"885","DOI":"10.1007\/s10822-015-9860-5","volume":"29","author":"G Papadatos","year":"2015","unstructured":"Papadatos G, Gaulton A, Hersey A, Overington JP (2015) Activity, assay and target data curation and quality in the ChEMBL database. J Comput Aided Mol Des 29:885\u2013896. https:\/\/doi.org\/10.1007\/s10822-015-9860-5","journal-title":"J Comput Aided Mol Des"},{"key":"1165_CR16","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0061007","volume":"8","author":"T Kalliokoski","year":"2013","unstructured":"Kalliokoski T, Kramer C, Vulpetti A, Gedeck P (2013) Comparability of mixed IC\u2085\u2080 data - a statistical analysis. PLoS ONE 8:e61007. https:\/\/doi.org\/10.1371\/journal.pone.0061007","journal-title":"PLoS ONE"},{"key":"1165_CR17","doi-asserted-by":"publisher","first-page":"1560","DOI":"10.1021\/acs.jcim.4c00049","volume":"64","author":"GA Landrum","year":"2024","unstructured":"Landrum GA, Riniker S (2024) Combining IC50 or Ki values from different sources is a source of significant noise. J Chem Inf Model 64:1560\u20131567. 
https:\/\/doi.org\/10.1021\/acs.jcim.4c00049","journal-title":"J Chem Inf Model"},{"key":"1165_CR18","doi-asserted-by":"publisher","first-page":"D609","DOI":"10.1093\/nar\/gkae1010","volume":"53","author":"UniProt Consortium","year":"2025","unstructured":"UniProt Consortium (2025) UniProt: the universal protein knowledgebase in 2025. Nucleic Acids Res 53:D609\u2013D617. https:\/\/doi.org\/10.1093\/nar\/gkae1010","journal-title":"Nucleic Acids Res"},{"key":"1165_CR19","doi-asserted-by":"publisher","DOI":"10.1186\/2041-1480-5-37","volume":"5","author":"S Sarntivijai","year":"2014","unstructured":"Sarntivijai S, Lin Y, Xiang Z et al (2014) CLO: the cell line ontology. J Biomed Semantics 5:37. https:\/\/doi.org\/10.1186\/2041-1480-5-37","journal-title":"J Biomed Semantics"},{"key":"1165_CR20","doi-asserted-by":"publisher","first-page":"1112","DOI":"10.1093\/bioinformatics\/btq099","volume":"26","author":"J Malone","year":"2010","unstructured":"Malone J, Holloway E, Adamusiak T et al (2010) Modeling sample variables with an Experimental Factor Ontology. Bioinformatics 26:1112\u20131118. https:\/\/doi.org\/10.1093\/bioinformatics\/btq099","journal-title":"Bioinformatics"},{"key":"1165_CR21","doi-asserted-by":"publisher","first-page":"25","DOI":"10.7171\/jbt.18-2902-002","volume":"29","author":"A Bairoch","year":"2018","unstructured":"Bairoch A (2018) The Cellosaurus, a cell-line knowledge resource. J Biomol Tech 29:25\u201338. https:\/\/doi.org\/10.7171\/jbt.18-2902-002","journal-title":"J Biomol Tech"},{"key":"1165_CR22","doi-asserted-by":"publisher","DOI":"10.1186\/s13326-016-0088-7","volume":"7","author":"AD Diehl","year":"2016","unstructured":"Diehl AD, Meehan TF, Bradford YM et al (2016) The Cell Ontology 2016: enhanced content, modularization, and ontology interoperability. J Biomed Semantics 7:44. 
https:\/\/doi.org\/10.1186\/s13326-016-0088-7","journal-title":"J Biomed Semantics"},{"key":"1165_CR23","doi-asserted-by":"publisher","first-page":"D431","DOI":"10.1093\/nar\/gkz1023","volume":"48","author":"V Stathias","year":"2020","unstructured":"Stathias V, Turner J, Koleti A et al (2020) LINCS data portal 2.0: next generation access point for perturbation-response signatures. Nucleic Acids Res 48:D431\u2013D439. https:\/\/doi.org\/10.1093\/nar\/gkz1023","journal-title":"Nucleic Acids Res"},{"key":"1165_CR24","doi-asserted-by":"publisher","DOI":"10.1186\/2041-1480-5-21","volume":"5","author":"MA Haendel","year":"2014","unstructured":"Haendel MA, Balhoff JP, Bastian FB et al (2014) Unification of multi-species vertebrate anatomy ontologies for comparative biology in Uberon. J Biomed Semantics 5:21. https:\/\/doi.org\/10.1186\/2041-1480-5-21","journal-title":"J Biomed Semantics"},{"key":"1165_CR25","doi-asserted-by":"publisher","first-page":"D507","DOI":"10.1093\/nar\/gkq968","volume":"39","author":"M Gremse","year":"2011","unstructured":"Gremse M, Chang A, Schomburg I et al (2011) The BRENDA Tissue Ontology (BTO): the first all-integrating ontology of all organisms for enzyme sources. Nucleic Acids Res 39:D507-513. https:\/\/doi.org\/10.1093\/nar\/gkq968","journal-title":"Nucleic Acids Res"},{"key":"1165_CR26","unstructured":"Bioregistry - CALIPHO Group Ontology of Human Anatomy. https:\/\/bioregistry.io\/registry\/caloha. Accessed 10 June 2025."},{"key":"1165_CR27","unstructured":"chembl_35_schema.png (PNG Image, 6139\u00a0\u00d7\u00a07557 pixels)\u2014Scaled (17%). https:\/\/ftp.ebi.ac.uk\/pub\/databases\/chembl\/ChEMBLdb\/latest\/chembl_35_schema.png. Accessed 10 June 2025."},{"key":"1165_CR28","unstructured":"Introduction | ChEMBL Data Deposition Guide. 2023. https:\/\/chembl.gitbook.io\/chembl-data-deposition-guide. 
Accessed 23 July 2025."},{"key":"1165_CR29","doi-asserted-by":"publisher","DOI":"10.1038\/sdata.2018.230","volume":"5","author":"FMI Hunter","year":"2018","unstructured":"Hunter FMI, L. Atkinson F, Bento AP et al (2018) A large-scale dataset of in vivo pharmacology assay results. Sci Data 5:180230. https:\/\/doi.org\/10.1038\/sdata.2018.230","journal-title":"Sci Data"},{"key":"1165_CR30","unstructured":"In search of the perfect assay description. In: In search of the perfect assay description. https:\/\/chembl.blogspot.com\/2023\/12\/in-search-of-perfect-assay-description.html. Accessed 10 June 2025."},{"key":"1165_CR31","doi-asserted-by":"publisher","DOI":"10.1039\/d4md00735b","author":"C Tredup","year":"2024","unstructured":"Tredup C, Ackloo S, Beck H et al (2024) Toward target 2035: EUbOPEN - a public-private partnership to enable & unlock biology in the open. RSC Med Chem. https:\/\/doi.org\/10.1039\/d4md00735b","journal-title":"RSC Med Chem"},{"key":"1165_CR32","unstructured":"NCBI Taxonomy. https:\/\/www.ncbi.nlm.nih.gov\/taxonomy. Accessed 16 Jan 2025."},{"key":"1165_CR33","unstructured":"ChemRxiv. Excuse me, there is a mutant in my bioactivity soup! A comprehensive analysis of the genetic variability landscape of bioactivity databases and its effect on activity modelling | Biological and Medicinal Chemistry | ChemRxiv | Cambridge Open Engage. https:\/\/chemrxiv.org\/engage\/chemrxiv\/article-details\/66729e49c9c6a5c07ad1b0a8. Accessed 1 July 2025."},{"key":"1165_CR34","unstructured":"Arunmozhi. 2025. https:\/\/github.com\/tecoholic\/ner-annotator. Accessed 23 July 2025."},{"key":"1165_CR35","doi-asserted-by":"publisher","DOI":"10.1093\/database\/baae119","volume":"2024","author":"RS Gon\u00e7alves","year":"2024","unstructured":"Gon\u00e7alves RS, Payne J, Tan A et al (2024) The text2term tool to map free-text descriptions of biomedical terms to ontologies. Database 2024:baae119. 
https:\/\/doi.org\/10.1093\/database\/baae119","journal-title":"Database"},{"key":"1165_CR36","unstructured":"Bioassay Annotations. https:\/\/ftp.ebi.ac.uk\/pub\/databases\/chembl\/assayannotation\/. Accessed 31 July 2025."},{"key":"1165_CR37","unstructured":"explosion\/projects. 2025. https:\/\/github.com\/explosion\/projects. Accessed 23 July 2025."},{"key":"1165_CR38","unstructured":"BioAssay Ontology|NCBO BioPortal. https:\/\/bioportal.bioontology.org\/ontologies\/BAO. Accessed 23 July 2025."}],"updated-by":[{"DOI":"10.1186\/s13321-026-01181-x","type":"correction","label":"Correction","source":"publisher","updated":{"date-parts":[[2026,3,27]],"date-time":"2026-03-27T00:00:00Z","timestamp":1774569600000}}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-026-01165-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13321-026-01165-x","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-026-01165-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,28]],"date-time":"2026-03-28T06:37:34Z","timestamp":1774679854000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1186\/s13321-026-01165-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,12]]},"references-count":38,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2026,12]]}},"alternative-id":["1165"],"URL":"https:\/\/doi.org\/10.1186\/s13321-026-01165-x","relation":{},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,2,12]]},"assertion":[{"value":"5 September 
2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"31 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 February 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 March 2026","order":5,"name":"change_date","label":"Change Date","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Correction","order":6,"name":"change_type","label":"Change Type","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"A Correction to this paper has been published:","order":7,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"https:\/\/doi.org\/10.1186\/s13321-026-01181-x","URL":"https:\/\/doi.org\/10.1186\/s13321-026-01181-x","order":8,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Barbara Zdrazil is Co-Editor-in-Chief of the\u00a0Journal of Cheminformatics.\u00a0B.Z. did not participate in the peer review or decision making process for this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"24"}}