{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T08:00:26Z","timestamp":1776844826605,"version":"3.51.2"},"reference-count":25,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T00:00:00Z","timestamp":1760313600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T00:00:00Z","timestamp":1760313600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Cheminform"],"DOI":"10.1186\/s13321-025-01105-1","type":"journal-article","created":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T07:50:55Z","timestamp":1760341855000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Enhanced Thompson sampling by roulette wheel selection for screening ultralarge combinatorial libraries"],"prefix":"10.1186","volume":"17","author":[{"given":"Hongtao","family":"Zhao","sequence":"first","affiliation":[]},{"given":"Eva","family":"Nittinger","sequence":"additional","affiliation":[]},{"given":"Melissa A.","family":"Yu","sequence":"additional","affiliation":[]},{"given":"Symon","family":"Gathiaka","sequence":"additional","affiliation":[]},{"given":"W. Patrick","family":"Walters","sequence":"additional","affiliation":[]},{"given":"Christian","family":"Tyrchan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,10,13]]},"reference":[{"key":"1105_CR1","doi-asserted-by":"publisher","first-page":"1148","DOI":"10.1016\/j.drudis.2019.02.013","volume":"24","author":"T Hoffmann","year":"2019","unstructured":"Hoffmann T, Gastreich M (2019) The next level in chemical space navigation: going far beyond enumerable compound libraries. Drug Discov Today 24:1148\u20131156","journal-title":"Drug Discov Today"},{"key":"1105_CR2","doi-asserted-by":"publisher","DOI":"10.1002\/minf.202400114","volume":"43","author":"MV Protopopov","year":"2024","unstructured":"Protopopov MV, Tararina VV, Bonachera F et al (2024) The freedom space - a new set of commercially available molecules for hit discovery. Mol Inform 43:e202400114","journal-title":"Mol Inform"},{"key":"1105_CR3","doi-asserted-by":"publisher","first-page":"2021","DOI":"10.1021\/acs.jcim.2c00224","volume":"62","author":"WA Warr","year":"2022","unstructured":"Warr WA, Nicklaus MC, Nicolaou CA, Rarey M (2022) Exploration of Ultralarge Compound Collections for Drug Discovery. J Chem Inf Model 62:2021\u20132034","journal-title":"J Chem Inf Model"},{"key":"1105_CR4","doi-asserted-by":"publisher","first-page":"5773","DOI":"10.1021\/acs.jcim.3c01239","volume":"63","author":"T Sivula","year":"2023","unstructured":"Sivula T, Yetukuri L, Kalliokoski T et al (2023) Machine learning-boosted docking enables the efficient structure-based virtual screening of Giga-scale enumerated chemical libraries. J Chem Inf Model 63:5773\u20135783","journal-title":"J Chem Inf Model"},{"key":"1105_CR5","doi-asserted-by":"publisher","first-page":"663","DOI":"10.1038\/s41586-020-2117-z","volume":"580","author":"C Gorgulla","year":"2020","unstructured":"Gorgulla C, Boeszoermenyi A, Wang Z-F et al (2020) An open-source drug discovery platform enables ultra-large virtual screens. Nature 580:663\u2013668","journal-title":"Nature"},{"key":"1105_CR6","doi-asserted-by":"publisher","DOI":"10.1101\/2023.04.25.537981","author":"C Gorgulla","year":"2023","unstructured":"Gorgulla C, Cecchini D, Nigam A et al (2023) AI-enhanced adaptive virtual screening platform enabling exploration of 69 billion molecules discovers structurally validated FSP1 inhibitors. bioRxiv. https:\/\/doi.org\/10.1101\/2023.04.25.537981","journal-title":"bioRxiv"},{"key":"1105_CR7","doi-asserted-by":"publisher","DOI":"10.1016\/j.drudis.2024.103985","volume":"29","author":"L Wang","year":"2024","unstructured":"Wang L, Zhou Z, Yang X et al (2024) The present state and challenges of active learning in drug discovery. Drug Discov Today 29:103985","journal-title":"Drug Discov Today"},{"key":"1105_CR8","doi-asserted-by":"publisher","first-page":"2612","DOI":"10.1021\/acs.jcim.3c01661","volume":"64","author":"E Marin","year":"2024","unstructured":"Marin E, Kovaleva M, Kadukova M et al (2024) Regression-based active learning for accessible acceleration of ultra-large library docking. J Chem Inf Model 64:2612\u20132623","journal-title":"J Chem Inf Model"},{"key":"1105_CR9","doi-asserted-by":"publisher","first-page":"7866","DOI":"10.1039\/D0SC06805E","volume":"12","author":"DE Graff","year":"2021","unstructured":"Graff DE, Shakhnovich EI, Coley CW (2021) Accelerating high-throughput virtual screening through molecular pool-based active learning. Chem Sci 12:7866\u20137881","journal-title":"Chem Sci"},{"key":"1105_CR10","doi-asserted-by":"publisher","first-page":"673","DOI":"10.1038\/s41586-023-05905-z","volume":"616","author":"AV Sadybekov","year":"2023","unstructured":"Sadybekov AV, Katritch V (2023) Computational approaches streamlining drug discovery. Nature 616:673\u2013685","journal-title":"Nature"},{"key":"1105_CR11","doi-asserted-by":"publisher","first-page":"452","DOI":"10.1038\/s41586-021-04220-9","volume":"601","author":"AA Sadybekov","year":"2022","unstructured":"Sadybekov AA, Sadybekov AV, Liu Y et al (2022) Synthon-based ligand discovery in virtual libraries of over 11 billion compounds. Nature 601:452\u2013459","journal-title":"Nature"},{"key":"1105_CR12","doi-asserted-by":"publisher","first-page":"6447","DOI":"10.1038\/s41467-022-33981-8","volume":"13","author":"P Beroza","year":"2022","unstructured":"Beroza P, Crawford JJ, Ganichkin O et al (2022) Chemical space docking enables large-scale structure-based virtual screening to discover ROCK1 kinase inhibitors. Nat Commun 13:6447","journal-title":"Nat Commun"},{"key":"1105_CR13","doi-asserted-by":"publisher","first-page":"1251","DOI":"10.1021\/acs.jcim.3c01865","volume":"64","author":"C Cheng","year":"2024","unstructured":"Cheng C, Beroza P (2024) Shape-aware synthon search (SASS) for virtual screening of synthon-based chemical spaces. J Chem Inf Model 64:1251\u20131260","journal-title":"J Chem Inf Model"},{"key":"1105_CR14","doi-asserted-by":"publisher","first-page":"1158","DOI":"10.1021\/acs.jcim.3c01790","volume":"64","author":"K Klarich","year":"2024","unstructured":"Klarich K, Goldman B, Kramer T et al (2024) Thompson sampling\u2500an efficient method for searching ultralarge synthesis on demand databases. J Chem Inf Model 64:1158\u20131171","journal-title":"J Chem Inf Model"},{"key":"1105_CR15","doi-asserted-by":"publisher","DOI":"10.1126\/sciadv.ads7187","volume":"11","author":"GJ Correy","year":"2025","unstructured":"Correy GJ, Rachman MM, Togo T et al (2025) Exploration of structure-activity relationships for the SARS-CoV-2 macrodomain from shape-based fragment linking and active learning. Sci Adv 11:eads7187","journal-title":"Sci Adv"},{"key":"1105_CR16","doi-asserted-by":"publisher","first-page":"2193","DOI":"10.1016\/j.physa.2011.12.004","volume":"391","author":"A Lipowski","year":"2012","unstructured":"Lipowski A, Lipowska D (2012) Roulette-wheel selection via stochastic acceptance. Physica A Stat Mech Appl 391:2193\u20132196","journal-title":"Physica A Stat Mech Appl"},{"key":"1105_CR17","doi-asserted-by":"publisher","DOI":"10.1201\/b16018","volume-title":"Bayesian data analysis","author":"A Gelman","year":"2013","unstructured":"Gelman A, Carlin JB, Stern HS et al (2013) Bayesian data analysis, 3rd edn. CRC Press, Hoboken","edition":"3"},{"key":"1105_CR18","doi-asserted-by":"publisher","first-page":"1489","DOI":"10.1021\/jm040163o","volume":"48","author":"TS Rush 3rd","year":"2005","unstructured":"Rush TS 3rd, Grant JA, Mosyak L, Nicholls A (2005) A shape-based 3-D scaffold hopping method and its application to a bacterial protein-protein interaction. J Med Chem 48:1489\u20131495","journal-title":"J Med Chem"},{"key":"1105_CR19","unstructured":"eMolecules eXplore. In: eMolecules. https:\/\/www.emolecules.com\/products\/explore. Accessed 26 Aug 2025"},{"key":"1105_CR20","doi-asserted-by":"publisher","DOI":"10.3390\/ijms24076581","volume":"24","author":"G Graziano","year":"2023","unstructured":"Graziano G, Stefanachi A, Contino M et al (2023) Multicomponent reaction-assisted drug discovery: a time- and cost-effective green approach speeding up identification and optimization of anticancer drugs. Int J Mol Sci 24:6581","journal-title":"Int J Mol Sci"},{"key":"1105_CR21","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1021\/ci049714+","volume":"45","author":"JJ Irwin","year":"2005","unstructured":"Irwin JJ, Shoichet BK (2005) ZINC\u2013a free database of commercially available compounds for virtual screening. J Chem Inf Model 45:177\u2013182","journal-title":"J Chem Inf Model"},{"key":"1105_CR22","doi-asserted-by":"publisher","first-page":"2287","DOI":"10.1021\/acs.jmedchem.3c02070","volume":"67","author":"AJ Woodhead","year":"2024","unstructured":"Woodhead AJ, Erlanson DA, de Esch IJP et al (2024) Fragment-to-lead medicinal chemistry publications in 2022. J Med Chem 67:2287\u20132304","journal-title":"J Med Chem"},{"key":"1105_CR23","doi-asserted-by":"publisher","first-page":"572","DOI":"10.1021\/ci100031x","volume":"50","author":"PCD Hawkins","year":"2010","unstructured":"Hawkins PCD, Skillman AG, Warren GL et al (2010) Conformer generation with OMEGA: algorithm and validation using high quality structures from the Protein Databank and Cambridge Structural Database. J Chem Inf Model 50:572\u2013584","journal-title":"J Chem Inf Model"},{"key":"1105_CR24","doi-asserted-by":"publisher","first-page":"325","DOI":"10.1007\/978-1-4842-2199-0_8","volume-title":"Practical Hadoop ecosystem: a definitive guide to Hadoop-related frameworks and tools","author":"D Vohra","year":"2016","unstructured":"Vohra D (2016) Apache parquet. In: Vohra D (ed) Practical Hadoop ecosystem: a definitive guide to Hadoop-related frameworks and tools. Springer, Berlin, pp 325\u2013335"},{"key":"1105_CR25","doi-asserted-by":"publisher","first-page":"16796","DOI":"10.1021\/acs.jmedchem.4c01632","volume":"67","author":"Y Wu","year":"2024","unstructured":"Wu Y, Liu F, Glenn I et al (2024) Identifying artifacts from large library docking. J Med Chem 67:16796\u201316806","journal-title":"J Med Chem"}],"updated-by":[{"DOI":"10.1186\/s13321-025-01113-1","type":"correction","label":"Correction","source":"publisher","updated":{"date-parts":[[2025,10,21]],"date-time":"2025-10-21T00:00:00Z","timestamp":1761004800000}}],"container-title":["Journal of Cheminformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-025-01105-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13321-025-01105-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13321-025-01105-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T05:34:48Z","timestamp":1761111288000},"score":1,"resource":{"primary":{"URL":"https:\/\/jcheminf.biomedcentral.com\/articles\/10.1186\/s13321-025-01105-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,13]]},"references-count":25,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["1105"],"URL":"https:\/\/doi.org\/10.1186\/s13321-025-01105-1","relation":{},"ISSN":["1758-2946"],"issn-type":[{"value":"1758-2946","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,10,13]]},"assertion":[{"value":"23 April 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 September 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 October 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 October 2025","order":5,"name":"change_date","label":"Change Date","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Correction","order":6,"name":"change_type","label":"Change Type","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"A Correction to this paper has been published:","order":7,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"https:\/\/doi.org\/10.1186\/s13321-025-01113-1","URL":"https:\/\/doi.org\/10.1186\/s13321-025-01113-1","order":8,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"H.Z., E.N., M.Y., S.G., and C.T. are employees of AstraZeneca and may own stock or stock options in the company. P.W. is an employee of Relay Therapeutics and may also own stock or stock options.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"154"}}