{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,26]],"date-time":"2025-11-26T21:57:14Z","timestamp":1764194234692},"reference-count":15,"publisher":"Oxford University Press (OUP)","issue":"22","license":[{"start":{"date-parts":[[2017,8,2]],"date-time":"2017-08-02T00:00:00Z","timestamp":1501632000000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by-nc\/4.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,11,15]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Motivation<\/jats:title>\n                  <jats:p>Biobanks are indispensable for large-scale genetic\/epidemiological studies, yet it remains difficult for researchers to determine which biobanks contain data matching their research questions.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Results<\/jats:title>\n                  <jats:p>To overcome this, we developed a new matching algorithm that identifies pairs of related data elements between biobanks and research variables with high precision and recall. It integrates lexical comparison, Unified Medical Language System ontology tagging and semantic query expansion. The result is BiobankUniverse, a fast matchmaking service for biobanks and researchers. Biobankers upload their data elements and researchers their desired study variables, BiobankUniverse automatically shortlists matching attributes between them. Users can quickly explore matching potential and search for biobanks\/data elements matching their research. They can also curate matches and define personalized data-universes.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and implementation<\/jats:title>\n                  <jats:p>BiobankUniverse is available at http:\/\/biobankuniverse.com or can be downloaded as part of the open source MOLGENIS suite at http:\/\/github.com\/molgenis\/molgenis.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Supplementary information<\/jats:title>\n                  <jats:p>Supplementary data are available at Bioinformatics online.<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btx478","type":"journal-article","created":{"date-parts":[[2017,8,1]],"date-time":"2017-08-01T11:19:46Z","timestamp":1501586386000},"page":"3627-3634","source":"Crossref","is-referenced-by-count":4,"title":["BiobankUniverse: automatic matchmaking between datasets for biobank data discovery and integration"],"prefix":"10.1093","volume":"33","author":[{"given":"Chao","family":"Pang","sequence":"first","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"},{"name":"Department of Epidemiology, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fleur","family":"Kelpin","sequence":"additional","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"David","family":"van Enckevort","sequence":"additional","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Niina","family":"Eklund","sequence":"additional","affiliation":[{"name":"Department of Public Health Solutions, National Institute for Health and Welfare, Helsinki, Finland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kaisa","family":"Silander","sequence":"additional","affiliation":[{"name":"Department of Public Health Solutions, National Institute for Health and Welfare, Helsinki, Finland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dennis","family":"Hendriksen","sequence":"additional","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mark","family":"de Haan","sequence":"additional","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jonathan","family":"Jetten","sequence":"additional","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tommy","family":"de Boer","sequence":"additional","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bart","family":"Charbon","sequence":"additional","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Petr","family":"Holub","sequence":"additional","affiliation":[{"name":"Biobanking and BioMolecular Resources Research Infrastructure (BBMRI-ERIC), Graz, Austria"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hans","family":"Hillege","sequence":"additional","affiliation":[{"name":"Department of Epidemiology, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Morris A","family":"Swertz","sequence":"additional","affiliation":[{"name":"Department of Genetics, Genomics Coordination Center, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"},{"name":"Department of Epidemiology, University Medical Center Groningen, University of Groningen, Groningen, The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2017,8,2]]},"reference":[{"key":"2023051308375586100_btx478-B1","doi-asserted-by":"crossref","first-page":"1383","DOI":"10.1093\/ije\/dyq139","article-title":"Quality, quantity and harmony: the DataSHaPER approach to integrating data across bioclinical studies","volume":"39","author":"Fortier","year":"2010","journal-title":"Int. J. Epidemiol"},{"key":"2023051308375586100_btx478-B100","doi-asserted-by":"crossref","first-page":"298","DOI":"10.1089\/bio.2015.0070","article-title":"Toward Global Biobank Integration by Implementation of the Minimum Information About BIobank Data Sharing (MIABIS 2.0 Core)","volume":"14","author":"Merino-Martinez","year":"2016","journal-title":"Biopreserv. Biobank"},{"key":"2023051308375586100_btx478-B2","doi-asserted-by":"crossref","first-page":"559","DOI":"10.1089\/bio.2016.0088","article-title":"BBMRI-ERIC Directory: 515 Biobanks with Over 60 Million Biological Samples","volume":"14","author":"Holub","year":"2016","journal-title":"Biopreserv. Biobank"},{"key":"2023051308375586100_btx478-B3","author":"Maelstrom Research","year":"2015"},{"key":"2023051308375586100_btx478-B4","doi-asserted-by":"crossref","first-page":"69","DOI":"10.1300\/J104v43n03_04","article-title":"SKOS: Simple Knowledge Organisation for the Web","volume":"43","author":"Miles","year":"2007","journal-title":"Catalog. Classif. Q"},{"key":"2023051308375586100_btx478-B5","doi-asserted-by":"crossref","first-page":"343","DOI":"10.1089\/bio.2012.0003","article-title":"A minimum data set for sharing biobank samples, information, and data: MIABIS","volume":"10","author":"Norlin","year":"2012","journal-title":"Biopreserv. Biobank"},{"key":"2023051308375586100_btx478-B6","doi-asserted-by":"crossref","first-page":"65","DOI":"10.1136\/amiajnl-2013-002577","article-title":"BiobankConnect: software to rapidly connect data elements for pooled analysis across biobanks using ontological and lexical indexing","volume":"22","author":"Pang","year":"2015","journal-title":"J. Am. Med. Inf. Assoc"},{"key":"2023051308375586100_btx478-B7","doi-asserted-by":"crossref","first-page":"btw155","DOI":"10.1093\/bioinformatics\/btw155","article-title":"MOLGENIS\/connect: a system for semi-automatic integration of heterogeneous phenotype data with applications in biobanks","volume":"32","author":"Pang","year":"2016","journal-title":"Bioinformatics"},{"key":"2023051308375586100_btx478-B8","first-page":"1532","author":"Pennington","year":"2014"},{"key":"2023051308375586100_btx478-B9","doi-asserted-by":"crossref","first-page":"1172","DOI":"10.1093\/ije\/dyu229","article-title":"Cohort Profile: LifeLines, a three-generation cohort study and biobank","volume":"44","author":"Scholtens","year":"2015","journal-title":"Int. J. Epidemiol"},{"key":"2023051308375586100_btx478-B10","author":"Shima","year":"2011"},{"key":"2023051308375586100_btx478-B11","doi-asserted-by":"crossref","first-page":"S12","DOI":"10.1186\/1471-2105-11-S12-S12","article-title":"The MOLGENIS toolkit: rapid prototyping of biosoftware at the push of a button","volume":"11","author":"Swertz","year":"2010","journal-title":"BMC Bioinformatics"},{"key":"2023051308375586100_btx478-B12","author":"The Apache Software Foundation","year":"2006"},{"key":"2023051308375586100_btx478-B13","author":"Wolffenbuttel","year":"2013"},{"key":"2023051308375586100_btx478-B14","author":"Wu","year":"1994"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/33\/22\/3627\/50307278\/bioinformatics_33_22_3627.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/33\/22\/3627\/50307278\/bioinformatics_33_22_3627.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,13]],"date-time":"2023-05-13T08:38:13Z","timestamp":1683967093000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/33\/22\/3627\/4060551"}},"subtitle":[],"editor":[{"given":"Jonathan","family":"Wren","sequence":"additional","affiliation":[],"role":[{"role":"editor","vocabulary":"crossref"}]}],"short-title":[],"issued":{"date-parts":[[2017,8,2]]},"references-count":15,"journal-issue":{"issue":"22","published-print":{"date-parts":[[2017,11,15]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btx478","relation":{},"ISSN":["1367-4803","1367-4811"],"issn-type":[{"value":"1367-4803","type":"print"},{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2017,11,15]]},"published":{"date-parts":[[2017,8,2]]}}}