{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T10:26:04Z","timestamp":1770891964594,"version":"3.50.1"},"reference-count":72,"publisher":"Ubiquity Press, Ltd.","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026,2,12]]},"DOI":"10.5334\/dsj-2026-006","type":"journal-article","created":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T09:34:37Z","timestamp":1770888877000},"source":"Crossref","is-referenced-by-count":0,"title":["Bridging the Data Discovery Gap: User-Centric Recommendations for Research Data Repositories"],"prefix":"10.5334","volume":"25","author":[{"given":"Mingfang","family":"Wu","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6423-7427","authenticated-orcid":false,"given":"Felicitas","family":"L\u00f6ffler","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1793-9615","authenticated-orcid":false,"given":"Brigitte","family":"Mathiak","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0222-4273","authenticated-orcid":false,"given":"Fotis","family":"Psomopoulos","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1900-4162","authenticated-orcid":false,"given":"Uwe","family":"Schindler","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7180-0246","authenticated-orcid":false,"given":"Amir","family":"Aryani","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0388-015X","authenticated-orcid":false,"given":"Jordi Bodera","family":"Sempere","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2910-8085","authenticated-orcid":false,"given":"Antica","family":"Culina","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3883-4169","authenticated-orcid":false,"given":"Andreas","family":"Czerniak","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2554-180X","authenticated-orcid":false,"given":"Chris","family":"Erdmann","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5475-8632","authenticated-orcid":false,"given":"Kathleen","family":"Gregory","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2036-8350","authenticated-orcid":false,"given":"Nick","family":"Juty","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7702-4495","authenticated-orcid":false,"given":"Allyson","family":"Lister","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6504-4598","authenticated-orcid":false,"given":"Ying-Hsang","family":"Liu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4831-9489","authenticated-orcid":false,"given":"Samantha","family":"Pearman-Kanza","sequence":"additional","affiliation":[]}],"member":"3285","reference":[{"key":"key20260212093430_B1","article-title":"\u2018Prov-Dominoes: An approach for knowledge discovery from provenance data\u2019","volume":"245","year":"2024","journal-title":"Expert Systems with Applications"},{"key":"key20260212093430_B2","article-title":"\u2018Semantic approaches for query expansion: Taxonomy, challenges, and future research directions\u2019","year":"2025","journal-title":"PeerJ Computer Science"},{"issue":"6","key":"key20260212093430_B3","article-title":"Retrieval augmented generation for large language models in healthcare: A systematic review","volume":"4","year":"2025","journal-title":"PLOS Digital Health"},{"key":"key20260212093430_B4","unstructured":"Bergold, J. and Thomas, S. (2012) \u2018Participatory research methods: A methodological approach in motion\u2019, Historical Social Research\/Historische Sozialforschung, 37(4), pp. 191\u2013222. Available at: https:\/\/www.jstor.org\/stable\/41756482"},{"issue":"1","key":"key20260212093430_B5","article-title":"\u2018Improving discovery and use of NASA\u2019s Earth observation data through metadata quality assessments\u2019","volume":"20","year":"2021","journal-title":"Data Science Journal"},{"issue":"1\/2","key":"key20260212093430_B6","first-page":"1","article-title":"\u2018The Scholix framework for interoperability in data-literature information exchange\u2019","volume":"23","year":"2017","journal-title":"D-Lib Magazine"},{"issue":"1","key":"key20260212093430_B7","article-title":"\u2018The FAIR assessment conundrum: Reflections on tools and metrics\u2019","volume":"23","year":"2024","journal-title":"Data Science Journal"},{"key":"key20260212093430_B8","article-title":"\u2018Large language models for text classification: From zero-shot learning to instruction-tuning\u2019","year":"2025","journal-title":"Sociological Methods & Research"},{"key":"key20260212093430_B9","article-title":"\u2018Data communities: A new model for supporting STEM data sharing\u2019","year":"2019","journal-title":"Ithaka S+R"},{"key":"key20260212093430_B10","author":"CoreTrustSeal Standards and Certification Board","year":"2022","journal-title":"CoreTrustSeal requirements 2023\u20132025 (V01.00)"},{"key":"key20260212093430_B11","author":"DataCite","year":"2024","journal-title":"DataCite thriving communities: 3000 repositories and counting"},{"key":"key20260212093430_B12","author":"DataCite Metadata Working Group","year":"2024","journal-title":"DataCite metadata schema for the publication and citation of research data and other research outputs"},{"issue":"1","key":"key20260212093430_B13","doi-asserted-by":"crossref","first-page":"533","DOI":"10.1002\/aris.2010.1440440119","article-title":"\u2018Confessional methods and everyday life information seeking\u2019","volume":"44","year":"2010","journal-title":"Annual Review of Information Science and Technology"},{"issue":"3","key":"key20260212093430_B14","doi-asserted-by":"crossref","first-page":"337","DOI":"10.1093\/jamia\/ocx134","article-title":"\u2018User needs analysis and usability assessment of DataMed \u2013 a biomedical data discovery index\u2019","volume":"25","year":"2018","journal-title":"Journal of the American Medical Informatics Association"},{"key":"key20260212093430_B15","article-title":"\u2018PANGAEA \u2013 Data publisher for earth & environmental Science\u2019","volume":"10","year":"2023","journal-title":"Scientific Data"},{"issue":"4","key":"key20260212093430_B16","doi-asserted-by":"crossref","first-page":"327","DOI":"10.1037\/h0061470","article-title":"\u2018The critical incident technique\u2019","volume":"51","year":"1954","journal-title":"Psychological Bulletin"},{"key":"key20260212093430_B17","first-page":"32","article-title":"\u2018Using collection descriptions to enhance an aggregation of harvested item-level metadata\u2019","year":"2005"},{"key":"key20260212093430_B18","unstructured":"Friedrich, T. (2020). Looking for data: Information seeking behaviour of survey data users (Doctoral dissertation). Humboldt-Universit\u00e4t zu Berlin. Available at: 10.18452\/22173"},{"key":"key20260212093430_B19","article-title":"\u2018Retrieval-augmented generation for large language models: A surve\u2019, arXiv:2312.10997v5 [cs.CL]","year":"2023"},{"key":"key20260212093430_B20","year":"2024","journal-title":"WorldFAIR (D2.3) (version 1)"},{"issue":"2","key":"key20260212093430_B21","article-title":"\u2018Lost or found? Discovering data needed for research\u2019","volume":"2","year":"2020","journal-title":"Harvard Data Science Review"},{"key":"key20260212093430_B22","article-title":"WorldFAIR (D2.2)","year":"2024","journal-title":"WorldFAIR\u2019s experience with FIPs (second set of FAIR implementation profiles for each case study) (version 1)"},{"issue":"4","key":"key20260212093430_B23","doi-asserted-by":"crossref","first-page":"626","DOI":"10.1108\/EL-11-2016-0243","article-title":"\u2018Social science data repositories in data deluge: A case study of ICPSR\u2019s workflow and practices\u2019","volume":"35","year":"2017","journal-title":"The Electronic Library"},{"key":"key20260212093430_B24","first-page":"1485","article-title":"\u2018Characterising dataset search queries\u2019","year":"2018"},{"key":"key20260212093430_B25","doi-asserted-by":"crossref","first-page":"147","DOI":"10.1134\/S199508022301016X","article-title":"\u2018Difficulties of FAIR principles implementation in cross-domain research infrastructures\u2019","volume":"44","year":"2023","journal-title":"Lobachevskii Journal of Math"},{"key":"key20260212093430_B26","article-title":"\u2018Talking datasets\u2014Understanding data sense-making behaviours\u2019","volume":"146","year":"2021","journal-title":"International Journal of Human-Computer Studies"},{"key":"key20260212093430_B27","first-page":"1277","article-title":"\u2018The Trials and Tribulations of Working with Structured Data: a Study on Information Seeking Behaviour\u2019","year":"2017"},{"key":"key20260212093430_B28","article-title":"\u2018A survey of current practices in data search services\u2019","volume":"V1","year":"2018","journal-title":"Mendeley Data"},{"issue":"1","key":"key20260212093430_B29","article-title":"\u2018Versioning data is about more than revisions: A conceptual framework and proposed principles\u2019","volume":"20","year":"2021","journal-title":"Data Science Journal"},{"key":"key20260212093430_B30","article-title":"\u2018FAIR assessment tools: Evaluating use and performance\u2019","volume":"27","year":"2022","journal-title":"NanoImpact"},{"key":"key20260212093430_B31","year":"2023","journal-title":"Towards a data quality framework for EOSC (1.0.0)"},{"key":"key20260212093430_B32","first-page":"128","article-title":"\u2018Direct, orienting, and scenic paths: How users navigate search in a research data archive\u2019","year":"2023"},{"key":"key20260212093430_B33","unstructured":"Lang, J.M. and Benbow, M.E. (2013) \u2018Species interactions and competition\u2019, Nature Education Knowledge, 4(4), p. 8. Available at: https:\/\/www.nature.com\/scitable\/knowledge\/library\/species-interactions-and-competition-102131429\/"},{"key":"key20260212093430_B34","year":"2023","journal-title":"FAIRsharing in a nutshell"},{"key":"key20260212093430_B35","year":"2022","journal-title":"Elicitation of data discovery contexts: An interview study (1.0)"},{"key":"key20260212093430_B36","year":"2023","journal-title":"Elicitation of contexts for discovering clinical trials and related health data: An interview study (V1.0)"},{"issue":"3","key":"key20260212093430_B37","article-title":"\u2018Dataset search in biodiversity research: Do metadata in data repositories reflect scholarly information needs?\u2019","volume":"16","year":"2021","journal-title":"PLoS ONE"},{"key":"key20260212093430_B38","article-title":"\u2018Semantic search for biological datasets: A usability study on modes of querying and explaining search results\u2019","year":"2023"},{"key":"key20260212093430_B39","year":"2019","journal-title":"The OpenAIRE research graph data model"},{"issue":"4","key":"key20260212093430_B40","doi-asserted-by":"crossref","first-page":"41","DOI":"10.1145\/1121949.1121979","article-title":"\u2018Exploratory search: from finding to understanding\u2019","volume":"49","year":"2006","journal-title":"Communications of the ACM"},{"issue":"4","key":"key20260212093430_B41","doi-asserted-by":"crossref","first-page":"649","DOI":"10.1002\/asi.24962","article-title":"\u2018Data, not documents: Moving beyond theories of information-seeking behavior to advance data discovery\u2019","volume":"76","year":"2025","journal-title":"Journal of the Association for Information Science and Technology"},{"key":"key20260212093430_B42","article-title":"\u2018OpenRefine: An approachable open tool to clean research data\u2019","volume":"170","year":"2022","journal-title":"Bulletin \u2013 Association of Canadian Map Libraries and Archives (ACMLA)"},{"issue":"5","key":"key20260212093430_B43","doi-asserted-by":"crossref","first-page":"1605","DOI":"10.1016\/j.ipm.2019.04.007","article-title":"\u2018A knowledge-based semantic framework for query expansion\u2019","volume":"56","year":"2019","journal-title":"Information Processing & Management"},{"key":"key20260212093430_B44","unstructured":"National Library of Medicine (2021) SNOMED CT to ICD-10-CM map. Available at: https:\/\/www.nlm.nih.gov\/research\/umls\/mapping_projects\/snomedct_to_icd10cm.html."},{"key":"key20260212093430_B45","unstructured":"NISO (National Information Standards Organization) (2004) Understanding metadata. Bethesda: NISO Press. Available at: https:\/\/www.niso.org\/standards\/resources\/UnderstandingMetadata.pdf."},{"issue":"1","key":"key20260212093430_B46","article-title":"\u2018Harmonizing quality measures of FAIRness assessment towards machine-actionable quality information\u2019","volume":"17","year":"2024","journal-title":"International Journal of Digital Earth"},{"key":"key20260212093430_B47","volume-title":"Software Engineering: A Practitioner\u2019s Approach","year":"2015","edition":"8th"},{"issue":"3","key":"key20260212093430_B48","article-title":"\u2018Analytics and privacy: Using Matomo in EBSCO\u2019s discovery service\u2019","volume":"39","year":"2020","journal-title":"Information Technology and Libraries"},{"issue":"1","key":"key20260212093430_B49","doi-asserted-by":"crossref","first-page":"66","DOI":"10.1108\/JD-12-2021-0245","article-title":"\u2018Large-scale analysis of query logs to profile users for dataset search\u2019","volume":"79","year":"2023","journal-title":"Journal of Documentation"},{"key":"key20260212093430_B50","volume-title":"Designing the user interface: Strategies for effective human-computer interaction","year":"2016","edition":"6th"},{"key":"key20260212093430_B51","article-title":"\u2018Improving dense retrieval models with LLM augmented data for dataset search\u2019","volume":"294","year":"2024","journal-title":"Knowledge-Based Systems"},{"key":"key20260212093430_B52","doi-asserted-by":"crossref","first-page":"189","DOI":"10.1146\/annurev-statistics-033121-112921","article-title":"\u2018Statistical data privacy: A song of privacy and Uutility\u2019","volume":"10","year":"2023","journal-title":"Annual Review of Statistics and Its Application"},{"key":"key20260212093430_B53","first-page":"428","article-title":"\u2018Interdisciplinary searching as a use case for vocabulary mapping\u2019","year":"2020"},{"issue":"4","key":"key20260212093430_B54","article-title":"\u2018Discovering datasets on the web scale: Challenges and recommendations for Google dataset search\u2019","year":"2024","journal-title":"Harvard Data Science Review"},{"key":"key20260212093430_B55","article-title":"\u2018Journal production guidance for software and data citations\u2019","volume":"10","year":"2023","journal-title":"Scientific Data"},{"issue":"6","key":"key20260212093430_B56","first-page":"929","article-title":"\u2018Review of vegetation classification and mapping systems undertaken by major forested land management agencies in Australia\u2019","volume":"45","year":"1997","journal-title":"Australian Journal of Botany"},{"issue":"4","key":"key20260212093430_B57","article-title":"\u2018Transforming metadata content guidelines and instructions to linked data\u2019","volume":"51","year":"2023","journal-title":"Journal of Documentation"},{"issue":"2","key":"key20260212093430_B58","doi-asserted-by":"crossref","first-page":"175","DOI":"10.1007\/s00799-021-00303-0","article-title":"\u2018Data-seeking behaviour in the social sciences\u2019","volume":"22","year":"2021","journal-title":"International Journal on Digital Libraries"},{"key":"key20260212093430_B59","first-page":"547","volume-title":"The semantic web \u2013 ISWC 2020","year":"2020"},{"issue":"C","key":"key20260212093430_B60","first-page":"81","article-title":"\u2018Visual query interfaces for semantic datasets: An evaluation study\u2019","volume":"39","year":"2016","journal-title":"Journal of Web Semantics"},{"issue":"4","key":"key20260212093430_B61","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1080\/07421222.1996.11518099","article-title":"\u2018Beyond Accuracy: What Data Quality Means to Data Consumers\u2019","volume":"12","year":"1996","journal-title":"Journal of Management Information Systems"},{"key":"key20260212093430_B62","first-page":"17716","article-title":"\u2018Searching for best practices in retrieval-augmented generation\u2019","year":"2024"},{"issue":"1\u20132","key":"key20260212093430_B63","article-title":"\u2018Improving WorldCat quality: Resolving to reduce duplicates\u2019","volume":"25","year":"2020","journal-title":"Organizacija znanja"},{"key":"key20260212093430_B64","first-page":"262","volume-title":"Electronic Government","year":"2023"},{"key":"key20260212093430_B65","volume-title":"Interactions with search systems","year":"2016"},{"key":"key20260212093430_B66","article-title":"\u2018The FAIR Guiding Principles for scientific data management and stewardship\u2019","volume":"3","year":"2016","journal-title":"Scientific Data"},{"issue":"1","key":"key20260212093430_B67","article-title":"\u2018Automatic transcription of English and German qualitative interviews\u2019","volume":"25","year":"2024","journal-title":"Forum Qualitative Sozialforschung Forum: Qualitative Social Research"},{"key":"key20260212093430_B68","year":"2022","journal-title":"ARDC Project: Eliciting data search context"},{"key":"key20260212093430_B69","author":"RDA Research Metadata Schemas WG","year":"2021","journal-title":"Guidelines for publishing structured metadata on the web (3.1)"},{"issue":"1","key":"key20260212093430_B70","article-title":"\u2018Data discovery paradigms: User requirements and recommendations for data repositories\u2019","volume":"18","year":"2019","journal-title":"Data Science Journal"},{"issue":"1","key":"key20260212093430_B71","doi-asserted-by":"crossref","first-page":"122","DOI":"10.1162\/dint_a_00162","article-title":"\u2018Automated metadata annotation: What is and is not possible with machine learning\u2019","volume":"5","year":"2023","journal-title":"Data Intelligence"},{"key":"key20260212093430_B72","year":"2024","journal-title":"Ten principles to improve dataset discoverability (1.0)"}],"container-title":["Data Science Journal"],"original-title":[],"language":"en","deposited":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T09:34:51Z","timestamp":1770888891000},"score":1,"resource":{"primary":{"URL":"http:\/\/datascience.codata.org\/articles\/10.5334\/dsj-2026-006\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"references-count":72,"alternative-id":["10.5334\/dsj-2026-006"],"URL":"https:\/\/doi.org\/10.5334\/dsj-2026-006","relation":{},"ISSN":["1683-1470"],"issn-type":[{"value":"1683-1470","type":"print"}],"subject":[],"published":{"date-parts":[[2026]]},"article-number":"6"}}