{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,14]],"date-time":"2026-05-14T22:45:39Z","timestamp":1778798739480,"version":"3.51.4"},"publisher-location":"Cham","reference-count":42,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032164506","type":"print"},{"value":"9783032164513","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-16451-3_26","type":"book-chapter","created":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T05:03:38Z","timestamp":1770699818000},"page":"421-440","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Keywords Are Not Always the\u00a0Key: A Metadata Field Analysis for\u00a0Natural Language Search on\u00a0Open Data Portals"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-3099-1738","authenticated-orcid":false,"given":"Lisa-Yao","family":"Gan","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-9989-1718","authenticated-orcid":false,"given":"Arunav","family":"Das","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5498-8670","authenticated-orcid":false,"given":"Johanna","family":"Walker","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1722-947X","authenticated-orcid":false,"given":"Elena","family":"Simperl","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,2,11]]},"reference":[{"key":"26_CR1","unstructured":"Varon, B.: Catalog search faq. https:\/\/support.socrata.com\/hc\/en-us\/articles\/225465147-Catalog-Search-FAQ (2023), Accessed 14 May 2025"},{"key":"26_CR2","unstructured":"Blei, D.M., Ng, A.Y., Jordan, M.I.: Latent dirichlet allocation. J. Mach. Learn. Res. 3(null), 993\u20131022 (2003)"},{"key":"26_CR3","unstructured":"Bonnet, A.: What is natural language search? how ai is transforming search (January 2025). https:\/\/encord.com\/blog\/natural-language-search\/ Accessed 17 July 2025"},{"key":"26_CR4","doi-asserted-by":"publisher","unstructured":"Bordes, A., Chopra, S., Weston, J.: Question answering with subgraph embeddings. In: Moschitti, A., Pang, B., Daelemans, W. (eds.) Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 615\u2013620. Association for Computational Linguistics, Doha, Qatar (Oct 2014). https:\/\/doi.org\/10.3115\/v1\/D14-1067, https:\/\/aclanthology.org\/D14-1067\/","DOI":"10.3115\/v1\/D14-1067"},{"key":"26_CR5","doi-asserted-by":"publisher","unstructured":"Chapman, A., et al.: Dataset search: a survey. VLDB J. 29(1), 251\u2013272 (Aug 2019). https:\/\/doi.org\/10.1007\/s00778-019-00564-x","DOI":"10.1007\/s00778-019-00564-x"},{"key":"26_CR6","unstructured":"Chen, P.B., Zhang, Y., Roth, D.: Is table retrieval a solved problem? exploring join-aware multi-table retrieval (2025). https:\/\/arxiv.org\/abs\/2404.09889"},{"key":"26_CR7","unstructured":"CKAN Project: Search feature detail page (2025). https:\/\/ckan.org\/features\/search Accessed 13 May 2025"},{"key":"26_CR8","doi-asserted-by":"publisher","unstructured":"Deerwester, S., Dumais, S.T., Furnas, G.W., Landauer, T.K., Harshman, R.: Indexing by latent semantic analysis. J. Am. Soc. Inform. Sci. 41(6), 391\u2013407 (1990). https:\/\/doi.org\/10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9, https:\/\/asistdl.onlinelibrary.wiley.com\/doi\/abs\/10.1002\/%28SICI%291097-4571%28199009%2941%3A6%3C391%3A%3AAID-ASI1%3E3.0.CO%3B2-9","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9"},{"key":"26_CR9","doi-asserted-by":"crossref","unstructured":"Douze, M., et al.: The faiss library (2025). https:\/\/arxiv.org\/abs\/2401.08281","DOI":"10.1109\/TBDATA.2025.3618474"},{"key":"26_CR10","doi-asserted-by":"publisher","unstructured":"Frank, M., Walker, J.: User centred methods for measuring the value of open data. J. Community Inform. 12 (2016). https:\/\/doi.org\/10.15353\/joci.v12i2.3221","DOI":"10.15353\/joci.v12i2.3221"},{"key":"26_CR11","doi-asserted-by":"publisher","unstructured":"Frank, M., Walker, J., Attard, J., Tygel, A.: Data literacy - what is it and how can we make it happen? J. Community Inform. 12 (2016). https:\/\/doi.org\/10.15353\/joci.v12i3.3274","DOI":"10.15353\/joci.v12i3.3274"},{"key":"26_CR12","doi-asserted-by":"crossref","unstructured":"Gao, J., Xiong, C., Bennett, P., Craswell, N.: Neural approaches to conversational information retrieval (2022). https:\/\/arxiv.org\/abs\/2201.05176","DOI":"10.1007\/978-3-031-23080-6"},{"key":"26_CR13","unstructured":"Google Research: Google dataset search (2025). https:\/\/datasetsearch.research.google.com\/, Accessed 17 May 2025"},{"key":"26_CR14","unstructured":"Greater London Authority: London datastore. https:\/\/data.london.gov.uk\/ (2025), Accessed 17 May 2025"},{"key":"26_CR15","doi-asserted-by":"publisher","unstructured":"Grootendorst, M.: Keybert: Minimal keyword extraction with bert (2020). https:\/\/doi.org\/10.5281\/zenodo.4461265","DOI":"10.5281\/zenodo.4461265"},{"key":"26_CR16","doi-asserted-by":"publisher","unstructured":"Gurin, J.: Open governments, open data: a new lever for transparency, citizen engagement, and economic growth. SAIS Rev. Inter. Affairs 34, 71\u201382 (2014). https:\/\/doi.org\/10.1353\/sais.2014.0009","DOI":"10.1353\/sais.2014.0009"},{"key":"26_CR17","doi-asserted-by":"publisher","unstructured":"Honnibal, M., Montani, I., Van\u00a0Landeghem, S., Boyd, A.: spaCy: industrial-strength Natural Language Processing in Python (2020). https:\/\/doi.org\/10.5281\/zenodo.1212303","DOI":"10.5281\/zenodo.1212303"},{"key":"26_CR18","doi-asserted-by":"publisher","unstructured":"Hulsebos, M., Lin, W., Shankar, S., Parameswaran, A.: It took longer than i was expecting: why is dataset search still so hard? In: Proceedings of the 2024 Workshop on Human-In-the-Loop Data Analytics, HILDA 2024, pp. 1\u20134. Association for Computing Machinery, New York (2024). https:\/\/doi.org\/10.1145\/3665939.3665959","DOI":"10.1145\/3665939.3665959"},{"key":"26_CR19","doi-asserted-by":"publisher","unstructured":"Jetzek, T.: The value of open government data (the value generating mechanisms of open government data). Geoforum Perspektiv 23, 48\u201357 (2013). https:\/\/doi.org\/10.5278\/ojs.persk..v12i23.489","DOI":"10.5278\/ojs.persk..v12i23.489"},{"key":"26_CR20","doi-asserted-by":"publisher","unstructured":"Kacprzak, E., Koesten, L., Ib\u00e1\u00f1ez, L.D., Blount, T., Tennison, J., Simperl, E.: Characterising dataset search \u2013 an analysis of search logs and data requests. SSRN Electronic J. (2018). https:\/\/doi.org\/10.2139\/ssrn.3287149","DOI":"10.2139\/ssrn.3287149"},{"key":"26_CR21","doi-asserted-by":"publisher","unstructured":"Kacprzak, E., Koesten, L., Ib\u00e1\u00f1ez, L.D., Blount, T., Tennison, J., Simperl, E.: Characterising dataset search\u2014an analysis of search logs and data requests. J. Web Semantics 55, 37\u201355 (2019). https:\/\/doi.org\/10.1016\/j.websem.2018.11.003, https:\/\/www.sciencedirect.com\/science\/article\/pii\/S1570826818300556","DOI":"10.1016\/j.websem.2018.11.003"},{"key":"26_CR22","doi-asserted-by":"publisher","unstructured":"Koesten, L., Gregory, K., Groth, P., Simperl, E.: Talking datasets \u2013 understanding data sensemaking behaviours. Inter. J. Human-Comput. Stud. 146, 102562 (2021). https:\/\/doi.org\/10.1016\/j.ijhcs.2020.102562, https:\/\/www.sciencedirect.com\/science\/article\/pii\/S1071581920301646","DOI":"10.1016\/j.ijhcs.2020.102562"},{"key":"26_CR23","doi-asserted-by":"publisher","unstructured":"Koesten, L.M., Kacprzak, E., Tennison, J.F.A., Simperl, E.: The trials and tribulations of working with structured data: -a study on information seeking behaviour. In: Proceedings of the 2017 CHI Conference on Human Factors in Computing Systems, CHI 2017. pp. 1277\u20131289. Association for Computing Machinery, New York (2017). https:\/\/doi.org\/10.1145\/3025453.3025838","DOI":"10.1145\/3025453.3025838"},{"key":"26_CR24","unstructured":"Mo, F., et al.: A survey of conversational search (2024). https:\/\/arxiv.org\/abs\/2410.15576"},{"key":"26_CR25","doi-asserted-by":"publisher","unstructured":"M\u00e1chov\u00e1, R., Hub, M., Ln\u011bni\u010dka, M.: Usability evaluation of open data portals: evaluating data discoverability, accessibility, and reusability from a stakeholders\u2019 perspective. Aslib J. Inform. Manag. 70 (2018). https:\/\/doi.org\/10.1108\/AJIM-02-2018-0026","DOI":"10.1108\/AJIM-02-2018-0026"},{"key":"26_CR26","doi-asserted-by":"publisher","unstructured":"Neumaier, S., Umbrich, J., Polleres, A.: Automated quality assessment of metadata across open data portals. J. Data Inform. Quality 8(1) (Oct 2016). https:\/\/doi.org\/10.1145\/2964909","DOI":"10.1145\/2964909"},{"key":"26_CR27","unstructured":"OpenAI, Achiam, J., et al.: Gpt-4 technical report (2024). https:\/\/arxiv.org\/abs\/2303.08774"},{"key":"26_CR28","doi-asserted-by":"publisher","unstructured":"Parthasarathi, S., Zeng, L., Hakkani-Tur, D.: Conversational text-to-sql: an odyssey into state-of-the-art and challenges ahead, pp.\u00a01\u20135 (June 2023). https:\/\/doi.org\/10.1109\/ICASSP49357.2023.10096170","DOI":"10.1109\/ICASSP49357.2023.10096170"},{"key":"26_CR29","unstructured":"Publications Office of the European Union: Portal architecture of data.europa.eu. https:\/\/data.europa.eu\/sites\/default\/files\/edp_factsheet_portal_architecture_online.pdf (2023), Accessed 13 May 2025"},{"key":"26_CR30","unstructured":"Radhakrishnan, P., et al.: Knowing when to ask \u2013 bridging large language models and data (2024). https:\/\/arxiv.org\/abs\/2409.13741"},{"key":"26_CR31","doi-asserted-by":"publisher","unstructured":"Sari, D.P., Ma, D.C., Ardhi, D.C.: Civic trust and the intention to utilize open government data: an experiment. In: Proceedings of the 25th Annual International Conference on Digital Government Research, dg.o 2024, pp. 1017\u20131019. Association for Computing Machinery, New York (2024). https:\/\/doi.org\/10.1145\/3657054.3657183","DOI":"10.1145\/3657054.3657183"},{"key":"26_CR32","unstructured":"Schema.org Community Group: Schema.org (2025). https:\/\/schema.org\/ Accessed 13 May 2025"},{"key":"26_CR33","doi-asserted-by":"crossref","unstructured":"Shahi, D.: Apache Solr: A Practical Approach to Enterprise Search. Apress, New York (2015). https:\/\/books.google.com\/books\/about\/Apache_Solr.html?id=5YZNCwAAQBAJ","DOI":"10.1007\/978-1-4842-1070-3"},{"key":"26_CR34","unstructured":"Touvron, H., et al.: Llama 2: Open foundation and fine-tuned chat models (2023). https:\/\/arxiv.org\/abs\/2307.09288"},{"key":"26_CR35","unstructured":"U.S. General Services Administration: Resources.data.gov. https:\/\/resources.data.gov\/ (2025), Accessed 11 May 2025"},{"key":"26_CR36","doi-asserted-by":"crossref","unstructured":"Voorhees, E.M., Tice, D.M.: The TREC-8 question answering track. In: Gavrilidou, M., Carayannis, G., Markantonatou, S., Piperidis, S., Stainhauer, G. (eds.) Proceedings of the Second International Conference on Language Resources and Evaluation (LREC 2000). European Language Resources Association (ELRA), Athens, Greece (May 2000). https:\/\/aclanthology.org\/L00-1018\/","DOI":"10.6028\/NIST.SP.500-246.qa-overview"},{"key":"26_CR37","unstructured":"Walker, J., Koutsiana, E., Massey, J., Thuermer, G., Simperl, E.: Prompting datasets: Data discovery with conversational agents (2023). https:\/\/arxiv.org\/abs\/2312.09947"},{"key":"26_CR38","doi-asserted-by":"crossref","unstructured":"Xiao, S., Liu, Z., Zhang, P., Muennighoff, N.: C-pack: Packaged resources to advance general chinese embedding (2023)","DOI":"10.1145\/3626772.3657878"},{"key":"26_CR39","doi-asserted-by":"publisher","unstructured":"Yu, T., et al.: CoSQL: a conversational text-to-SQL challenge towards cross-domain natural language interfaces to databases. In: Inui, K., Jiang, J., Ng, V., Wan, X. (eds.) Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), pp. 1962\u20131979. Association for Computational Linguistics, Hong Kong, China (Nov 2019). https:\/\/doi.org\/10.18653\/v1\/D19-1204, https:\/\/aclanthology.org\/D19-1204\/","DOI":"10.18653\/v1\/D19-1204"},{"key":"26_CR40","doi-asserted-by":"publisher","unstructured":"Zhang, S., Balog, K.: Semantic table &nbsp;retrieval using keyword and table queries. ACM Trans. Web 15(3) (2021). https:\/\/doi.org\/10.1145\/3441690","DOI":"10.1145\/3441690"},{"key":"26_CR41","doi-asserted-by":"publisher","unstructured":"Zhang, S., Dai, Z., Balog, K., Callan, J.: Summarizing and exploring tabular data in conversational search. In: Proceedings of the 43rd International ACM SIGIR Conference on Research and Development in Information Retrieval, SIGIR 2020, pp. 1537\u20131540. Association for Computing Machinery, New York (2020). https:\/\/doi.org\/10.1145\/3397271.3401205, https:\/\/doi.org\/10.1145\/3397271.3401205","DOI":"10.1145\/3397271.3401205"},{"key":"26_CR42","unstructured":"Zhao, Y., Mero\u00f1o-Pe\u00f1uela, A., Simperl, E.: User experience in dataset search (2024). https:\/\/arxiv.org\/abs\/2403.15861"}],"container-title":["Communications in Computer and Information Science","Computer-Human Interaction Research and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-16451-3_26","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T05:03:46Z","timestamp":1770699826000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-16451-3_26"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9783032164506","9783032164513"],"references-count":42,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-16451-3_26","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"value":"1865-0929","type":"print"},{"value":"1865-0937","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"11 February 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interest"}},{"value":"CHIRA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Computer-Human Interaction Research and Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Marbella","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Spain","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 October 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 October 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"chira2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/chira.scitevents.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}