{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,29]],"date-time":"2026-06-29T17:48:22Z","timestamp":1782755302901,"version":"3.54.5"},"reference-count":20,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2025,1,31]],"date-time":"2025-01-31T00:00:00Z","timestamp":1738281600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,31]],"date-time":"2025-01-31T00:00:00Z","timestamp":1738281600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100004586","name":"FAPERJ","doi-asserted-by":"crossref","award":["E-26\/202.818\/2017"],"award-info":[{"award-number":["E-26\/202.818\/2017"]}],"id":[{"id":"10.13039\/501100004586","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100002322","name":"CAPES","doi-asserted-by":"crossref","award":["88881.310592-2018\/01 and 88881.134081\/2016-01 and 88882.164913\/2010- 01"],"award-info":[{"award-number":["88881.310592-2018\/01 and 88881.134081\/2016-01 and 88882.164913\/2010- 01"]}],"id":[{"id":"10.13039\/501100002322","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100003593","name":"CNPq","doi-asserted-by":"crossref","award":["302303\/2017-0"],"award-info":[{"award-number":["302303\/2017-0"]}],"id":[{"id":"10.13039\/501100003593","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SN COMPUT. SCI."],"DOI":"10.1007\/s42979-025-03662-6","type":"journal-article","created":{"date-parts":[[2025,1,31]],"date-time":"2025-01-31T14:45:21Z","timestamp":1738334721000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":13,"title":["LLM-Based Text-to-SQL for Real-World Databases"],"prefix":"10.1007","volume":"6","author":[{"given":"Eduardo R.","family":"Nascimento","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Grettel","family":"Garc\u00eda","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yenier T.","family":"Izquierdo","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Lucas","family":"Feij\u00f3","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Gustavo M. C.","family":"Coelho","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Aiko R.","family":"de Oliveira","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Melissa","family":"Lemos","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Robinson L. S.","family":"Garcia","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Luiz A. P. Paes","family":"Leme","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0765-9636","authenticated-orcid":false,"given":"Marco A.","family":"Casanova","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,1,31]]},"reference":[{"issue":"4","key":"3662_CR1","doi-asserted-by":"publisher","first-page":"905","DOI":"10.1007\/s00778-022-00776-8","volume":"32","author":"G Katsogiannis-Meimarakis","year":"2023","unstructured":"Katsogiannis-Meimarakis G, Koutrika G. A survey on deep learning approaches for text-to-SQL. VLDB J. 2023;32(4):905\u201336. https:\/\/doi.org\/10.1007\/s00778-022-00776-8.","journal-title":"VLDB J"},{"issue":"10","key":"3662_CR2","doi-asserted-by":"publisher","first-page":"1737","DOI":"10.1007\/s00778-022-00776-8","volume":"13","author":"H Kim","year":"2020","unstructured":"Kim H, So B-H, Han W-S, Lee H. Natural language to SQL: where are we today? Proc VLDB Endow. 2020;13(10):1737\u20131750. https:\/\/doi.org\/10.14778\/3401960.3401970","journal-title":"Proc VLDB Endow"},{"key":"3662_CR3","doi-asserted-by":"publisher","first-page":"793","DOI":"10.1007\/s00778-019-00567-8","volume":"28","author":"K Affolter","year":"2019","unstructured":"Affolter K, Stockinger K, Bernstein A. A comparative survey of recent natural language interfaces for databases. VLDB J. 2019;28:793\u2013819. https:\/\/doi.org\/10.1007\/s00778-019-00567-8.","journal-title":"VLDB J"},{"key":"3662_CR4","doi-asserted-by":"publisher","unstructured":"Yu T, Zhang R, Yang K, Yasunaga M, Wang D, Li Z, Ma J, Li I, Yao Q, Roman S, Zhang Z, Radev D. Spider: alarge-scale human-labeled dataset for complex and cross-domain semantic parsing and text-to-sql task. In: Riloff E, Chiang D, Hockenmaier J, Tsujii J, editors. Proceedings of 2018 conference on empirical methods in natural language processing. Brussels, Belgium: Association for Computational Linguistics; 2018. pp. 3911\u20133921. https:\/\/doi.org\/10.18653\/v1\/D18-1425; https:\/\/aclanthology.org\/D18-1425.","DOI":"10.18653\/v1\/D18-1425"},{"key":"3662_CR5","unstructured":"Li J, Hui B, Qu G, Yang J, Li B, Li B, Wang B, Qin B, Geng R, Huo N, Zhou X, Ma C, Li G, Chang K, Huang F, Cheng R, Li Y. Can llm already serve as a database interface? A big bench for large-scale database grounded text-to-sqls. In: Proceedings of the 37th international conference on neural information processing systems. NIPS \u201923. Curran Associates Inc., Red Hook, NY, USA.  2024."},{"issue":"5","key":"3662_CR6","doi-asserted-by":"publisher","first-page":"521","DOI":"10.5753\/jidm.2021.1904","volume":"12","author":"YT Izquierdo","year":"2021","unstructured":"Izquierdo YT, Garc\u00eda GM, Lemos M, Novello A, Novelli B, Damasceno C, Leme LAPP, Casanova MA. A platform for keyword search and its application for COVID-19 pandemic data. J Inf Data Manag. 2021;12(5):521\u201335. https:\/\/doi.org\/10.5753\/jidm.2021.1904.","journal-title":"J Inf Data Manag"},{"key":"3662_CR7","unstructured":"Nascimento ER, Casanova MA, Leme LAPP, Garc\u00eda GM, Lemos M, Izquierdo YT, Garcia R, Victorio W. A family of natural language interfaces for databases based on chatgpt and langchain (short paper). In: Companion proceedings of the 42nd international conference on conceptual modeling: posters and demos co-located with ER 2023, Lisbon, Portugal, November 06\u201309, 2023. CEUR Workshop Proceedings, vol. 3618. 2023. https:\/\/ceur-ws.org\/Vol-3618\/pd_paper_1.pdf."},{"key":"3662_CR8","doi-asserted-by":"publisher","unstructured":"Dong X, Zhang C, Ge Y, Mao Y, Gao Y, Chen L, Lin J, Lou D. C3: zero-shot text-to-SQL with chatgpt. arXiv preprint. 2023. https:\/\/doi.org\/10.48550\/arXiv.2307.07306.","DOI":"10.48550\/arXiv.2307.07306"},{"key":"3662_CR9","unstructured":"Pourreza M, Rafiei D. DIN-SQL: decomposed in-context learning of text-to-SQL with self-correction. In: Proceedings of the 37th international conference on neural information processing systems. NIPS \u201923. Curran Associates Inc., Red Hook, NY, USA.  2024."},{"key":"3662_CR10","doi-asserted-by":"publisher","unstructured":"Nascimento ERS, Garcia GM, Feij\u00f3 L, Victorio W, Izquierdo YT, Oliveira A, Coelho GMC, Lemos M, Garcia RLS, Leme LAPP, Casanova MA. Text-to-SQL meets the real-world. In: Proceedings of the 26th international conference on enterprise information systems, vol. 1. ICEIS. SciTePress, Set\u00fabal, Portugal. 2024. pp. 61\u201372. INSTICC. https:\/\/doi.org\/10.5220\/0012555200003690.","DOI":"10.5220\/0012555200003690"},{"key":"3662_CR11","doi-asserted-by":"publisher","unstructured":"Nascimento ERS, Izquierdo YT, Garcia GM, Coelho G, Feij\u00f3 L, Lemos M, Leme LAPP, Casanova MA. My database user is a large language model. In: Proceedings of the 26th international conference on enterprise information systems, vol. 1. ICEIS. SciTePress, Set\u00fabal, Portugal. 2024. pp. 800\u2013806. INSTICC. https:\/\/doi.org\/10.5220\/0012697700003690.","DOI":"10.5220\/0012697700003690"},{"key":"3662_CR12","doi-asserted-by":"publisher","unstructured":"Zhong V, Xiong C Socher R. SEQ2SQL: generating structured queries from natural language using reinforcement learning. arXiv preprint. 2017. https:\/\/doi.org\/10.48550\/arXiv.1709.00103.","DOI":"10.48550\/arXiv.1709.00103"},{"key":"3662_CR13","doi-asserted-by":"crossref","unstructured":"Guo J, Si Z, Wang Y, Liu Q, Fan M, Lou J-G, Yang Z, Liu T Chase: a large-scale and pragmatic chinese dataset for cross-database context-dependent text-to-SQL. In: Proceedings of the 59th annual meeting of the association for computational linguistics and the 11th international joint conference on natural language processing.  2021. pp. 2316\u20132331. https:\/\/aclanthology.org\/2021.acl-long.180.","DOI":"10.18653\/v1\/2021.acl-long.180"},{"key":"3662_CR14","unstructured":"Ping WJ. Open-sourcing SQLEval: our framework for evaluating LLM-generated SQL. 2023. https:\/\/defog.ai\/blog\/open-sourcing-sqleval\/."},{"key":"3662_CR15","doi-asserted-by":"publisher","unstructured":"Gao D, Wang H, Li Y, Sun X, Qian Y, Ding B, Zhou J. Text-to-SQL empowered by large language models: a benchmark evaluation. arXiv preprint. 2023. https:\/\/doi.org\/10.48550\/arXiv:2308.15363.","DOI":"10.48550\/arXiv:2308.15363"},{"key":"3662_CR16","doi-asserted-by":"publisher","unstructured":"Izquierdo YT, Garc\u00eda GM, Menendez ES, Casanova MA, Dartayre F, Levy CH. QUIOW: a keyword-based query processing tool for rdf datasets and relational databases. In: Hartmann S, Ma H, Hameurlain A, Pernul G, Wagner RR, editors. International conference on database and expert systems applications (DEXA). Springer, Cham.  2018. pp. 259\u2013269. https:\/\/doi.org\/10.1007\/978-3-319-98812-2_22.","DOI":"10.1007\/978-3-319-98812-2_22"},{"key":"3662_CR17","doi-asserted-by":"publisher","unstructured":"Garc\u00eda GM, Izquierdo YT, Menendez E, Dartayre F, Casanova MA. RDF keyword-based query technology meets a real-world dataset. In: Proceedings of the 20th international conference on extending database technology (EDBT). OpenProceedings.org, Venice, Italy. 2017. pp. 656\u2013667. https:\/\/doi.org\/10.5441\/002\/edbt.2017.86.","DOI":"10.5441\/002\/edbt.2017.86"},{"key":"3662_CR18","doi-asserted-by":"publisher","unstructured":"Wei J, Wang X, Schuurmans D, Bosma M, Ichter B, Xia F, Chi E, Le Q, Zhou D. Chain-of-thought prompting elicits reasoning in large language models. arXiv preprint. 2023. https:\/\/doi.org\/10.48550\/arXiv.2310.12516.","DOI":"10.48550\/arXiv.2310.12516"},{"key":"3662_CR19","doi-asserted-by":"publisher","unstructured":"Yu X, Cheng H, Liu X, Roth D, Gao J Automatic hallucination assessment for aligned large language models via transferable adversarial attacks. arXiv preprint. 2023. https:\/\/doi.org\/10.48550\/arXiv:2310.12516.","DOI":"10.48550\/arXiv:2310.12516"},{"key":"3662_CR20","unstructured":"Lewis P, Perez E, Piktus A, Petroni F, Karpukhin V, Goyal N, K\u00fcttler H, Lewis M, Yih W-T, Rockt\u00e4schel T, Riedel S, Kiela D. Retrieval-augmented generation for knowledge-intensive NLP tasks. In: Larochelle H, Ranzato M, Hadsell R, Balcan M, Lin H, editors. Advances in neural information processing systems, vol. 33. Curran Associates, Inc., Red Hook, NY, USA, 2020. pp. 9459\u20139474.  https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2020\/file\/6b493230205f780e1bc26945df7481e5-Paper.pdf."}],"container-title":["SN Computer Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42979-025-03662-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s42979-025-03662-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42979-025-03662-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,31]],"date-time":"2025-01-31T14:45:32Z","timestamp":1738334732000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s42979-025-03662-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,1,31]]},"references-count":20,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2025,2]]}},"alternative-id":["3662"],"URL":"https:\/\/doi.org\/10.1007\/s42979-025-03662-6","relation":{},"ISSN":["2661-8907"],"issn-type":[{"value":"2661-8907","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,1,31]]},"assertion":[{"value":"5 October 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 December 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"31 January 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"On behalf of all authors, the corresponding author states that there is no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Research involving humans and\/or animals"}},{"value":"Not applicable.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Informed consent"}}],"article-number":"130"}}