{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,18]],"date-time":"2025-01-18T05:07:23Z","timestamp":1737176843891,"version":"3.33.0"},"reference-count":27,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,15]]},"DOI":"10.1109\/bigdata62323.2024.10826033","type":"proceedings-article","created":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T18:31:23Z","timestamp":1737052283000},"page":"6564-6573","source":"Crossref","is-referenced-by-count":0,"title":["Inferring Relationships between Tabular Data and Topics using LLM for a Dataset Search Task"],"prefix":"10.1109","author":[{"given":"Yukihisa","family":"Fujita","sequence":"first","affiliation":[{"name":"Toyota Motor Corporation,Social System PF Development Division,Tokyo,Japan"}]},{"given":"Teruaki","family":"Hayashi","sequence":"additional","affiliation":[{"name":"The University of Tokyo,Graduate School of Engineering,Tokyo,Japan"}]},{"given":"Masahiro","family":"Kuwahara","sequence":"additional","affiliation":[{"name":"Toyota Motor Corporation,Social System PF Development Division,Tokyo,Japan"}]}],"member":"263","reference":[{"key":"ref1","first-page":"113766","article-title":"Enhancing credit scoring with alternative data","volume-title":"Expert Systems with Applications","volume":"163","author":"Djeundje","year":"2021"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-019-00564-x"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3308558.3313685"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.14778\/3476311.3476346"},{"key":"ref5","first-page":"5629","article-title":"Topic-Based Search: Dataset search without metadata and users\u2019 knowledge about data","volume-title":"2023 IEEE International Conference on Big Data (BigData)","author":"Fujita"},{"key":"ref6","article-title":"MNIST handwritten digit database","volume-title":"ATT Labs","volume":"2","author":"LeCun","year":"2010"},{"article-title":"Overview of the NTCIR-15 data search task","volume-title":"Proceedings of the 15th NTCIR Conference on Evaluation of Information Access Technologies","author":"Kato","key":"ref7"},{"article-title":"Overview of the NTCIR-16 data search 2 task","volume-title":"Proceedings of the 16th NTCIR Conference on Evaluation of Information Access Technologies","author":"Kato","key":"ref8"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3477495.3531729"},{"key":"ref10","first-page":"39","article-title":"Benchmarking large language models for news summarization","volume-title":"Transactions of the Association for Computational Linguistics","volume":"12","author":"Zhang","year":"2024"},{"key":"ref11","first-page":"111734","article-title":"GitHub Copilot AI pair programmer: Asset or Liability?","volume-title":"Journal of Systems and Software","volume":"203","author":"Dakhel","year":"2023"},{"key":"ref12","first-page":"41092","article-title":"Prompting large language model for machine translation: a case study","volume-title":"Proceedings of the 40th International Conference on Machine Learning","volume":"202","author":"Zhang"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.2305016120"},{"key":"ref14","article-title":"Personalized Web search challenge","volume-title":"Kaggle","author":"Eugene","year":"2013"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3589335.3648327"},{"key":"ref16","first-page":"575","article-title":"Search4Code: Code Search Intent Classification Using Weak Supervision","volume-title":"2021 IEEE\/ACM 18th International Conference on Mining Software Repositories (MSR)","author":"Rao"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3626772.3661384"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/3331184.3331333"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.14778\/3430915.3430921"},{"key":"ref20","first-page":"3446","article-title":"TABBIE: Pretrained representations of tabular data","volume-title":"Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies","author":"Iida"},{"key":"ref21","doi-asserted-by":"crossref","first-page":"281","DOI":"10.18653\/v1\/2020.findings-emnlp.27","article-title":"Understanding tables with intermediate pre-training","volume-title":"Findings of the Association for Computational Linguistics: EMNLP 2020","author":"Eisenschlos","year":"2020"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref23","doi-asserted-by":"crossref","DOI":"10.18653\/v1\/2024.findings-emnlp.603","article-title":"TAP4LLM: Table provider on sampling, augmenting, and packing semi-structured data for large language model reasoning","author":"Sui","year":"2024"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3025453.3025838"},{"key":"ref25","first-page":"1877","article-title":"Language models are few-shot learners","volume-title":"Proceedings of the 34th International Conference on Neural Information Processing Systems","author":"Brown"},{"key":"ref26","first-page":"24824","article-title":"Chain-of-thought prompting elicits reasoning in large language models","volume-title":"Proceedings of the 36th International Conference on Neural Information Processing Systems","author":"Wei"},{"year":"2020","key":"ref27","article-title":"pandas-dev\/pandas: Pandas"}],"event":{"name":"2024 IEEE International Conference on Big Data (BigData)","start":{"date-parts":[[2024,12,15]]},"location":"Washington, DC, USA","end":{"date-parts":[[2024,12,18]]}},"container-title":["2024 IEEE International Conference on Big Data (BigData)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10824975\/10824942\/10826033.pdf?arnumber=10826033","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T07:48:59Z","timestamp":1737100139000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10826033\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,15]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/bigdata62323.2024.10826033","relation":{},"subject":[],"published":{"date-parts":[[2024,12,15]]}}}