{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,18]],"date-time":"2025-01-18T05:07:58Z","timestamp":1737176878274,"version":"3.33.0"},"reference-count":38,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100004405","name":"Toyota Motor Corporation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004405","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,15]]},"DOI":"10.1109\/bigdata62323.2024.10825245","type":"proceedings-article","created":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T18:31:23Z","timestamp":1737052283000},"page":"6604-6613","source":"Crossref","is-referenced-by-count":0,"title":["Metadata-less Dataset Recommendation Leveraging Dataset Embeddings by Pre-trained Tabular Language Models"],"prefix":"10.1109","author":[{"given":"Kosuke","family":"Manabe","sequence":"first","affiliation":[{"name":"The University of Tokyo,School of Engineering,Tokyo,Japan"}]},{"given":"Yukihisa","family":"Fujita","sequence":"additional","affiliation":[{"name":"Toyota Motor Corporation,Social System PF Development Division,Tokyo,Japan"}]},{"given":"Masahiro","family":"Kuwahara","sequence":"additional","affiliation":[{"name":"Toyota Motor Corporation,Social System PF Development Division,Tokyo,Japan"}]},{"given":"Teruaki","family":"Hayashi","sequence":"additional","affiliation":[{"name":"The University of Tokyo,School of Engineering,Tokyo,Japan"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.pursup.2016.08.005"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1111\/j.0000-0000.2011.01026.x"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2806881"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3572751.3572755"},{"article-title":"Google dataset search: Building a search engine for datasets in an open web ecosystem","volume-title":"28th Web Conference (WebConf 2019)","author":"Noy","key":"ref5"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-019-00564-x"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/s11036-014-0547-2"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/s10115-022-01751-z"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICOSC.2019.8665522"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3184558.3191602"},{"article-title":"Visually Exploring Data Provenance and Quality of Open Data","volume-title":"EuroVis 2018 - Posters","author":"Bors","key":"ref11"},{"key":"ref12","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-030-62466-8_41","volume-title":"Google Dataset Search by the Numbers","author":"Benjelloun","year":"2020"},{"key":"ref13","first-page":"66","article-title":"Large-scale analysis of query logs to profile users for dataset search","volume-title":"J. Documentation","volume":"79","author":"Sharifpour","year":"2022"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/IntelliSys.2017.8324327"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3375750"},{"key":"ref16","first-page":"59","article-title":"Making open data transparent: Data discovery on open data","volume-title":"IEEE Data Eng. Bull.","volume":"41","author":"Miller","year":"2018"},{"key":"ref17","doi-asserted-by":"crossref","DOI":"10.14778\/3430915.3430921","article-title":"Turl: Table understanding through representation learning","author":"Deng","year":"2020"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.745"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.398"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.270"},{"article-title":"Hytrel: Hypergraph-enhanced tabular data representation learning","year":"2023","author":"Chen","key":"ref21"},{"article-title":"Sotab: The wdc schema.org table annotation benchmark","volume-title":"SemTab@ISWC","author":"Korini","key":"ref22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3331184.3331333"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3178876.3186067"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3366423.3379995"},{"key":"ref26","doi-asserted-by":"crossref","DOI":"10.1145\/2501511.2501516","article-title":"Methods for exploring and mining tables on wikipedia","volume-title":"Proceedings of the ACM SIGKDD Workshop on Interactive Data Exploration and Analytics","author":"Bhagavatula"},{"key":"ref27","first-page":"227","article-title":"Transformers for tabular data representation: A survey of models and applications","volume-title":"Transactions of the Association for Computational Linguistics","volume":"11","author":"Badaro","year":"2023"},{"article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","year":"2019","author":"Devlin","key":"ref28"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"6769","DOI":"10.18653\/v1\/2020.emnlp-main.550","article-title":"Dense passage retrieval for open-domain question answering","volume-title":"Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP)","author":"Karpukhin","year":"2020"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1410"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.552"},{"key":"ref32","first-page":"380","article-title":"Utilizing BERT for aspect-based sentiment analysis via constructing auxiliary sentence","volume-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)","author":"Sun"},{"key":"ref33","first-page":"1597","article-title":"A simple framework for contrastive learning of visual representations","volume-title":"International conference on machine learning","author":"Chen"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300892"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/3588710"},{"key":"ref36","first-page":"512","article-title":"Open domain question answering over tables via dense retrieval","volume-title":"Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies","author":"Herzig"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/2872518.2889386"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/BigData50022.2020.9378077"}],"event":{"name":"2024 IEEE International Conference on Big Data (BigData)","start":{"date-parts":[[2024,12,15]]},"location":"Washington, DC, USA","end":{"date-parts":[[2024,12,18]]}},"container-title":["2024 IEEE International Conference on Big Data (BigData)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10824975\/10824942\/10825245.pdf?arnumber=10825245","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T08:14:01Z","timestamp":1737101641000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10825245\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,15]]},"references-count":38,"URL":"https:\/\/doi.org\/10.1109\/bigdata62323.2024.10825245","relation":{},"subject":[],"published":{"date-parts":[[2024,12,15]]}}}