{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,8]],"date-time":"2026-02-08T05:58:25Z","timestamp":1770530305246,"version":"3.49.0"},"publisher-location":"Cham","reference-count":38,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030824716","type":"print"},{"value":"9783030824723","type":"electronic"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-82472-3_19","type":"book-chapter","created":{"date-parts":[[2021,8,15]],"date-time":"2021-08-15T23:03:01Z","timestamp":1629068581000},"page":"260-274","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":20,"title":["SMAT: An Attention-Based Deep Learning Solution to the Automation of Schema Matching"],"prefix":"10.1007","author":[{"given":"Jing","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bonggun","family":"Shin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jinho D.","family":"Choi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Joyce C.","family":"Ho","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,8,16]]},"reference":[{"issue":"1\u20132","key":"19_CR1","doi-asserted-by":"publisher","first-page":"81","DOI":"10.14778\/1920841.1920857","volume":"3","author":"B Alexe","year":"2010","unstructured":"Alexe, B., Hern\u00e1ndez, M., Popa, L., Tan, W.C.: Mapmerge: correlating independent schema mappings. Proc. VLDB Endow. 3(1\u20132), 81\u201392 (2010)","journal-title":"Proc. VLDB Endow."},{"key":"19_CR2","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9781139060158","volume-title":"Foundations of Data Exchange","author":"M Arenas","year":"2014","unstructured":"Arenas, M., Barcel\u00f3, P., Libkin, L., Murlak, F.: Foundations of Data Exchange. Cambridge University Press, Cambridge (2014)"},{"key":"19_CR3","doi-asserted-by":"publisher","unstructured":"Atzeni, P., Bellomarini, L., Papotti, P., Torlone, R.: Meta-mappings for schema mapping reuse. Proc. VLDB Endow. 12(5), 557\u2013569 (2019). https:\/\/doi.org\/10.14778\/3303753.3303761","DOI":"10.14778\/3303753.3303761"},{"key":"19_CR4","doi-asserted-by":"crossref","unstructured":"Cappuzzo, R., Papotti, P., Thirumuruganathan, S.: Creating embeddings of heterogeneous relational datasets for data integration tasks. In: Proceedings of SIGMOD, pp. 1335\u20131349 (2020)","DOI":"10.1145\/3318464.3389742"},{"key":"19_CR5","doi-asserted-by":"crossref","unstructured":"Ten Cate, B., Kolaitis, P.G., Qian, K., Tan, W.C.: Active learning of GAV schema mappings. In: Proceedings of SIGMOD\/PODS, pp. 355\u2013368 (2018)","DOI":"10.1145\/3196959.3196974"},{"issue":"2","key":"19_CR6","first-page":"10","volume":"41","author":"C Chen","year":"2018","unstructured":"Chen, C., Golshan, B., Halevy, A.Y., Tan, W.C., Doan, A.: Biggorilla: an open-source ecosystem for data preparation and integration. IEEE Data Eng. Bull. 41(2), 10\u201322 (2018)","journal-title":"IEEE Data Eng. Bull."},{"key":"19_CR7","unstructured":"Centers for medicare & medicaid services (cms). https:\/\/www.cms.gov\/OpenPayments\/Explore-the-Data\/Data-Overview.html"},{"key":"19_CR8","doi-asserted-by":"crossref","unstructured":"Conneau, A., Kiela, D., Schwenk, H., Barrault, L., Bordes, A.: Supervised learning of universal sentence representations from natural language inference data. In: Proceedings of EMNLP, pp. 670\u2013680 (2017)","DOI":"10.18653\/v1\/D17-1070"},{"key":"19_CR9","doi-asserted-by":"crossref","unstructured":"Cui, Y., Chen, Z., Wei, S., Wang, S., Liu, T., Hu, G.: Attention-over-attention neural networks for reading comprehension. In: Proceedings of ACL (2017)","DOI":"10.18653\/v1\/P17-1055"},{"key":"19_CR10","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: Bert: pre-training of deep bidirectional transformers for language understanding. In: Proceedings of of NAACL-HLT, pp. 4171\u20134186 (2019)"},{"key":"19_CR11","doi-asserted-by":"crossref","unstructured":"Do, H.H., Rahm, E.: Coma\u2013a system for flexible combination of schema matching approaches. In: Proceedings of VLDB, pp. 610\u2013621 (2002)","DOI":"10.1016\/B978-155860869-6\/50060-3"},{"issue":"6","key":"19_CR12","doi-asserted-by":"publisher","first-page":"1367","DOI":"10.1109\/TPAMI.2018.2832629","volume":"41","author":"Q Dong","year":"2019","unstructured":"Dong, Q., Gong, S., Zhu, X.: Imbalanced deep learning by minority class incremental rectification. IEEE Trans. Pattern Analy. Mach. Intell. 41(6), 1367\u20131381 (2019). https:\/\/doi.org\/10.1109\/TPAMI.2018.2832629","journal-title":"IEEE Trans. Pattern Analy. Mach. Intell."},{"key":"19_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"198","DOI":"10.1007\/978-3-642-02463-4_12","volume-title":"Conceptual Modeling: Foundations and Applications","author":"R Fagin","year":"2009","unstructured":"Fagin, R., Haas, L.M., Hern\u00e1ndez, M., Miller, R.J., Popa, L., Velegrakis, Y.: Clio: schema mapping creation and data exchange. In: Borgida, A.T., Chaudhri, V.K., Giorgini, P., Yu, E.S. (eds.) Conceptual Modeling: Foundations and Applications. LNCS, vol. 5600, pp. 198\u2013236. Springer, Heidelberg (2009). https:\/\/doi.org\/10.1007\/978-3-642-02463-4_12"},{"key":"19_CR14","doi-asserted-by":"crossref","unstructured":"Fagin, R., Kolaitis, P.G., Popa, L., Tan, W.C.: Schema mapping evolution through composition and inversion. In: Schema Matching and Mapping, pp. 191\u2013222. Springer (2011)","DOI":"10.1007\/978-3-642-16518-4_7"},{"key":"19_CR15","unstructured":"Fernandez, R.C., et al.: Seeping semantics: linking datasets using word embeddings for data discovery. In: Proceedings of ICDE, pp. 989\u20131000 (2018)"},{"issue":"1","key":"19_CR16","doi-asserted-by":"publisher","first-page":"1","DOI":"10.2200\/S00337ED1V01Y201102DTM013","volume":"3","author":"A Gal","year":"2011","unstructured":"Gal, A.: Uncertain schema matching. Synth. Lect. Data Manag. 3(1), 1\u201397 (2011)","journal-title":"Synth. Lect. Data Manag."},{"key":"19_CR17","unstructured":"Gal, A., Roitman, H., Shraga, R.: Learning to rerank schema matches. IEEE Trans. Knowl. Data Eng. (2019)"},{"key":"19_CR18","doi-asserted-by":"crossref","unstructured":"Halevy, A., Nemes, E., Dong, X., Madhavan, J., Zhang, J.: Similarity search for web services. In: Proceedings of the 30th VLDB Conference, pp. 372\u2013383 (2004)","DOI":"10.1016\/B978-012088469-8.50035-8"},{"key":"19_CR19","unstructured":"Han, L., Kashyap, A.L., Finin, T., Mayfield, J., Weese, J.: Umbc\\_ebiquity-core: semantic textual similarity systems. In: Second Joint Conference on Lexical and Computational Semantics (* SEM), Volume 1: Proceedings of the Main Conference and the Shared Task: Semantic Textual Similarity, pp. 44\u201352 (2013)"},{"key":"19_CR20","doi-asserted-by":"crossref","unstructured":"He, B., Chang, K.C.C.: Statistical schema matching across web query interfaces. In: Proceedings of SIGMOD, pp. 217\u2013228 (2003)","DOI":"10.1145\/872757.872784"},{"key":"19_CR21","unstructured":"Hernandez, M., Ho, H., Naumann, F., Popa, L.: Clio: a schema mapping tool for information integration. In: 8th International Symposium on Parallel Architectures, Algorithms and Networks (ISPAN 2005), p. 1. IEEE (2005)"},{"key":"19_CR22","doi-asserted-by":"crossref","unstructured":"Johnson, A.E., et al.: Mimic-iii, a freely accessible critical care database. Sci. Data 3, 160035 (2016)","DOI":"10.1038\/sdata.2016.35"},{"key":"19_CR23","doi-asserted-by":"crossref","unstructured":"Kettouch, M.S., Luca, C., Hobbs, M., Dascalu, S.: Using semantic similarity for schema matching of semi-structured and linked data. In: 2017 Internet Technologies and Applications (ITA), pp. 128\u2013133. IEEE (2017)","DOI":"10.1109\/ITECHA.2017.8101923"},{"key":"19_CR24","doi-asserted-by":"crossref","unstructured":"Kolyvakis, P., Kalousis, A., Kiritsis, D.: Deepalignment: unsupervised ontology matching with refined word vectors. In: Proceedings of NAACL-HLT, pp. 787\u2013798 (2018)","DOI":"10.18653\/v1\/N18-1072"},{"key":"19_CR25","unstructured":"Koutras, C., Fragkoulis, M., Katsifodimos, A., Lofi, C.: Rema: graph embeddings-based relational schema matching. In: EDBT\/ICDT Workshops (2020)"},{"key":"19_CR26","doi-asserted-by":"crossref","unstructured":"Li, Y., Li, J., Suhara, Y., Doan, A., Tan, W.C.: Deep entity matching with pre-trained language models. arXiv preprint arXiv:2004.00584 (2020)","DOI":"10.14778\/3421424.3421431"},{"key":"19_CR27","unstructured":"Liu, Y., et al.: Roberta: A robustly optimized bert pretraining approach. arXiv preprint arXiv:1907.11692 (2019)"},{"key":"19_CR28","series-title":"Studies in Big Data","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1007\/978-3-319-61893-7_12","volume-title":"A Comprehensive Guide Through the Italian Database Research Over the Last 25 Years","author":"G Mecca","year":"2018","unstructured":"Mecca, G., Papotti, P., Santoro, D.: Schema mappings: from data translation to data cleaning. In: Flesca, S., Greco, S., Masciari, E., Sacc\u00e0, D. (eds.) A Comprehensive Guide Through the Italian Database Research Over the Last 25 Years. SBD, vol. 31, pp. 203\u2013217. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-319-61893-7_12"},{"key":"19_CR29","doi-asserted-by":"crossref","unstructured":"Mudgal, S., Kumar, S.: Deep learning for entity matching: A design space exploration. Tech. rep. (2018)","DOI":"10.1145\/3183713.3196926"},{"key":"19_CR30","unstructured":"Nguyen, Q.V.H., Weidlich, M., Nguyen, T.T., Mikl\u00f3s, Z., Aberer, K., Gal, A.: Reconciling matching networks of conceptual models. Tech. rep. (2019)"},{"key":"19_CR31","unstructured":"Observational Health Data Sciences and Informatics: The book of OHDSI. Independently published (2019)"},{"key":"19_CR32","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C.: Glove: global vectors for word representation. In: Proceedings of EMNLP, pp. 1532\u20131543 (2014)","DOI":"10.3115\/v1\/D14-1162"},{"key":"19_CR33","doi-asserted-by":"crossref","unstructured":"Rahm, E., Bernstein, P.A.: A survey of approaches to automatic schema matching. VLDB J. 10(4), 334\u2013350 (2001)","DOI":"10.1007\/s007780100057"},{"key":"19_CR34","doi-asserted-by":"crossref","unstructured":"Sennrich, R., Haddow, B., Birch, A.: Neural machine translation of rare words with subword units. arXiv preprint arXiv:1508.07909 (2015)","DOI":"10.18653\/v1\/P16-1162"},{"issue":"9","key":"19_CR35","doi-asserted-by":"publisher","first-page":"1401","DOI":"10.14778\/3397230.3397237","volume":"13","author":"R Shraga","year":"2020","unstructured":"Shraga, R., Gal, A., Roitman, H.: Adnev: cross-domain schema matching using deep similarity matrix adjustment and evaluation. Proc. VLDB 13(9), 1401\u20131415 (2020)","journal-title":"Proc. VLDB"},{"key":"19_CR36","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"336","DOI":"10.1007\/978-3-319-92013-9_29","volume-title":"Databases Theory and Applications","author":"NT Toan","year":"2018","unstructured":"Toan, N.T., Cong, P.T., Thang, D.C., Hung, N.Q.V., Stantic, B.: Bootstrapping uncertainty in schema covering. In: Wang, J., Cong, G., Chen, J., Qi, J. (eds.) ADC 2018. LNCS, vol. 10837, pp. 336\u2013342. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-319-92013-9_29"},{"key":"19_CR37","unstructured":"Walonoski, J., et al.: Synthea: An approach, method, and software mechanism for generating synthetic patients and the synthetic electronic health care record. J. Am. Med. Inform. Assoc. 25(3), 230\u2013238 (2017)"},{"key":"19_CR38","doi-asserted-by":"crossref","unstructured":"Wu, W., Yu, C., Doan, A., Meng, W.: An interactive clustering-based approach to integrating source query interfaces on the deep web. In: Proceedings of SIGMOD, pp. 95\u2013106 (2004)","DOI":"10.1145\/1007568.1007582"}],"container-title":["Lecture Notes in Computer Science","Advances in Databases and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-82472-3_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,7]],"date-time":"2023-01-07T11:50:58Z","timestamp":1673092258000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-82472-3_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030824716","9783030824723"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-82472-3_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"16 August 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ADBIS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Advances in Databases and Information Systems","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Tartu","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Estonia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24 August 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 August 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"adbis2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/adbis2021.cs.ut.ee\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"70","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"18","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"26% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Workshops: submissions: 17, papers accepted: DOING 2021: 3, SIMPDA 2021: 1, MADEISD 2021: 4, MegaData 2021: 1, CAoNS 2021: 2","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}