{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T15:42:28Z","timestamp":1774021348500,"version":"3.50.1"},"reference-count":40,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T00:00:00Z","timestamp":1782864000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,2,24]],"date-time":"2026-02-24T00:00:00Z","timestamp":1771891200000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100000780","name":"European Commission","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100000780","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100018693","name":"Horizon Europe","doi-asserted-by":"publisher","award":["101070122"],"award-info":[{"award-number":["101070122"]}],"id":[{"id":"10.13039\/100018693","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Information Systems"],"published-print":{"date-parts":[[2026,7]]},"DOI":"10.1016\/j.is.2026.102711","type":"journal-article","created":{"date-parts":[[2026,2,24]],"date-time":"2026-02-24T07:44:06Z","timestamp":1771919046000},"page":"102711","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["SMBench: No-code benchmarking of learning-based entity matching"],"prefix":"10.1016","volume":"139","author":[{"given":"Oleh","family":"Astappiev","sequence":"first","affiliation":[]},{"given":"Franziska","family":"Neuhof","sequence":"additional","affiliation":[]},{"given":"Marco","family":"Fisichella","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7298-9431","authenticated-orcid":false,"given":"George","family":"Papadakis","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.is.2026.102711_b1","article-title":"Data matching - concepts and techniques for record linkage, entity resolution, and duplicate detection","author":"Christen","year":"2012"},{"issue":"12","key":"10.1016\/j.is.2026.102711_b2","first-page":"1197","article-title":"Magellan: Toward building entity matching management systems","volume":"9","author":"Konda","year":"2016","journal-title":"PVLDB"},{"issue":"2","key":"10.1016\/j.is.2026.102711_b3","doi-asserted-by":"crossref","first-page":"31:1","DOI":"10.1145\/3377455","article-title":"Blocking and filtering techniques for Entity Resolution: A survey","volume":"53","author":"Papadakis","year":"2021","journal-title":"ACM Comput. Surv."},{"issue":"9","key":"10.1016\/j.is.2026.102711_b4","doi-asserted-by":"crossref","first-page":"1537","DOI":"10.1109\/TKDE.2011.127","article-title":"A survey of indexing techniques for scalable record linkage and deduplication","volume":"24","author":"Christen","year":"2012","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"11","key":"10.1016\/j.is.2026.102711_b5","doi-asserted-by":"crossref","first-page":"2459","DOI":"10.14778\/3476249.3476294","article-title":"Deep learning for blocking in entity matching: A design space exploration","volume":"14","author":"Thirumuruganathan","year":"2021","journal-title":"Proc. VLDB Endow."},{"issue":"6","key":"10.1016\/j.is.2026.102711_b6","doi-asserted-by":"crossref","first-page":"1507","DOI":"10.14778\/3583140.3583163","article-title":"Sparkly: A simple yet surprisingly strong TF\/IDF blocker for entity matching","volume":"16","author":"Paulsen","year":"2023","journal-title":"Proc. VLDB Endow."},{"issue":"5","key":"10.1016\/j.is.2026.102711_b7","doi-asserted-by":"crossref","first-page":"1671","DOI":"10.1007\/s00778-024-00868-7","article-title":"Open benchmark for filtering techniques in Entity Resolution","volume":"33","author":"Neuhof","year":"2024","journal-title":"VLDB J."},{"key":"10.1016\/j.is.2026.102711_b8","series-title":"SIGMOD","first-page":"1149","article-title":"ZeroER: Entity resolution using Zero labeled examples","author":"Wu","year":"2020"},{"key":"10.1016\/j.is.2026.102711_b9","series-title":"IJCAI","first-page":"3665","article-title":"Hierarchical matching network for heterogeneous Entity Resolution","author":"Fu","year":"2020"},{"key":"10.1016\/j.is.2026.102711_b10","series-title":"SIGMOD","first-page":"19","article-title":"Deep learning for entity matching: A design space exploration","author":"Mudgal","year":"2018"},{"issue":"1","key":"10.1016\/j.is.2026.102711_b11","doi-asserted-by":"crossref","first-page":"50","DOI":"10.14778\/3421424.3421431","article-title":"Deep entity matching with pre-trained language models","volume":"14","author":"Li","year":"2020","journal-title":"Proc. VLDB Endow."},{"key":"10.1016\/j.is.2026.102711_b12","series-title":"EDBT","first-page":"463","article-title":"Entity matching with transformer architectures - a step forward in data integration","author":"Brunner","year":"2020"},{"key":"10.1016\/j.is.2026.102711_b13","series-title":"WWW","first-page":"1686","article-title":"GNEM: a generic one-to-set neural entity matching framework","author":"Chen","year":"2020"},{"key":"10.1016\/j.is.2026.102711_b14","article-title":"A critical re-evaluation of benchmark datasets for (deep) learning-based matching algorithms","author":"Papadakis","year":"2024","journal-title":"ICDE"},{"key":"10.1016\/j.is.2026.102711_b15","doi-asserted-by":"crossref","DOI":"10.1016\/j.is.2020.101565","article-title":"Three-dimensional Entity Resolution with JedAI","volume":"93","author":"Papadakis","year":"2020","journal-title":"Inf. Syst."},{"key":"10.1016\/j.is.2026.102711_b16","series-title":"An Introduction to Duplicate Detection","author":"Nauman","year":"2022"},{"issue":"6","key":"10.1016\/j.is.2026.102711_b17","doi-asserted-by":"crossref","first-page":"127:1","DOI":"10.1145\/3418896","article-title":"An overview of end-to-end Entity Resolution for big data","volume":"53","author":"Christophides","year":"2021","journal-title":"ACM Comput. Surv."},{"key":"10.1016\/j.is.2026.102711_b18","doi-asserted-by":"crossref","unstructured":"T. Sagi, A. Gal, O. Barkol, R. Bergman, A. Avram, Multi-source uncertain Entity Resolution at yad vashem: Transforming holocaust victim reports into people, in: Proceedings of the 2016 International Conference on Management of Data, 2016, pp. 807\u2013819.","DOI":"10.1145\/2882903.2903737"},{"key":"10.1016\/j.is.2026.102711_b19","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-031-01878-7","article-title":"The four generations of Entity Resolution","author":"Papadakis","year":"2021"},{"key":"10.1016\/j.is.2026.102711_b20","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-031-79468-1","article-title":"Entity Resolution in the web of data","author":"Christophides","year":"2015"},{"key":"10.1016\/j.is.2026.102711_b21","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1162\/tacl_a_00051","article-title":"Enriching word vectors with subword information","volume":"5","author":"Bojanowski","year":"2017","journal-title":"Trans. Assoc. Comput. Linguist."},{"issue":"3","key":"10.1016\/j.is.2026.102711_b22","doi-asserted-by":"crossref","first-page":"535","DOI":"10.1109\/TBDATA.2019.2921572","article-title":"Billion-scale similarity search with GPUs","volume":"7","author":"Johnson","year":"2021","journal-title":"IEEE Trans. Big Data"},{"issue":"1","key":"10.1016\/j.is.2026.102711_b23","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s10115-007-0114-2","article-title":"Top 10 algorithms in data mining","volume":"14","author":"Wu","year":"2008","journal-title":"Knowl. Inf. Syst."},{"key":"10.1016\/j.is.2026.102711_b24","series-title":"NAACL-HLT","first-page":"4171","article-title":"BERT: pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2019"},{"key":"10.1016\/j.is.2026.102711_b25","series-title":"RoBERTa: A robustly optimized BERT pretraining approach","author":"Liu","year":"2019"},{"key":"10.1016\/j.is.2026.102711_b26","series-title":"DistilBERT, a distilled version of BERT: smaller, faster, cheaper and lighter","author":"Sanh","year":"2019"},{"key":"10.1016\/j.is.2026.102711_b27","series-title":"NeurIPS","first-page":"5754","article-title":"XLNet: Generalized autoregressive pretraining for language understanding","author":"Yang","year":"2019"},{"key":"10.1016\/j.is.2026.102711_b28","series-title":"ICLR","article-title":"ALBERT: a lite BERT for self-supervised learning of language representations","author":"Lan","year":"2020"},{"issue":"1","key":"10.1016\/j.is.2026.102711_b29","doi-asserted-by":"crossref","first-page":"484","DOI":"10.14778\/1920841.1920904","article-title":"Evaluation of Entity Resolution approaches on real-world match problems","volume":"3","author":"K\u00f6pcke","year":"2010","journal-title":"Proc. VLDB Endow."},{"key":"10.1016\/j.is.2026.102711_b30","series-title":"KGCW Co-Located At ESWC","article-title":"Embedding-assisted Entity Resolution for knowledge graphs","author":"Obraczka","year":"2021"},{"issue":"1","key":"10.1016\/j.is.2026.102711_b31","doi-asserted-by":"crossref","first-page":"84:1","DOI":"10.1145\/3588938","article-title":"Unicorn: A unified multi-tasking model for supporting matching tasks in data integration","volume":"1","author":"Tu","year":"2023","journal-title":"Proc. ACM Manag. Data"},{"issue":"4","key":"10.1016\/j.is.2026.102711_b32","doi-asserted-by":"crossref","first-page":"224:1","DOI":"10.1145\/3626711","article-title":"The battleship approach to the low resource entity matching problem","volume":"1","author":"Genossar","year":"2023","journal-title":"Proc. ACM Manag. Data"},{"issue":"4","key":"10.1016\/j.is.2026.102711_b33","doi-asserted-by":"crossref","first-page":"738","DOI":"10.14778\/3574245.3574258","article-title":"Can foundation models wrangle your data?","volume":"16","author":"Narayan","year":"2022","journal-title":"Proc. VLDB Endow."},{"key":"10.1016\/j.is.2026.102711_b34","series-title":"EDBT","first-page":"529","article-title":"Entity matching using large language models","author":"Peeters","year":"2025"},{"key":"10.1016\/j.is.2026.102711_b35","series-title":"COLING","first-page":"96","article-title":"Match, compare, or select? An investigation of large language models for entity matching","author":"Wang","year":"2025"},{"key":"10.1016\/j.is.2026.102711_b36","series-title":"ICDE","first-page":"3696","article-title":"Cost-effective in-context learning for Entity Resolution: A design space exploration","author":"Fan","year":"2024"},{"issue":"4","key":"10.1016\/j.is.2026.102711_b37","doi-asserted-by":"crossref","first-page":"252:1","DOI":"10.1145\/3749170","article-title":"In-context clustering-based Entity Resolution with large language models: A design space exploration","volume":"3","author":"Fu","year":"2025","journal-title":"Proc. ACM Manag. Data"},{"key":"10.1016\/j.is.2026.102711_b38","first-page":"1950","article-title":"The return of JedAI: End-to-end Entity Resolution for structured and semi-structured data","author":"Papadakis","year":"2018","journal-title":"PVLDB"},{"key":"10.1016\/j.is.2026.102711_b39","series-title":"ISWC","article-title":"pyJedAI: a lightsaber for link discovery","author":"Nikoletos","year":"2022"},{"issue":"9","key":"10.1016\/j.is.2026.102711_b40","doi-asserted-by":"crossref","first-page":"2225","DOI":"10.14778\/3598581.3598594","article-title":"Pre-trained embeddings for Entity Resolution: An experimental analysis","volume":"16","author":"Zeakis","year":"2023","journal-title":"Proc. VLDB Endow."}],"container-title":["Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0306437926000256?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0306437926000256?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T14:42:58Z","timestamp":1774017778000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0306437926000256"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,7]]},"references-count":40,"alternative-id":["S0306437926000256"],"URL":"https:\/\/doi.org\/10.1016\/j.is.2026.102711","relation":{},"ISSN":["0306-4379"],"issn-type":[{"value":"0306-4379","type":"print"}],"subject":[],"published":{"date-parts":[[2026,7]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"SMBench: No-code benchmarking of learning-based entity matching","name":"articletitle","label":"Article Title"},{"value":"Information Systems","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.is.2026.102711","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 The Authors. Published by Elsevier Ltd.","name":"copyright","label":"Copyright"}],"article-number":"102711"}}