{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,10]],"date-time":"2026-05-10T10:16:29Z","timestamp":1778408189434,"version":"3.51.4"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,12,1]],"date-time":"2019-12-01T00:00:00Z","timestamp":1575158400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1109\/bigdata47090.2019.9006095","type":"proceedings-article","created":{"date-parts":[[2020,2,25]],"date-time":"2020-02-25T01:05:34Z","timestamp":1582592734000},"page":"623-630","source":"Crossref","is-referenced-by-count":13,"title":["Fast Record Linkage for Company Entities"],"prefix":"10.1109","author":[{"given":"Thomas","family":"Gschwind","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christoph","family":"Miksovic","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Julian","family":"Minder","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Katsiaryna","family":"Mirylenka","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Paolo","family":"Scotton","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref32","year":"2019","journal-title":"The Unicode Standard"},{"key":"ref31","year":"0","journal-title":"Solr"},{"key":"ref30","year":"0","journal-title":"What is a SIC code?"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.14778\/2367502.2367564"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2016.09.306"},{"key":"ref12","article-title":"Record linkage: Current practice and future directions","volume":"3","author":"gu","year":"2003","journal-title":"CSIRO Mathematical and Information Sciences Technical Report"},{"key":"ref13","article-title":"Bidirectional LSTM-CRF models for sequence tagging","volume":"abs 1508 1991","author":"huang","year":"2015","journal-title":"CoRR"},{"key":"ref14","year":"0","journal-title":"IBM Watson Natural Language Understanding"},{"key":"ref15","author":"inman","year":"1835","journal-title":"Navigation and Nautical Astronomy for the Use of British Seamen"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.14778\/3007263.3007314"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.14778\/3311880.3311883"},{"key":"ref18","first-page":"282","article-title":"Conditional random fields: Probabilistic models for segmenting and labeling sequence data","author":"lafferty","year":"2001","journal-title":"Proc of the International Conference on Machine Learning (ICML)"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781139924801"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1186\/1472-6947-13-64"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/276698.276781"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3132847.3132949"},{"key":"ref3","first-page":"21","article-title":"On the resemblance and containment of documents","author":"broder","year":"1997","journal-title":"Proc Compression and Complexity of Sequences 1997"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/509961.509965"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.4086\/toc.2012.v008a014"},{"key":"ref5","author":"charikar","year":"2001","journal-title":"Methods and apparatus for estimating similarity"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.2307\/2286061"},{"key":"ref7","article-title":"Record linkage: A machine learning approach, a toolbox, and a digital government web service","author":"elfeky","year":"2003","journal-title":"Technical Report 1573 Purdue University"},{"key":"ref2","first-page":"71","article-title":"Big data integration for product specifications","volume":"41","author":"barbosa","year":"2018","journal-title":"IEEE Data Engineering Bulletin"},{"key":"ref9","year":"0","journal-title":"GeoNames"},{"key":"ref1","first-page":"722","article-title":"DBpedia: A nucleus for a web of open data","author":"auer","year":"2007","journal-title":"6th International Semantic Web Conference and 2nd Asian Semantic Web Conference"},{"key":"ref20","first-page":"610","article-title":"Improving company recognition from unstructured text by using dictionaries","author":"loster","year":"2017","journal-title":"Proc Int Conf on Extending Database Technology (EDBT)"},{"key":"ref22","first-page":"29","article-title":"Recurrent neural networks for modeling company-product time series","author":"mirylenka","year":"2016","journal-title":"Proceedings of 2nd ECML\/PKDD Workshop on Advanced Analytics and Learning on Temporal Data (AALTD)"},{"key":"ref21","article-title":"Applicability of latent dirichlet allocation for company modeling","author":"mirylenka","year":"2016","journal-title":"Industrial Conference on Data Mining (ICDM)"},{"key":"ref24","first-page":"468","article-title":"Hidden layer models for company representations and product recommendations","author":"mirylenka","year":"2019","journal-title":"Proceedings of the International Conference on Extending Database Technology Advances in Database Technology (EDBT)"},{"key":"ref23","article-title":"Linking IT product records","author":"mirylenka","year":"2019","journal-title":"In Proceedings of the Data Integration and Applications Workshop (DINA)"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3183713.3196926"},{"key":"ref25","author":"mirylenka","year":"2018","journal-title":"Similarity matching system for record linkage"}],"event":{"name":"2019 IEEE International Conference on Big Data (Big Data)","location":"Los Angeles, CA, USA","start":{"date-parts":[[2019,12,9]]},"end":{"date-parts":[[2019,12,12]]}},"container-title":["2019 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8986695\/9005444\/09006095.pdf?arnumber=9006095","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,17]],"date-time":"2022-07-17T17:46:56Z","timestamp":1658080016000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9006095\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,12]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/bigdata47090.2019.9006095","relation":{},"subject":[],"published":{"date-parts":[[2019,12]]}}}