{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T09:51:27Z","timestamp":1773481887702,"version":"3.50.1"},"publisher-location":"Cham","reference-count":24,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319180311","type":"print"},{"value":"9783319180328","type":"electronic"}],"license":[{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015]]},"DOI":"10.1007\/978-3-319-18032-8_45","type":"book-chapter","created":{"date-parts":[[2015,5,8]],"date-time":"2015-05-08T05:41:54Z","timestamp":1431063714000},"page":"574-585","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":14,"title":["Unsupervised Blocking Key Selection for Real-Time Entity Resolution"],"prefix":"10.1007","author":[{"given":"Banda","family":"Ramadan","sequence":"first","affiliation":[]},{"given":"Peter","family":"Christen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,5,9]]},"reference":[{"key":"45_CR1","unstructured":"Aizawa, A., Oyama, K.: A fast linkage detection scheme for multi-source information integration. In: WIRI, Tokyo (2005)"},{"key":"45_CR2","doi-asserted-by":"crossref","unstructured":"Bilenko, M., Kamath, B., Mooney, R.J.: Adaptive blocking: learning to scale up record linkage. In: IEEE ICDM, Hong Kong (2006)","DOI":"10.1109\/ICDM.2006.13"},{"key":"45_CR3","unstructured":"Cao, Y., Chen, Z., Zhu, J., Yue, P., Lin, C.Y., Yu, Y.: Leveraging unlabeled data to scale blocking for record linkage. In: IJCAI, Barcelona (2011)"},{"key":"45_CR4","doi-asserted-by":"crossref","unstructured":"Christen, P.: Data Matching. Springer (2012)","DOI":"10.1007\/978-3-642-31164-2"},{"key":"45_CR5","doi-asserted-by":"crossref","unstructured":"Christen, P.: A survey of indexing techniques for scalable record linkage and deduplication. IEEE Transactions on Knowledge and Data Engineering 24(9) (2012)","DOI":"10.1109\/TKDE.2011.127"},{"key":"45_CR6","doi-asserted-by":"crossref","unstructured":"Das Sarma, A., Jain, A., Machanavajjhala, A., Bohannon, P.: An automatic blocking mechanism for large-scale de-duplication tasks. In: ACM CIKM, Hawaii (2012)","DOI":"10.1145\/2396761.2398403"},{"key":"45_CR7","doi-asserted-by":"crossref","unstructured":"Dong, X.L., Srivastava, D.: Big data integration. In: IEEE ICDE, Brisbane (2013)","DOI":"10.1109\/ICDE.2013.6544914"},{"key":"45_CR8","doi-asserted-by":"crossref","unstructured":"Elmagarmid, A.K., Ipeirotis, P.G., Verykios, V.S.: Duplicate record detection: A survey. IEEE Transactions on Knowledge and Data Engineering 19(1) (2007)","DOI":"10.1109\/TKDE.2007.250581"},{"key":"45_CR9","doi-asserted-by":"crossref","unstructured":"Fellegi, I., Sunter, A.: A theory for record linkage. Journal of the American Statistical Association 64(328) (1969)","DOI":"10.1080\/01621459.1969.10501049"},{"key":"45_CR10","doi-asserted-by":"crossref","unstructured":"Giang, P.H.: A machine learning approach to create blocking criteria for record linkage. Health Care Management Science (2014)","DOI":"10.1007\/s10729-014-9276-0"},{"key":"45_CR11","doi-asserted-by":"crossref","unstructured":"Hernandez, M.A., Stolfo, S.J.: The merge\/purge problem for large databases. In: ACM SIGMOD, San Jose (1995)","DOI":"10.1145\/223784.223807"},{"key":"45_CR12","doi-asserted-by":"crossref","unstructured":"Kejriwal, M., Miranker, D.P.: An unsupervised algorithm for learning blocking schemes. In: IEEE ICDM, Dallas (2013)","DOI":"10.1109\/ICDM.2013.60"},{"key":"45_CR13","doi-asserted-by":"crossref","unstructured":"Kim, H., Lee, D.: HARRA: fast iterative hashed record linkage for large-scale data collections. In: ICDT, Lausanne, Switzerland (2010)","DOI":"10.1145\/1739041.1739104"},{"key":"45_CR14","doi-asserted-by":"crossref","unstructured":"K\u00f6pcke, H., Thor, A., Rahm, E.: Evaluation of entity resolution approaches on real-world match problems. VLDB Endowment 3(1\u20132) (2010)","DOI":"10.14778\/1920841.1920904"},{"key":"45_CR15","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"crossref","first-page":"449","DOI":"10.1007\/978-3-319-06605-9_37","volume-title":"Advances in Knowledge Discovery and Data Mining","author":"H Liang","year":"2014","unstructured":"Liang, H., Wang, Y., Christen, P., Gayler, R.: Noise-tolerant approximate blocking for dynamic real-time entity resolution. In: Tseng, V.S., Ho, T.B., Zhou, Z.-H., Chen, A.L.P., Kao, H.-Y. (eds.) PAKDD 2014, Part II. LNCS (LNAI), vol. 8444, pp. 449\u2013460. Springer, Heidelberg (2014)"},{"key":"45_CR16","doi-asserted-by":"crossref","unstructured":"Ma, Y., Tran, T.: Typimatch: type-specific unsupervised learning of keys and key values for heterogeneous web data integration. In: ACM WSDM, Rome (2013)","DOI":"10.1145\/2433396.2433439"},{"key":"45_CR17","doi-asserted-by":"crossref","unstructured":"McCallum, A., Nigam, K., Ungar, L.: Efficient clustering of high-dimensional data sets with application to reference matching. In: ACM SIGKDD, Boston (2000)","DOI":"10.1145\/347090.347123"},{"key":"45_CR18","unstructured":"Michelson, M., Knoblock, C.A.: Learning blocking schemes for record linkage. In: AAAI, Boston (2006)"},{"key":"45_CR19","doi-asserted-by":"crossref","unstructured":"Ramadan, B., Christen, P.: Forest-based dynamic sorted neighborhood indexing for real-time entity resolution. In: ACM CIKM, Shanghai (2014)","DOI":"10.1145\/2661829.2661869"},{"key":"45_CR20","series-title":"Lecture Notes in Computer Science","first-page":"1","volume-title":"Databases Theory and Applications","author":"B Ramadan","year":"2014","unstructured":"Ramadan, B., Christen, P., Liang, H.: Dynamic sorted neighborhood indexing for real-time entity resolution. In: Wang, H., Sharaf, M.A. (eds.) ADC 2014. LNCS, vol. 8506, pp. 1\u201312. Springer, Heidelberg (2014)"},{"key":"45_CR21","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"crossref","first-page":"47","DOI":"10.1007\/978-3-642-40319-4_5","volume-title":"Trends and Applications in Knowledge Discovery and Data Mining","author":"B Ramadan","year":"2013","unstructured":"Ramadan, B., Christen, P., Liang, H., Gayler, R.W., Hawking, D.: Dynamic similarity-aware inverted indexing for real-time entity resolution. In: Li, J., Cao, L., Wang, C., Tan, K.C., Liu, B., Pei, J., Tseng, V.S. (eds.) PAKDD 2013 Workshops. LNCS (LNAI), vol. 7867, pp. 47\u201358. Springer, Heidelberg (2013)"},{"key":"45_CR22","doi-asserted-by":"crossref","unstructured":"Tran, K.N., Vatsalan, D., Christen, P.: Geco: an online personal data generator and corruptor. In: ACM CIKM, New York (2013)","DOI":"10.1145\/2505515.2508207"},{"key":"45_CR23","unstructured":"Vogel, T., Naumann, F.: Automatic blocking key selection for duplicate detection based on unigram combinations. In: VLDB Workshops, Istanbul (2012)"},{"key":"45_CR24","doi-asserted-by":"crossref","unstructured":"Whang, S.E., Menestrina, D., Koutrika, G., Theobald, M., Garcia-Molina, H.: Entity resolution with iterative blocking. In: ACM SIGMOD, Providence (2009)","DOI":"10.1145\/1559845.1559870"}],"container-title":["Lecture Notes in Computer Science","Advances in Knowledge Discovery and Data Mining"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-18032-8_45","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,2,15]],"date-time":"2023-02-15T07:37:53Z","timestamp":1676446673000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-18032-8_45"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015]]},"ISBN":["9783319180311","9783319180328"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-18032-8_45","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015]]},"assertion":[{"value":"9 May 2015","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}