{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T21:59:47Z","timestamp":1757455187864,"version":"3.41.0"},"publisher-location":"Cham","reference-count":23,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319180311"},{"type":"electronic","value":"9783319180328"}],"license":[{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015]]},"DOI":"10.1007\/978-3-319-18032-8_44","type":"book-chapter","created":{"date-parts":[[2015,5,8]],"date-time":"2015-05-08T05:41:54Z","timestamp":1431063714000},"page":"562-573","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":15,"title":["Efficient Interactive Training Selection for Large-Scale Entity Resolution"],"prefix":"10.1007","author":[{"given":"Qing","family":"Wang","sequence":"first","affiliation":[]},{"given":"Dinusha","family":"Vatsalan","sequence":"additional","affiliation":[]},{"given":"Peter","family":"Christen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,5,9]]},"reference":[{"key":"44_CR1","doi-asserted-by":"crossref","unstructured":"Arasu, A., G\u00f6tz, M., Kaushik, R.: On active learning of record matching packages. In: ACM SIGMOD, Indianapolis, pp. 783\u2013794 (2010)","DOI":"10.1145\/1807167.1807252"},{"key":"44_CR2","doi-asserted-by":"crossref","unstructured":"Bellare, K., Iyengar, S., Parameswaran, A.G., Rastogi, V.: Active sampling for entity matching. In: ACM SIGKDD, Beijing, pp. 1131\u20131139 (2012)","DOI":"10.1145\/2339530.2339707"},{"key":"44_CR3","doi-asserted-by":"crossref","unstructured":"Bilenko, M., Mooney, R.J.: Adaptive duplicate detection using learnable string similarity measures. In: ACM SIGKDD, Washington DC, pp. 39\u201348 (2003)","DOI":"10.1145\/956750.956759"},{"key":"44_CR4","doi-asserted-by":"crossref","unstructured":"Chaudhuri, S., Ganti, V., Motwani, R.: Robust identification of fuzzy duplicates. In: IEEE ICDE, Tokyo, pp. 865\u2013876 (2005)","DOI":"10.1109\/ICDE.2005.125"},{"key":"44_CR5","doi-asserted-by":"crossref","unstructured":"Chen, Z., Kalashnikov, D.V., Mehrotra, S.: Exploiting context analysis for combining multiple entity resolution systems. In: ACM SIGMOD, Providence, pp. 207\u2013218 (2009)","DOI":"10.1145\/1559845.1559869"},{"key":"44_CR6","doi-asserted-by":"crossref","unstructured":"Christen, P.: Data Matching. Data-Centric Systems and Applications. Springer (2012)","DOI":"10.1007\/978-3-642-31164-2"},{"key":"44_CR7","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"511","DOI":"10.1007\/978-3-540-68125-0_45","volume-title":"Advances in Knowledge Discovery and Data Mining","author":"P Christen","year":"2008","unstructured":"Christen, P.: Automatic training example selection for scalable unsupervised record linkage. In: Washio, T., Suzuki, E., Ting, K.M., Inokuchi, A. (eds.) PAKDD 2008. LNCS (LNAI), vol. 5012, pp. 511\u2013518. Springer, Heidelberg (2008)"},{"key":"44_CR8","doi-asserted-by":"crossref","unstructured":"Christen, P.: Development and user experiences of an open source data cleaning, deduplication and record linkage system. SIGKDD Explorations 11(1) (2009)","DOI":"10.1145\/1656274.1656282"},{"issue":"1","key":"44_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/S0020-0255(00)00070-0","volume":"137","author":"M Cochinwala","year":"2001","unstructured":"Cochinwala, M., Kurien, V., Lalk, G., Shasha, D.: Efficient data reconciliation. Information Sciences 137(1), 1\u201315 (2001)","journal-title":"Information Sciences"},{"key":"44_CR10","doi-asserted-by":"crossref","unstructured":"Dal Bianco, G., Galante, R., Heuser, C.A., Gon\u00e7alves, M.A.: Tuning large scale deduplication with reduced effort. In: SSDBM, Baltimore, p. 18 (2013)","DOI":"10.1145\/2484838.2484873"},{"key":"44_CR11","doi-asserted-by":"crossref","unstructured":"Dasgupta, S., Hsu, D.: Hierarchical sampling for active learning. In: IEEE ICML, Helsinki, pp. 208\u2013215 (2008)","DOI":"10.1145\/1390156.1390183"},{"key":"44_CR12","doi-asserted-by":"crossref","unstructured":"Du, J., Ling, C.X.: Active learning with human-like noisy oracle. In: IEEE ICDM, Sydney, pp. 797\u2013802 (2010)","DOI":"10.1109\/ICDM.2010.114"},{"key":"44_CR13","doi-asserted-by":"crossref","unstructured":"Elfeky, M.G., Verykios, V.S., Elmagarmid, A.K.: TAILOR: a record linkage toolbox. In: IEEE ICDE, San Jose, pp. 17\u201328 (2002)","DOI":"10.1109\/ICDE.2002.994694"},{"issue":"1","key":"44_CR14","first-page":"1","volume":"19","author":"A Elmagarmid","year":"2007","unstructured":"Elmagarmid, A., Ipeirotis, P., Verykios, V.: Duplicate record detection: A survey. IEEE TKDE 19(1), 1\u201316 (2007)","journal-title":"IEEE TKDE"},{"issue":"2","key":"44_CR15","doi-asserted-by":"publisher","first-page":"180","DOI":"10.1287\/moor.10.2.180","volume":"10","author":"DS Hochbaum","year":"1985","unstructured":"Hochbaum, D.S., Shmoys, D.B.: A best possible heuristic for the k-center problem. Mathematics of Operations Research 10(2), 180\u2013184 (1985)","journal-title":"Mathematics of Operations Research"},{"key":"44_CR16","unstructured":"Huang, S.J., Jin, R., Zhou, Z.H.: Active learning by querying informative and representative examples. In: NIPS, Vancouver, pp. 892\u2013900 (2010)"},{"issue":"1\u20132","key":"44_CR17","doi-asserted-by":"publisher","first-page":"484","DOI":"10.14778\/1920841.1920904","volume":"3","author":"H K\u00f6pcke","year":"2010","unstructured":"K\u00f6pcke, H., Thor, A., Rahm, E.: Evaluation of entity resolution approaches on real-world match problems. VLDB Endowment 3(1\u20132), 484\u2013493 (2010)","journal-title":"VLDB Endowment"},{"key":"44_CR18","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa, F., Varoquaux, G., Gramfort, A., et al.: Scikit-learn: Machine learning in Python. The Journal of Machine Learning Research 12, 2825\u20132830 (2011)","journal-title":"The Journal of Machine Learning Research"},{"key":"44_CR19","doi-asserted-by":"crossref","unstructured":"Sarawagi, S., Bhamidipaty, A.: Interactive deduplication using active learning. In: ACM SIGKDD, Edmonton, pp. 269\u2013278 (2002)","DOI":"10.1145\/775047.775087"},{"key":"44_CR20","first-page":"55","volume-title":"Active learning literature survey","author":"B Settles","year":"2010","unstructured":"Settles, B.: Active learning literature survey, vol. 52, pp. 55\u201366. University of Wisconsin, Madison (2010)"},{"key":"44_CR21","doi-asserted-by":"crossref","unstructured":"Sheng, V.S., Provost, F., Ipeirotis, P.G.: Get another label? improving data quality and data mining using multiple, noisy labelers. In: ACM SIGKDD, Las Vegas, pp. 614\u2013622 (2008)","DOI":"10.1145\/1401890.1401965"},{"key":"44_CR22","doi-asserted-by":"crossref","unstructured":"Tejada, S., Knoblock, C.A., Minton, S.: Learning domain-independent string transformation weights for high accuracy object identification. In: ACM SIGKDD, Edmonton, pp. 350\u2013359 (2002)","DOI":"10.1145\/775047.775099"},{"key":"44_CR23","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1016\/j.neucom.2013.02.034","volume":"118","author":"W Wu","year":"2013","unstructured":"Wu, W., Liu, Y., Guo, M., Wang, C., Liu, X.: A probabilistic model of active learning with multiple noisy oracles. Neurocomputing 118, 253\u2013262 (2013)","journal-title":"Neurocomputing"}],"container-title":["Lecture Notes in Computer Science","Advances in Knowledge Discovery and Data Mining"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-18032-8_44","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,27]],"date-time":"2025-05-27T21:15:51Z","timestamp":1748380551000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-18032-8_44"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015]]},"ISBN":["9783319180311","9783319180328"],"references-count":23,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-18032-8_44","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2015]]},"assertion":[{"value":"9 May 2015","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}