{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T10:39:18Z","timestamp":1725791958677},"publisher-location":"Cham","reference-count":21,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319058122"},{"type":"electronic","value":"9783319058139"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-05813-9_22","type":"book-chapter","created":{"date-parts":[[2014,4,16]],"date-time":"2014-04-16T11:57:50Z","timestamp":1397649470000},"page":"328-342","source":"Crossref","is-referenced-by-count":7,"title":["Large-Scale Similarity Join with Edit-Distance Constraints"],"prefix":"10.1007","author":[{"given":"Chen","family":"Lin","sequence":"first","affiliation":[]},{"given":"Haiyang","family":"Yu","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Weng","sequence":"additional","affiliation":[]},{"given":"Xianmang","family":"He","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"22_CR1","doi-asserted-by":"crossref","unstructured":"Chaudhuri, S., Ganti, V., Kaushik, R.: A primitive operator for similarity joins in data cleaning. In: Proc of the 22nd International Conference on Data Engineering, ICDE, Washington (2006)","DOI":"10.1109\/ICDE.2006.9"},{"key":"22_CR2","unstructured":"Gravano, L., Ipeirotis, P.G., Jagadish, H.V., Koudas, N., et al.: Approximate string joins in a database (almost) for free. In: Proc of the 27th International Conference on Very Large Data Bases, VLDB, pp. 491\u2013500. Rome (2001)"},{"key":"22_CR3","unstructured":"Arasu, A., Ganti, V., Kaushik, R.: Efficient exact set-similarity joins. In: Proc of the 32nd International Conference on Very Large Data Bases, VLDB, pp. 918\u2013929. Seoul (2006)"},{"key":"22_CR4","doi-asserted-by":"publisher","first-page":"131","DOI":"10.1145\/1242572.1242591","volume-title":"Proc of the 16th International Conference on World Wide Web","author":"R.J. Bayardo","year":"2007","unstructured":"Bayardo, R.J., Ma, Y., Srikant, R.: Scaling up all pairs similarity search. In: Proc of the 16th International Conference on World Wide Web, pp. 131\u2013140. ACM, Alberta (2007)"},{"key":"22_CR5","first-page":"131","volume-title":"Proc of the 17th International Conference on World Wide Web","author":"C. Xiao","year":"2011","unstructured":"Xiao, C., Wang, W., Lin, X., et al.: Efficient Similarity Joins for Near Duplicate Detection. In: Proc of the 17th International Conference on World Wide Web, pp. 131\u2013140. ACM, New York (2011)"},{"issue":"1","key":"22_CR6","doi-asserted-by":"crossref","first-page":"933","DOI":"10.14778\/1453856.1453957","volume":"1","author":"C. Xiao","year":"2008","unstructured":"Xiao, C., Wang, W., Lin, X.: Ed-join: An efficient algorithm for similarity joins with edit distance constraints. Proc of the VLDB Endowment\u00a01(1), 933\u2013944 (2008)","journal-title":"Proc of the VLDB Endowment"},{"issue":"3","key":"22_CR7","doi-asserted-by":"publisher","first-page":"253","DOI":"10.14778\/2078331.2078340","volume":"5","author":"G. Li","year":"2011","unstructured":"Li, G., Deng, D., Wang, J., et al.: Pass-join: A partition-based method for similarity joins. Proceedings of the VLDB Endowment\u00a05(3), 253\u2013264 (2011)","journal-title":"Proceedings of the VLDB Endowment"},{"key":"22_CR8","doi-asserted-by":"crossref","unstructured":"Jiang, Y., Deng, D., Wang, J., et al.: Efficient parallel partition-based algorithms for similarity search and join with edit distance constraints. In: Proceedings of the Joint EDBT\/ICDT 2013 Workshops, pp. 341\u2013348. ACM (2013)","DOI":"10.1145\/2457317.2457382"},{"issue":"1","key":"22_CR9","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J. Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: Simplified data processing on large clusters. Communications of the ACM\u00a051(1), 107\u2013113 (2008)","journal-title":"Communications of the ACM"},{"issue":"2","key":"22_CR10","doi-asserted-by":"publisher","first-page":"1265","DOI":"10.14778\/1454159.1454166","volume":"1","author":"R. Chaiken","year":"2008","unstructured":"Chaiken, R., Jenkins, B., Larson, P.\u00c5., et al.: SCOPE: Easy and efficient parallel processing of massive data sets. Proceedings of the VLDB Endowment\u00a01(2), 1265\u20131276 (2008)","journal-title":"Proceedings of the VLDB Endowment"},{"key":"22_CR11","doi-asserted-by":"crossref","unstructured":"Schneider, D.A., De Witt, D.J.: A performance evaluation of four parallel join algorithms in a shared-nothing multiprocessor environment. ACM (1989)","DOI":"10.1145\/67544.66937"},{"key":"22_CR12","doi-asserted-by":"crossref","unstructured":"Blanas, S., Patel, J.M., Ercegovac, V., et al.: A comparison of join algorithms for log processing in mapreduce. In: Proceedings of the 2010 ACM SIGMOD International Conference on Management of Data, pp. 975\u2013986. ACM (2010)","DOI":"10.1145\/1807167.1807273"},{"key":"22_CR13","unstructured":"Olston, C., Reed, B., Silberstein, A., et al.: Automatic Optimization of Parallel Dataflow Programs. In: USENIX Annual Technical Conference, pp. 267\u2013273 (2008)"},{"key":"22_CR14","doi-asserted-by":"crossref","unstructured":"Yang, H., Dasdan, A., Hsiao, R.L., et al.: Map-reduce-merge: Simplified relational data processing on large clusters. In: Proceedings of the 2007 ACM SIGMOD International Conference on Management of Data, pp. 1029\u20131040. ACM (2007)","DOI":"10.1145\/1247480.1247602"},{"key":"22_CR15","doi-asserted-by":"crossref","unstructured":"Vernica, R., Carey, M.J., Li, C.: Efficient parallel set-similarity joins using MapReduce. In: Proceedings of the ACM SIGMOD International Conference on Management of Data, pp. 495\u2013506 (2010)","DOI":"10.1145\/1807167.1807222"},{"key":"22_CR16","unstructured":"Gionis, A., Indyk, P., Motwan, R.: Similarity Search in High Dimensions via Hashing. VLDB 1999, 518\u2013529 (1999)"},{"key":"22_CR17","unstructured":"Graupmann, J., Schenkel, R., Weikum, G.: The spheresearch engine for unified ranked retrieval of heterogeneous XML and web documents. In: Proceedings of the 31st International Conference on Very Large Data Bases, VLDB Endowment, pp. 529\u2013540 (2005)"},{"issue":"6010","key":"22_CR18","doi-asserted-by":"publisher","first-page":"1549","DOI":"10.1126\/science.1195203","volume":"330","author":"L. Baxter","year":"2010","unstructured":"Baxter, L., Tripathy, S., Ishaque, N., et al.: Signatures of adaptation to obligate biotrophy in the Hyaloperonospora arabidopsidis genome. Science\u00a0330(6010), 1549\u20131551 (2010)","journal-title":"Science"},{"key":"22_CR19","doi-asserted-by":"crossref","unstructured":"Chakrabarti, K., et al.: An efficient filter for approximate membership checking. In: Proceedings of ACM SIGMOD International Conference on Management of Data 2008, pp. 805\u2013818 (2008)","DOI":"10.1145\/1376616.1376697"},{"key":"22_CR20","doi-asserted-by":"crossref","unstructured":"Xiao, C., et al.: Top-k set similarity joins. In: Proceedings of the 25th International Conference on Data Engineering, pp. 916\u2013927 (2009)","DOI":"10.1109\/ICDE.2009.111"},{"key":"22_CR21","doi-asserted-by":"crossref","unstructured":"Arasu, A., Chaudhuri, S., Kaushik, R.: Transformation-based framework for record matching. In: Proceedings of the 24th International Conference on Data Engineering, pp. 40\u201349 (2008)","DOI":"10.1109\/ICDE.2008.4497412"}],"container-title":["Lecture Notes in Computer Science","Database Systems for Advanced Applications"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-05813-9_22","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,26]],"date-time":"2019-05-26T16:29:34Z","timestamp":1558888174000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-05813-9_22"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319058122","9783319058139"],"references-count":21,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-05813-9_22","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2014]]}}}