{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T05:02:36Z","timestamp":1755838956633,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":31,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,4,20]],"date-time":"2020-04-20T00:00:00Z","timestamp":1587340800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,4,20]]},"DOI":"10.1145\/3366423.3380069","type":"proceedings-article","created":{"date-parts":[[2020,5,4]],"date-time":"2020-05-04T04:11:44Z","timestamp":1588565504000},"page":"2998-3004","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":6,"title":["LSF-Join: Locality Sensitive Filtering for Distributed All-Pairs Set Similarity Under Skew"],"prefix":"10.1145","author":[{"given":"Cyrus","family":"Rashtchian","sequence":"first","affiliation":[{"name":"UCSD"}]},{"given":"Aneesh","family":"Sharma","sequence":"additional","affiliation":[{"name":"Google"}]},{"given":"David","family":"Woodruff","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University"}]}],"member":"320","published-online":{"date-parts":[[2020,4,20]]},"reference":[{"volume-title":"Fuzzy Joins using MapReduce","author":"Afrati N","key":"e_1_3_2_1_1_1","unstructured":"Foto\u00a0N Afrati, Anish\u00a0Das Sarma, David Menestrina, Aditya Parameswaran, and Jeffrey\u00a0D Ullman. 2012. Fuzzy Joins using MapReduce. In ICDE. IEEE."},{"key":"e_1_3_2_1_2_1","unstructured":"Foto\u00a0N. Afrati Anish\u00a0Das Sarma Anand Rajaraman Pokey Rule Semih Salihoglu and Jeffrey\u00a0D. Ullman. 2014. Anchor-Points Algorithms for Hamming and Edit Distances Using MapReduce. In ICDT."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/2433396.2433422"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2010.70"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Roberto\u00a0J Bayardo Yiming Ma and Ramakrishnan Srikant. 2007. Scaling up All Pairs Similarity Search. In WWW. ACM.","DOI":"10.1145\/1242572.1242591"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"crossref","unstructured":"Paul Beame Paraschos Koutris and Dan Suciu. 2013. Communication steps for parallel query processing. In PODS. ACM 273\u2013284.","DOI":"10.1145\/2463664.2465224"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"Paul Beame Paraschos Koutris and Dan Suciu. 2014. Skew in Parallel Query Processing. In PODS. ACM.","DOI":"10.1145\/2594538.2594558"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.5555\/3039686.3039705"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.5555\/3039686.3039689"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE.2018.00120"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/3183713.3183748"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.14778\/3231751.3231760"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.4086\/toc.2012.v008a014"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/3311967"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.5555\/1873601.1873677"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.5555\/3217510"},{"key":"e_1_3_2_1_17_1","unstructured":"Jure Leskovec and Andrej Krevl. 2014. SNAP Datasets: Stanford Large Network Dataset Collection. http:\/\/snap.stanford.edu\/data."},{"volume-title":"Mining of Massive Datasets","author":"Leskovec Jure","key":"e_1_3_2_1_18_1","unstructured":"Jure Leskovec, Anand Rajaraman, and Jeffrey\u00a0David Ullman. 2014. Mining of Massive Datasets. Cambridge University Press."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.14778\/2947618.2947620"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3196959.3196985"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3206333.3206340"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.14778\/2535570.2488334"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3038912.3052633"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.14778\/2556549.2556574"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"crossref","unstructured":"Rares Vernica Michael\u00a0J Carey and Chen Li. 2010. Efficient Parallel Set-similarity Joins using MapReduce. In SIGMOD. ACM 495\u2013506.","DOI":"10.1145\/1807167.1807222"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/2505515.2505765"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2213836.2213847"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.14778\/3099622.3099624"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/2000824.2000825"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2016.2638838"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.14778\/2994509.2994534"}],"event":{"name":"WWW '20: The Web Conference 2020","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"],"location":"Taipei Taiwan","acronym":"WWW '20"},"container-title":["Proceedings of The Web Conference 2020"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3366423.3380069","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3366423.3380069","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T19:15:53Z","timestamp":1755803753000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3366423.3380069"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,4,20]]},"references-count":31,"alternative-id":["10.1145\/3366423.3380069","10.1145\/3366423"],"URL":"https:\/\/doi.org\/10.1145\/3366423.3380069","relation":{},"subject":[],"published":{"date-parts":[[2020,4,20]]},"assertion":[{"value":"2020-04-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}