{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,10]],"date-time":"2026-03-10T15:02:24Z","timestamp":1773154944031,"version":"3.50.1"},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2018,3,6]],"date-time":"2018-03-06T00:00:00Z","timestamp":1520294400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/100010667","name":"H2020 Industrial Leadership","doi-asserted-by":"publisher","award":["653747"],"award-info":[{"award-number":["653747"]}],"id":[{"id":"10.13039\/100010667","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["The VLDB Journal"],"published-print":{"date-parts":[[2018,6]]},"DOI":"10.1007\/s00778-018-0498-5","type":"journal-article","created":{"date-parts":[[2018,3,6]],"date-time":"2018-03-06T01:07:53Z","timestamp":1520298473000},"page":"297-320","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":15,"title":["Spatio-textual user matching and clustering based on set similarity joins"],"prefix":"10.1007","volume":"27","author":[{"given":"Alexandros","family":"Belesiotis","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6118-5227","authenticated-orcid":false,"given":"Dimitrios","family":"Skoutas","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christodoulos","family":"Efstathiades","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Vassilis","family":"Kaffes","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dieter","family":"Pfoser","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2018,3,6]]},"reference":[{"key":"498_CR1","doi-asserted-by":"crossref","unstructured":"Adelfio, M.D., Nutanong, S., Samet, H.: Searching web documents as location sets. In: SIGSPATIAL, pp. 489\u2013492 (2011a)","DOI":"10.1145\/2093973.2094056"},{"key":"498_CR2","doi-asserted-by":"crossref","unstructured":"Adelfio, M.D., Nutanong, S., Samet, H.: Similarity search on a large collection of point sets. In: SIGSPATIAL, pp. 132\u2013141 (2011b)","DOI":"10.1145\/2093973.2093992"},{"key":"498_CR3","doi-asserted-by":"publisher","unstructured":"Aynaud, T., Blondel, V.D., Guillaume, J.-L., Lambiotte, R.: Multilevel local optimization of modularity. In: Bichot, C.-E., Siarry, P. (eds.) Graph Partitioning. Wiley, Hoboken, NJ (2013). https:\/\/doi.org\/10.1002\/9781118601181.ch13","DOI":"10.1002\/9781118601181.ch13"},{"key":"498_CR4","doi-asserted-by":"crossref","unstructured":"Ballesteros, J., Cary, A., Rishe, N.: SpSJoin: parallel spatial similarity joins. In: SIGSPATIAL, pp. 481\u2013484 (2011)","DOI":"10.1145\/2093973.2094054"},{"key":"498_CR5","doi-asserted-by":"crossref","unstructured":"Bayardo, R.J., Ma, Y., Srikant, R.: Scaling up all pairs similarity search. In: WWW, pp. 131\u2013140 (2007)","DOI":"10.1145\/1242572.1242591"},{"key":"498_CR6","doi-asserted-by":"publisher","DOI":"10.1002\/9781118601181","volume-title":"Graph Partitioning","author":"CE Bichot","year":"2013","unstructured":"Bichot, C.E., Siarry, P.: Graph Partitioning. Wiley, New York (2013)"},{"issue":"10","key":"498_CR7","doi-asserted-by":"publisher","first-page":"P10008","DOI":"10.1088\/1742-5468\/2008\/10\/P10008","volume":"2008","author":"VD Blondel","year":"2008","unstructured":"Blondel, V.D., Guillaume, J.L., Lambiotte, R., Lefebvre, E.: Fast unfolding of communities in large networks. J. Stat. Mech. Theory Exp. 2008(10), P10008 (2008)","journal-title":"J. Stat. Mech. Theory Exp."},{"issue":"1","key":"498_CR8","first-page":"1","volume":"6","author":"P Bouros","year":"2012","unstructured":"Bouros, P., Ge, S., Mamoulis, N.: Spatio-textual similarity joins. PVLDB 6(1), 1\u201312 (2012)","journal-title":"PVLDB"},{"key":"498_CR9","doi-asserted-by":"crossref","unstructured":"Brinkhoff, T., Kriegel, H., Seeger, B.: Efficient processing of spatial joins using r-trees. In: SIGMOD, pp. 237\u2013246 (1993)","DOI":"10.1145\/170035.170075"},{"key":"498_CR10","unstructured":"Bulu\u00e7, A., Meyerhenke, H., Safro, I., Sanders, P., Schulz, C.: Recent advances in graph partitioning. CoRR abs\/1311.3144 (2013)"},{"key":"498_CR11","doi-asserted-by":"crossref","unstructured":"Chaudhuri, S., Ganti, V., Kaushik, R.: A primitive operator for similarity joins in data cleaning. In: ICDE, p. 5 (2006)","DOI":"10.1109\/ICDE.2006.9"},{"issue":"3","key":"498_CR12","first-page":"217","volume":"6","author":"L Chen","year":"2013","unstructured":"Chen, L., Cong, G., Jensen, C.S., Wu, D.: Spatial keyword query processing: an experimental evaluation. PVLDB 6(3), 217\u2013228 (2013)","journal-title":"PVLDB"},{"key":"498_CR13","doi-asserted-by":"crossref","unstructured":"Chen, Y., Suel, T., Markowetz, A.: Efficient query processing in geographic web search engines. In: SIGMOD, pp. 277\u2013288 (2006)","DOI":"10.1145\/1142473.1142505"},{"issue":"6","key":"498_CR14","doi-asserted-by":"publisher","first-page":"889","DOI":"10.1080\/13658816.2014.999244","volume":"29","author":"Y Chen","year":"2015","unstructured":"Chen, Y., Xu, J., Xu, M.: Finding community structure in spatially constrained complex networks. Int. J. Geogr. Inf. Sci. 29(6), 889\u2013911 (2015)","journal-title":"Int. J. Geogr. Inf. Sci."},{"key":"498_CR15","doi-asserted-by":"crossref","unstructured":"Christoforaki, M., He, J., Dimopoulos, C., Markowetz, A., Suel, T.: Text versus space: efficient geo-search query processing. In: CIKM, pp. 423\u2013432 (2011)","DOI":"10.1145\/2063576.2063641"},{"issue":"6","key":"498_CR16","doi-asserted-by":"publisher","first-page":"066,111","DOI":"10.1103\/PhysRevE.70.066111","volume":"70","author":"A Clauset","year":"2004","unstructured":"Clauset, A., Newman, M.E., Moore, C.: Finding community structure in very large networks. Phys. Rev. E 70(6), 066,111 (2004)","journal-title":"Phys. Rev. E"},{"issue":"1","key":"498_CR17","first-page":"337","volume":"2","author":"G Cong","year":"2009","unstructured":"Cong, G., Jensen, C.S., Wu, D.: Efficient retrieval of the top-k most relevant spatial web objects. PVLDB 2(1), 337\u2013348 (2009)","journal-title":"PVLDB"},{"key":"498_CR18","unstructured":"Efstathiades, C., Belesiotis, A., Skoutas, D., Pfoser, D.: Similarity search on spatio-textual point sets. In: EDBT, pp. 329\u2013340 (2016)"},{"key":"498_CR19","doi-asserted-by":"crossref","unstructured":"Efstathiades, H., Antoniades, D., Pallis, G., Dikaiakos, M.D.: Identification of key locations based on online social network activity. In: ASONAM, pp. 218\u2013225 (2015)","DOI":"10.1145\/2808797.2808877"},{"key":"498_CR20","unstructured":"Eisenstein, J., O\u2019Connor, B., Smith, N.A., Xing, E.P.: A latent variable model for geographic lexical variation. In: EMNLP, pp. 1277\u20131287 (2010)"},{"issue":"19","key":"498_CR21","doi-asserted-by":"publisher","first-page":"7663","DOI":"10.1073\/pnas.1018962108","volume":"108","author":"P Expert","year":"2011","unstructured":"Expert, P., Evans, T.S., Blondel, V.D., Lambiotte, R.: Uncovering space-independent communities in spatial networks. Proc. Natl. Acad. Sci. 108(19), 7663\u20137668 (2011)","journal-title":"Proc. Natl. Acad. Sci."},{"issue":"9","key":"498_CR22","first-page":"824","volume":"5","author":"J Fan","year":"2012","unstructured":"Fan, J., Li, G., Zhou, L., Chen, S., Hu, J.: SEAL: spatio-textual similarity search. PVLDB 5(9), 824\u2013835 (2012)","journal-title":"PVLDB"},{"issue":"6","key":"498_CR23","first-page":"709","volume":"10","author":"Y Fang","year":"2017","unstructured":"Fang, Y., Cheng, R., Li, X., Luo, S., Hu, J.: Effective community search over large spatial graphs. PVLDB 10(6), 709\u2013720 (2017)","journal-title":"PVLDB"},{"key":"498_CR24","doi-asserted-by":"crossref","unstructured":"Felipe, I.D., Hristidis, V., Rishe, N.: Keyword search on spatial databases. In: ICDE, pp. 656\u2013665 (2008)","DOI":"10.1109\/ICDE.2008.4497474"},{"key":"498_CR25","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511815867","volume-title":"Statistical Models: Theory and Practice","author":"DA Freedman","year":"2009","unstructured":"Freedman, D.A.: Statistical Models: Theory and Practice. Cambridge University Press, Cambridge (2009)"},{"key":"498_CR26","unstructured":"Gionis, A., Indyk, P., Motwani, R.: Similarity search in high dimensions via hashing. In: VLDB, pp. 518\u2013529 (1999)"},{"issue":"1","key":"498_CR27","doi-asserted-by":"publisher","first-page":"7","DOI":"10.1145\/1206049.1206056","volume":"32","author":"EH Jacox","year":"2007","unstructured":"Jacox, E.H., Samet, H.: Spatial join techniques. TODS 32(1), 7 (2007)","journal-title":"TODS"},{"issue":"8","key":"498_CR28","first-page":"625","volume":"7","author":"Y Jiang","year":"2014","unstructured":"Jiang, Y., Li, G., Feng, J., Li, W.: String similarity joins: an experimental evaluation. PVLDB 7(8), 625\u2013636 (2014)","journal-title":"PVLDB"},{"key":"498_CR29","doi-asserted-by":"crossref","unstructured":"Liu, S., Li, G., Feng, J.: Star-join: spatio-textual similarity join. In: CIKM, pp. 2194\u20132198 (2012)","DOI":"10.1145\/2396761.2398600"},{"issue":"10","key":"498_CR30","first-page":"2354","volume":"26","author":"S Liu","year":"2014","unstructured":"Liu, S., Li, G., Feng, J.: A prefix-filter based method for spatio-textual similarity join. TKDE 26(10), 2354\u20132367 (2014)","journal-title":"TKDE"},{"issue":"23","key":"498_CR31","doi-asserted-by":"publisher","first-page":"8577","DOI":"10.1073\/pnas.0601602103","volume":"103","author":"ME Newman","year":"2006","unstructured":"Newman, M.E.: Modularity and community structure in networks. Proc. Natl. Acad. Sci. 103(23), 8577\u20138582 (2006)","journal-title":"Proc. Natl. Acad. Sci."},{"issue":"2","key":"498_CR32","doi-asserted-by":"publisher","first-page":"026,113","DOI":"10.1103\/PhysRevE.69.026113","volume":"69","author":"ME Newman","year":"2004","unstructured":"Newman, M.E., Girvan, M.: Finding and evaluating community structure in networks. Phys. Rev. E 69(2), 026,113 (2004)","journal-title":"Phys. Rev. E"},{"issue":"4","key":"498_CR33","doi-asserted-by":"publisher","first-page":"e16,939","DOI":"10.1371\/journal.pone.0016939","volume":"6","author":"JP Onnela","year":"2011","unstructured":"Onnela, J.P., Arbesman, S., Gonz\u00e1lez, M.C., Barab\u00e1si, A.L., Christakis, N.A.: Geographic constraints on social network groups. PLoS ONE 6(4), e16,939 (2011)","journal-title":"PLoS ONE"},{"key":"498_CR34","doi-asserted-by":"crossref","unstructured":"Papadias, D., Kalnis, P., Zhang, J., Tao, Y.: Efficient OLAP operations in spatial data warehouses. In: SSTD, pp. 443\u2013459 (2001)","DOI":"10.1007\/3-540-47724-1_23"},{"issue":"2","key":"498_CR35","doi-asserted-by":"publisher","first-page":"191","DOI":"10.7155\/jgaa.00124","volume":"10","author":"P Pons","year":"2006","unstructured":"Pons, P., Latapy, M.: Computing communities in large networks using random walks. J. Graph Algorithms Appl. 10(2), 191\u2013218 (2006)","journal-title":"J. Graph Algorithms Appl."},{"key":"498_CR36","doi-asserted-by":"crossref","unstructured":"Rao, J., Lin, J.J., Samet, H.: Partitioning strategies for spatio-textual similarity join. In: SIGSPATIAL, pp. 40\u201349 (2014)","DOI":"10.1145\/2676536.2676542"},{"key":"498_CR37","doi-asserted-by":"crossref","unstructured":"Rocha-Junior, J.B., Gkorgkas, O., Jonassen, S., N\u00f8rv\u00e5g, K.: Efficient processing of top-k spatial keyword queries. In: SSTD, pp. 205\u2013222 (2011)","DOI":"10.1007\/978-3-642-22922-0_13"},{"key":"498_CR38","doi-asserted-by":"crossref","unstructured":"Sarawagi, S., Kirpal, A.: Efficient set joins on similarity predicates. In: SIGMOD, pp. 743\u2013754 (2004)","DOI":"10.1145\/1007568.1007652"},{"issue":"1","key":"498_CR39","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1016\/j.cosrev.2007.05.001","volume":"1","author":"SE Schaeffer","year":"2007","unstructured":"Schaeffer, S.E.: Survey: graph clustering. Comput. Sci. Rev. 1(1), 27\u201364 (2007)","journal-title":"Comput. Sci. Rev."},{"key":"498_CR40","first-page":"583","volume":"3","author":"A Strehl","year":"2002","unstructured":"Strehl, A., Ghosh, J.: Cluster ensembles\u2014a knowledge reuse framework for combining multiple partitions. J. Mach. Learn. Res. JMLR 3, 583\u2013617 (2002)","journal-title":"J. Mach. Learn. Res. JMLR"},{"key":"498_CR41","unstructured":"Thomee, B., Shamma, D.A., Friedland, G., Elizalde, B., Ni, K., Poland, D., Borth, D., Li, L.J.: The new data and new challenges in multimedia research. arXiv preprint arXiv:1503.01817 (2015)"},{"key":"498_CR42","doi-asserted-by":"crossref","unstructured":"Vaid, S., Jones, C.B., Joho, H., Sanderson, M.: Spatio-textual indexing for geographical search on the web. In: SSTD, pp. 218\u2013235 (2005)","DOI":"10.1007\/11535331_13"},{"key":"498_CR43","doi-asserted-by":"crossref","unstructured":"Wakita, K., Tsurumi, T.: Finding community structure in mega-scale social networks. CoRR abs\/cs\/0702048 (2007)","DOI":"10.1145\/1242572.1242805"},{"key":"498_CR44","doi-asserted-by":"crossref","unstructured":"Wang, J., Li, G., Feng, J.: Can we beat the prefix filtering?: an adaptive framework for similarity join and search. In: SIGMOD, pp. 85\u201396 (2012)","DOI":"10.1145\/2213836.2213847"},{"issue":"6","key":"498_CR45","doi-asserted-by":"publisher","first-page":"797","DOI":"10.1007\/s00778-012-0271-0","volume":"21","author":"D Wu","year":"2012","unstructured":"Wu, D., Cong, G., Jensen, C.S.: A framework for efficient spatial web object retrieval. VLDB J. 21(6), 797\u2013822 (2012)","journal-title":"VLDB J."},{"issue":"3","key":"498_CR46","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1145\/2000824.2000825","volume":"36","author":"C Xiao","year":"2011","unstructured":"Xiao, C., Wang, W., Lin, X., Yu, J.X., Wang, G.: Efficient similarity joins for near-duplicate detection. TODS 36(3), 15 (2011)","journal-title":"TODS"},{"key":"498_CR47","doi-asserted-by":"crossref","unstructured":"Zhang, D., Tan, K., Tung, A.K.H.: Scalable top-k spatial keyword search. In: EDBT, pp. 359\u2013370 (2013)","DOI":"10.1145\/2452376.2452419"},{"key":"498_CR48","doi-asserted-by":"crossref","unstructured":"Zhang, D., Chan, C., Tan, K.: Processing spatial keyword query as a top-k aggregation query. In: SIGIR, pp. 355\u2013364 (2014a)","DOI":"10.1145\/2600428.2609562"},{"key":"498_CR49","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Ma, Y., Meng, X.: Efficient spatio-textual similarity join using mapreduce. In: WI-IAT, pp. 52\u201359 (2014b)","DOI":"10.1109\/WI-IAT.2014.16"},{"key":"498_CR50","unstructured":"Zhao, W.X., Jiang, J., He, J., Song, Y., Achananuparp, P., Lim, E., Li, X.: Topical keyphrase extraction from twitter. In: ACL, pp. 379\u2013388 (2011)"},{"key":"498_CR51","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Xie, X., Wang, C., Gong, Y., Ma, W.: Hybrid index structures for location-based web search. In: CIKM, pp. 155\u2013162 (2005)","DOI":"10.1145\/1099554.1099584"}],"container-title":["The VLDB Journal"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00778-018-0498-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-018-0498-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-018-0498-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,12]],"date-time":"2019-10-12T03:28:59Z","timestamp":1570850939000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00778-018-0498-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,3,6]]},"references-count":51,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2018,6]]}},"alternative-id":["498"],"URL":"https:\/\/doi.org\/10.1007\/s00778-018-0498-5","relation":{},"ISSN":["1066-8888","0949-877X"],"issn-type":[{"value":"1066-8888","type":"print"},{"value":"0949-877X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,3,6]]},"assertion":[{"value":"29 June 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 December 2017","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 February 2018","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 March 2018","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}