{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T11:31:55Z","timestamp":1725535915980},"publisher-location":"Berlin, Heidelberg","reference-count":12,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642030697"},{"type":"electronic","value":"9783642030703"}],"license":[{"start":{"date-parts":[[2009,1,1]],"date-time":"2009-01-01T00:00:00Z","timestamp":1230768000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009]]},"DOI":"10.1007\/978-3-642-03070-3_30","type":"book-chapter","created":{"date-parts":[[2009,7,15]],"date-time":"2009-07-15T11:55:54Z","timestamp":1247658954000},"page":"398-412","source":"Crossref","is-referenced-by-count":2,"title":["Efficient Clustering of Web-Derived Data Sets"],"prefix":"10.1007","author":[{"given":"Lu\u00eds","family":"Sarmento","sequence":"first","affiliation":[]},{"given":"Alexander","family":"Kehlenbeck","sequence":"additional","affiliation":[]},{"given":"Eug\u00e9nio","family":"Oliveira","sequence":"additional","affiliation":[]},{"given":"Lyle","family":"Ungar","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"30_CR1","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"420","DOI":"10.1007\/3-540-44503-X_27","volume-title":"Database Theory - ICDT 2001","author":"C. Aggarwal","year":"2000","unstructured":"Aggarwal, C., Hinneburg, A., Keim, D.: On the Surprising Behavior of Distance Metrics in High Dimensional Spaces. In: Van den Bussche, J., Vianu, V. (eds.) ICDT 2001. LNCS, vol.\u00a01973, pp. 420\u2013434. Springer, Heidelberg (2000)"},{"issue":"3","key":"30_CR2","doi-asserted-by":"publisher","first-page":"515","DOI":"10.1109\/TKDE.2003.1198387","volume":"15","author":"S. Guha","year":"2003","unstructured":"Guha, S., Meyerson, A., Mishra, N., Motwani, R., O\u2019Callaghan, L.: Clustering Data Streams: Theory and Practice. IEEE Transactions on Knowledge and Data Engineering\u00a015(3), 515\u2013528 (2003)","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"key":"30_CR3","doi-asserted-by":"publisher","first-page":"740","DOI":"10.1017\/S0021900200105273","volume":"14","author":"E. Samuel-Cahn","year":"1977","unstructured":"Samuel-Cahn, E., Zamir, S.: Algebraic characterization of infinite markov chains where movement to the right is limited to one step. Journal of Applied Probability\u00a014, 740\u2013747 (1977)","journal-title":"Journal of Applied Probability"},{"key":"30_CR4","unstructured":"Cormen, T.H., Leiserson, C.E., Rivest, R.L.: Introduction to Algorithms. MIT Press and McGraw-Hill Book Company (1990)"},{"issue":"6","key":"30_CR5","doi-asserted-by":"publisher","first-page":"372","DOI":"10.1145\/362248.362272","volume":"16","author":"J. Hopcroft","year":"1973","unstructured":"Hopcroft, J., Tarjan, R.: Algorithm 447: efficient algorithms for graph manipulation. Commun. ACM\u00a016(6), 372\u2013378 (1973)","journal-title":"Commun. ACM"},{"key":"30_CR6","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1145\/780542.780548","volume-title":"STOC 2003: Proceedings of the thirty-fifth annual ACM symposium on Theory of computing","author":"M. Charikar","year":"2003","unstructured":"Charikar, M., O\u2019Callaghan, L., Panigrahy, R.: Better streaming algorithms for clustering problems. In: STOC 2003: Proceedings of the thirty-fifth annual ACM symposium on Theory of computing, pp. 30\u201339. ACM, New York (2003)"},{"key":"30_CR7","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1145\/347090.347123","volume-title":"KDD 2000: Proceedings of the sixth ACM SIGKDD international conference on Knowledge discovery and data mining","author":"A. McCallum","year":"2000","unstructured":"McCallum, A., Nigam, K., Ungar, L.H.: Efficient clustering of high-dimensional data sets with application to reference matching. In: KDD 2000: Proceedings of the sixth ACM SIGKDD international conference on Knowledge discovery and data mining, pp. 169\u2013178. ACM, New York (2000)"},{"issue":"2","key":"30_CR8","doi-asserted-by":"publisher","first-page":"94","DOI":"10.1145\/276305.276314","volume":"27","author":"R. Agrawal","year":"1998","unstructured":"Agrawal, R., Gehrke, J., Gunopulos, D., Raghavan, P.: Automatic subspace clustering of high dimensional data for data mining applications. SIGMOD Rec.\u00a027(2), 94\u2013105 (1998)","journal-title":"SIGMOD Rec."},{"key":"30_CR9","doi-asserted-by":"crossref","first-page":"271","DOI":"10.1145\/1242572.1242610","volume-title":"WWW 2007: Proceedings of the 16th international conference on World Wide Web","author":"A.S. Das","year":"2007","unstructured":"Das, A.S., Datar, M., Garg, A., Rajaram, S.: Google news personalization: scalable online collaborative filtering. In: WWW 2007: Proceedings of the 16th international conference on World Wide Web, pp. 271\u2013280. ACM, New York (2007)"},{"key":"30_CR10","doi-asserted-by":"crossref","unstructured":"Indyk, P., Motwani, R.: Approximate nearest neighbors: towards removing the curse of dimensionality. In: Proc. of 30th STOC, pp. 604\u2013613 (1998)","DOI":"10.1145\/276698.276876"},{"key":"30_CR11","doi-asserted-by":"crossref","unstructured":"Broder, A.Z.: On the resemblance and containment of documents. In: SEQS: Sequences 1991 (1998)","DOI":"10.1109\/SEQUEN.1997.666900"},{"key":"30_CR12","unstructured":"Dean, J., Ghemawat, S.: Mapreduce: Simplified data processing on large clusters. In: OSDI 2004: Sixth Symposium on Operating System Design and Implementation (2004)"}],"container-title":["Lecture Notes in Computer Science","Machine Learning and Data Mining in Pattern Recognition"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-03070-3_30","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,10,8]],"date-time":"2021-10-08T14:02:59Z","timestamp":1633701779000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-03070-3_30"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009]]},"ISBN":["9783642030697","9783642030703"],"references-count":12,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-03070-3_30","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2009]]}}}