{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T14:01:13Z","timestamp":1742997673860,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":14,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642009570"},{"type":"electronic","value":"9783642009587"}],"license":[{"start":{"date-parts":[[2009,1,1]],"date-time":"2009-01-01T00:00:00Z","timestamp":1230768000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009]]},"DOI":"10.1007\/978-3-642-00958-7_61","type":"book-chapter","created":{"date-parts":[[2009,4,17]],"date-time":"2009-04-17T08:11:17Z","timestamp":1239955877000},"page":"645-653","source":"Crossref","is-referenced-by-count":2,"title":["Evaluation of Text Clustering Algorithms with N-Gram-Based Document Fingerprints"],"prefix":"10.1007","author":[{"given":"Javier","family":"Parapar","sequence":"first","affiliation":[]},{"given":"\u00c1lvaro","family":"Barreiro","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"61_CR1","volume-title":"Information Retrieval","author":"C.V. Rijsbergen","year":"1979","unstructured":"Rijsbergen, C.V.: Information Retrieval. Butterworths, London (1979)"},{"key":"61_CR2","doi-asserted-by":"crossref","first-page":"186","DOI":"10.1145\/1008992.1009026","volume-title":"Proceedings of the 27th annual international ACM SIGIR conference on Research and Development in Information Retrieval","author":"X. Liu","year":"2004","unstructured":"Liu, X., Croft, W.B.: Cluster-based retrieval using language models. In: Proceedings of the 27th annual international ACM SIGIR conference on Research and Development in Information Retrieval, pp. 186\u2013193. ACM Press, New York (2004)"},{"key":"61_CR3","unstructured":"McQueen, J.: Some methods for classification and analysis of multivariate observations. In: Proceedings of the Fifth Berkeley Symposium on Mathematical Statistics and Probability, vol.\u00a01, pp. 281\u2013297 (1967)"},{"issue":"3","key":"61_CR4","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1145\/331499.331504","volume":"31","author":"A.K. Jain","year":"1999","unstructured":"Jain, A.K., Murty, M.N., Flynn, P.J.: Data clustering: a review. ACM Computing Surveys\u00a031(3), 264\u2013323 (1999)","journal-title":"ACM Computing Surveys"},{"key":"61_CR5","first-page":"318","volume-title":"Proceedings of the 15th annual international ACM SIGIR conference on Research and Development in Information Retrieval","author":"D.R. Cutting","year":"1992","unstructured":"Cutting, D.R., Karger, D.R., Pedersen, J.O., Tukey, J.W.: Scatter\/gather: a cluster-based approach to browsing large document collections. In: Proceedings of the 15th annual international ACM SIGIR conference on Research and Development in Information Retrieval, pp. 318\u2013329. ACM Press, New York (1992)"},{"key":"61_CR6","first-page":"1157","volume-title":"Selected papers from the sixth international conference on World Wide Web","author":"A.Z. Broder","year":"1997","unstructured":"Broder, A.Z., Glassman, S.C., Manasse, M.S., Zweig, G.: Syntactic clustering of the web. In: Selected papers from the sixth international conference on World Wide Web, Essex, UK, pp. 1157\u20131166. Elsevier Science Publishers Ltd., Amsterdam (1997)"},{"key":"61_CR7","doi-asserted-by":"crossref","first-page":"880","DOI":"10.1145\/1183614.1183777","volume-title":"Proceedings of the 15th ACM international conference on Information and Knowledge Management","author":"D. Puppin","year":"2006","unstructured":"Puppin, D., Silvestri, F.: The query-vector document model. In: Proceedings of the 15th ACM international conference on Information and Knowledge Management, pp. 880\u2013881. ACM Press, New York (2006)"},{"key":"61_CR8","doi-asserted-by":"publisher","first-page":"76","DOI":"10.1145\/872757.872770","volume-title":"Proceedings of the 2003 ACM SIGMOD international conference on Management of Data","author":"S. Schleimer","year":"2003","unstructured":"Schleimer, S., Wilkerson, D.S., Aiken, A.: Winnowing: local algorithms for document fingerprinting. In: Proceedings of the 2003 ACM SIGMOD international conference on Management of Data, pp. 76\u201385. ACM Press, New York (2003)"},{"key":"61_CR9","doi-asserted-by":"crossref","first-page":"1353","DOI":"10.1145\/1458082.1458275","volume-title":"Proceeding of the 17th ACM conference on Information and Knowledge Management","author":"J. Parapar","year":"2008","unstructured":"Parapar, J., Barreiro, \u00c1.: Winnowing-based text clustering. In: Proceeding of the 17th ACM conference on Information and Knowledge Management, pp. 1353\u20131354. ACM, New York (2008)"},{"key":"61_CR10","doi-asserted-by":"crossref","unstructured":"Rivest, R.L.: The MD5 message digest algorithm. RFC 1321 (April 1992)","DOI":"10.17487\/rfc1321"},{"issue":"2","key":"61_CR11","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1147\/rd.312.0249","volume":"31","author":"R.M. Karp","year":"1987","unstructured":"Karp, R.M., Rabin, M.O.: Efficient randomized pattern-matching algorithms. IBM Journal of Research and Development\u00a031(2), 249\u2013260 (1987)","journal-title":"IBM Journal of Research and Development"},{"key":"61_CR12","doi-asserted-by":"publisher","first-page":"312","DOI":"10.1109\/ITCC.2002.1000408","volume-title":"Proceedings of the International Conference on Information Technology: Coding and Computing","author":"F. Giannotti","year":"2002","unstructured":"Giannotti, F., Gozzi, C., Manco, G.: Characterizing web user accesses: A transactional approach to web log clustering. In: Proceedings of the International Conference on Information Technology: Coding and Computing, Washington, DC, USA, pp. 312\u2013317. IEEE Computer Society, Los Alamitos (2002)"},{"key":"61_CR13","doi-asserted-by":"crossref","first-page":"199","DOI":"10.1145\/564376.564412","volume-title":"Proceedings of the 25th annual international ACM SIGIR conference on Research and Development in Information Retrieval","author":"P. Pantel","year":"2002","unstructured":"Pantel, P., Lin, D.: Document clustering with committees. In: Proceedings of the 25th annual international ACM SIGIR conference on Research and Development in Information Retrieval, pp. 199\u2013206. ACM Press, New York (2002)"},{"key":"61_CR14","unstructured":"Rosell, M., Kann, V., Litton, J.E.: Comparing comparisons: Document clustering evaluation using two manual classifications. In: Proceedings of the International Conference on Natural Language Processing (2004)"}],"container-title":["Lecture Notes in Computer Science","Advances in Information Retrieval"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-00958-7_61","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,10,4]],"date-time":"2021-10-04T06:26:20Z","timestamp":1633328780000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-00958-7_61"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009]]},"ISBN":["9783642009570","9783642009587"],"references-count":14,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-00958-7_61","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2009]]}}}