{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T00:21:07Z","timestamp":1740097267944,"version":"3.37.3"},"publisher-location":"Cham","reference-count":14,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319279732"},{"type":"electronic","value":"9783319279749"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015]]},"DOI":"10.1007\/978-3-319-27974-9_11","type":"book-chapter","created":{"date-parts":[[2015,12,9]],"date-time":"2015-12-09T05:55:33Z","timestamp":1449640533000},"page":"107-119","source":"Crossref","is-referenced-by-count":1,"title":["An Approach to Document Fingerprinting"],"prefix":"10.1007","author":[{"given":"Yunhyong","family":"Kim","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Seamus","family":"Ross","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2015,12,18]]},"reference":[{"key":"11_CR1","unstructured":"Baldwin, T., Lui, M.: Language identification: the long and the short of the matter. In: Human Language Technologies: The 2010 Annual Conference of the North American Chapter of the Association for Computational Linguistics, HLT 2010, pp. 229\u2013237. Association for Computational Linguistics, Stroudsburg (2010). http:\/\/dl.acm.org\/citation.cfm?id=1857999.1858026"},{"issue":"4","key":"11_CR2","doi-asserted-by":"publisher","first-page":"917","DOI":"10.1162\/COLI_a_00153","volume":"39","author":"A Barr\u00f3n-Cede\u00f1o","year":"2013","unstructured":"Barr\u00f3n-Cede\u00f1o, A., Vila, M., Mart\u00ed, M., Rosso, P.: Plagiarism meets paraphrasing: Insights for the next generation in automatic plagiarism detection. Comput. Linguist. 39(4), 917\u2013947 (2013). http:\/\/dx.doi.org\/10.1162\/COLI_a_00153","journal-title":"Comput. Linguist."},{"key":"11_CR3","unstructured":"Cohen, H., Crammer, K.: Learning multiple tasks in parallel with a shared annotator. In: Ghahramani, Z., Welling, M., Cortes, C., Lawrence, N.D., Weinberger, K.Q. (eds.) NIPS, pp. 1170\u20131178 (2014). http:\/\/dblp.uni-trier.de\/db\/conf\/nips\/nips2014.html#CohenC14"},{"key":"11_CR4","unstructured":"Donais, J.A., Frost, R.A., Peelar, S.M., Roddy, R.A.: A system for the automated author attribution of text and instant messages. In: Proceedings of the 2013 IEEE\/ACM International Conference on Advances in Social Networks Analysis and Mining, ASONAM 2013, pp. 1484\u20131485. ACM, New York (2013). http:\/\/doi.acm.org\/10.1145\/2492517.2500308"},{"key":"11_CR5","unstructured":"Fang, A.C., Cao, J.: Enhanced genre classification through linguistically fine-grained pos tags. In: Otoguro, R., Ishikawa, K., Umemoto, H., Yoshimoto, K., Harada, Y. (eds.) PACLIC, pp. 85\u201394. Institute for Digital Enhancement of Cognitive Development, Waseda University (2010)"},{"issue":"23","key":"11_CR6","doi-asserted-by":"publisher","first-page":"146","DOI":"10.1080\/00437956.1954.11659520","volume":"10","author":"Z Harris","year":"1954","unstructured":"Harris, Z.: Distributional structure. Word 10(23), 146\u2013162 (1954)","journal-title":"Word"},{"key":"11_CR7","unstructured":"Harvey, R.: Appraisal and selection. In: Curation Reference Manual. Digital Curation Center (2007). http:\/\/www.dcc.ac.uk\/resources\/curation-reference-manual\/completed-chapters\/appraisal-and-selection"},{"issue":"6","key":"11_CR8","doi-asserted-by":"publisher","first-page":"779","DOI":"10.1016\/S0306-4573(00)00015-7","volume":"36","author":"KS Jones","year":"2000","unstructured":"Jones, K.S., Walker, S., Robertson, S.E.: A probabilistic model of information retrieval: development and comparative experiments - part 1. Inf. Process. Manage. 36(6), 779\u2013808 (2000). http:\/\/dblp.uni-trier.de\/db\/journals\/ipm\/ipm36.html#JonesWR00","journal-title":"Inf. Process. Manage."},{"key":"11_CR9","unstructured":"Kim, Y., Ross, S.: Closing the loop: assisting archival appraisal and information retrieval in one sweep. In: Proceedings of the 76th ASIS&T Annual Meeting: Beyond the Cloud: Rethinking Information Boundaries, ASIST 2013, pp. 16:1\u201316:10. American Society for Information Science, Silver Springs (2013). http:\/\/dl.acm.org\/citation.cfm?id=2655780.2655796"},{"key":"11_CR10","doi-asserted-by":"crossref","first-page":"27","DOI":"10.1162\/tacl_a_00163","volume":"2","author":"M Lui","year":"2014","unstructured":"Lui, M., Lau, J.H., Baldwin, T.: Automatic detection and language identification of multilingual documents. TACL 2, 27\u201340 (2014)","journal-title":"TACL"},{"key":"11_CR11","unstructured":"Manku, G.S., Jain, A., Das Sarma, A.: Detecting near-duplicates for web crawling. In: Proceedings of the 16th International Conference on World Wide Web, WWW 2007, pp. 141\u2013150. ACM, New York (2007). http:\/\/doi.acm.org\/10.1145\/1242572.1242592"},{"key":"11_CR12","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1007\/978-3-642-19400-9_14","volume-title":"Computational Linguistics and Intelligent Text Processing","author":"CD Manning","year":"2011","unstructured":"Manning, C.D.: Part-of-speech tagging from 97% to 100%: is it time for some linguistics? In: Gelbukh, A.F. (ed.) CICLing 2011, Part I. LNCS, vol. 6608, pp. 171\u2013189. Springer, Heidelberg (2011). http:\/\/nlp.stanford.edu\/~manning\/papers\/CICLing2011-manning-tagging.pdf"},{"key":"11_CR13","unstructured":"Oliver, G., Ross, S., Guercio, M., Pala, C.: Report on automated re-appraisal: Managing archives in digital libraries (2008). https:\/\/www.academia.edu\/10963951\/Report_on_Automated_re-Appraisal_Managing_Archives_in_Digital_Libraries_Deliverable_6.10.1_"},{"key":"11_CR14","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1007\/s10502-009-9090-5","volume":"8","author":"G Oliver","year":"2008","unstructured":"Oliver, G., Kim, Y., Ross, S.: Documentary genre and digital recordkeeping: red herring or a way forward? Archival Science 8, 295\u2013305 (2008)","journal-title":"Archival Science"}],"container-title":["Lecture Notes in Computer Science","Digital Libraries: Providing Quality Information"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-27974-9_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,9,12]],"date-time":"2020-09-12T10:17:55Z","timestamp":1599905875000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-27974-9_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015]]},"ISBN":["9783319279732","9783319279749"],"references-count":14,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-27974-9_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2015]]}}}