{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,10]],"date-time":"2025-09-10T22:36:48Z","timestamp":1757543808061,"version":"3.37.3"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"2-3","license":[{"start":{"date-parts":[[2017,3,21]],"date-time":"2017-03-21T00:00:00Z","timestamp":1490054400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"name":"CNRS"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Digit Libr"],"published-print":{"date-parts":[[2018,9]]},"DOI":"10.1007\/s00799-017-0211-0","type":"journal-article","created":{"date-parts":[[2017,3,21]],"date-time":"2017-03-21T09:12:14Z","timestamp":1490087534000},"page":"113-126","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Reuse and plagiarism in Speech and Natural Language Processing publications"],"prefix":"10.1007","volume":"19","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7488-293X","authenticated-orcid":false,"given":"Joseph","family":"Mariani","sequence":"first","affiliation":[]},{"given":"Gil","family":"Francopoulo","sequence":"additional","affiliation":[]},{"given":"Patrick","family":"Paroubek","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,3,21]]},"reference":[{"key":"211_CR1","unstructured":"Barron-Cedeno, A., Potthast, M., Rosso, P., Stein, B., Eiselt, A.: Corpus and evaluation measures for automatic plagiarism detection. In: Proceedings of LREC 2010, pp. 771\u2013774. Valletta (2010)"},{"issue":"4","key":"211_CR2","doi-asserted-by":"publisher","first-page":"917","DOI":"10.1162\/COLI_a_00153","volume":"39","author":"A Barron-Cedeno","year":"2013","unstructured":"Barron-Cedeno, A., Vila, M., Marti, M.A., Rosso, P.: Plagiarism meets paraphrasing insights for the next generation in automatic plagiarism detection. Comput. Linguist. 39(4), 917\u2013947 (2013)","journal-title":"Comput. Linguist."},{"key":"211_CR3","doi-asserted-by":"crossref","unstructured":"Bensalem, I., Rosso, P., Chikhi, S.,: Intrinsic plagiarism detection using n-gram classes. In: Proceedings of the Conference on Empirical Methods in Natural Language Processing 2014, pp. 1459\u20131464. Doha (2014)","DOI":"10.3115\/v1\/D14-1153"},{"key":"211_CR4","unstructured":"Berne Convention for the Protection of Literary and Artistic Works (as amended on Sept. 28, 1979). http:\/\/www.wipo.int\/wipolex\/en\/treaties\/text.jsp?file_id=283693"},{"key":"211_CR5","unstructured":"Bird, S., Dale, R., Dorr, B.J., Gibson, B., Joseph, M.T., Kan, M.-Y., Dongwon, L., Powley, B., Radev, D.R., Tan Y.F.: The ACL anthology reference corpus: a reference dataset for bibliographic research in Computational linguistics. In: Proceedings of LREC 2008, pp. 1755\u20131759. Marrakesh (2008)"},{"key":"211_CR6","unstructured":"Calzolari, N., Del Gratta, R., Francopoulo, G., Mariani, J., Rubino, F., Russo, I., Soria, C.: The LRE map. Harmonising community descriptions of resources. In: Proceedings of LREC 2012, pp. 1084\u20131089. Istanbul (2012)"},{"key":"211_CR7","unstructured":"Ceska, Z., Fox, C.: The influence of text pre-processing on plagiarism detection. In: Proceedings of the Recent Advances in Natural Language Processing Conference 2009, pp. 55\u201359. Borovets (2009)"},{"key":"211_CR8","unstructured":"Chong, M., Specia, L.: Lexical generalisation for word-level matching in plagiarism detection. In: Proceedings of the Recent Advances in Natural Language Processing Conference 2011, pp. 704\u2013709. Hissar (2011)"},{"issue":"1","key":"211_CR9","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1073\/pnas.1415135111","volume":"112","author":"DT Citron","year":"2014","unstructured":"Citron, D.T., Ginsparg, P.: Patterns of text reuse in a scientific corpus. Proc. Natl. Acad. Sci. 112(1), 25\u201330 (2014). doi: 10.1073\/pnas.1415135111","journal-title":"Proc. Natl. Acad. Sci."},{"key":"211_CR10","unstructured":"Clough, P., Gaizauskas, R., Piao, S.S.L., Wilks, Y.: Measuring text reuse. In: Proceedings of ACL\u20192002, pp. 152\u2013159. Philadelphia (2002)"},{"key":"211_CR11","unstructured":"Clough, P., Gaizauskas, R., Piao, S.S.L.: Building and annotating a corpus for the study of journalistic text reuse. In: Proceedings of LREC 2002, pp. 1678\u20131691. Las Palmas (2002)"},{"issue":"1","key":"211_CR12","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1007\/s10579-009-9112-1","volume":"45","author":"P Clough","year":"2011","unstructured":"Clough, P., Stevenson, M.: Developing a corpus of plagiarised short answers. Lang. Resour. Eval. 45(1), 5\u201324 (2011)","journal-title":"Lang. Resour. Eval."},{"key":"211_CR13","unstructured":"Councill, I.G., Giles, C.L., Kan, M.-Y.: ParsCit: an open-source CRF reference string parsing package. In: Proceedings of LREC 2008, pp. 661\u2013667. Marrakesh (2008)"},{"key":"211_CR14","unstructured":"Francopoulo, G.: TagParser: well on the way to ISO-TC37 conformance. In: Proceedings of ICGL (International Conference on Global Interoperability for Language Resources) 2008. Hong Kong (2008)"},{"key":"211_CR15","doi-asserted-by":"crossref","unstructured":"Francopoulo, G., Marcoul, F., Causse, D., Piparo, G.: Global atlas: proper nouns, from Wikipedia to LMF. In: Francopoulo, G. (ed) LMF Lexical Markup Framework. ISTE Wiley (2013)","DOI":"10.1002\/9781118712696.ch16"},{"key":"211_CR16","doi-asserted-by":"crossref","unstructured":"Francopoulo, G., Mariani, J., Paroubek, P.: NLP4NLP: the cobbler\u2019s children won\u2019t go unshod. D-Lib Mag. 21(11\/12). www.dlib.org\/dlib\/november15\/francopoulo\/11francopoulo.html (2015)","DOI":"10.1045\/november2015-francopoulo"},{"key":"211_CR17","unstructured":"Francopoulo, G., Mariani, J., Paroubek, P.: A study of reuse and plagiarism in LREC papers. In: Proceedings of LREC 2016, pp. 72\u201383. Portoro\u017e (2016)"},{"key":"211_CR18","doi-asserted-by":"crossref","unstructured":"Frey, M., Kern, R.: Efficient table annotation for digital articles. D-Lib Mag. 21(11\/12). www.dlib.org\/dlib\/november15\/frey\/11frey.html (2015)","DOI":"10.1045\/november2015-frey"},{"key":"211_CR19","unstructured":"Gaizauskas, R., Foster, J., Wilks, Y., Arundel, J., Clough, P., Piao, S.S.L.: The METER corpus: a corpus for analysing journalistic text reuse. In: Proceedings of the Corpus Linguistics Conference 2001, pp. 214\u2013223. Lancaster (2001)"},{"key":"211_CR20","unstructured":"Grove, J.: Sinister buttocks? Roget would blush at the crafty cheek. Middlesex lecturer gets to the bottom of meaningless phrases found while marking essays. Times Higher Education, 7 August (2014). https:\/\/www.timeshighereducation.com\/news\/sinister-buttocks-roget-would-blush-at-the-crafty-cheek\/2015027.article"},{"key":"211_CR21","unstructured":"Guo, Y., Che, W., Liu, T., Li, S.: A graph-based method for entity linking. In: Proceedings of the International Joint Conference on NLP 2011, pp. 1010\u20131018. Chiang Mai (2011)"},{"key":"211_CR22","unstructured":"Gupta, P., Rosso, P.: Text reuse with ACL: (upward) trends. In: Proceedings ACL\u20192012 Special Workshop on Rediscovering 50\u00a0Years of Discoveries, pp. 76\u201382. Jeju (2012)"},{"issue":"3","key":"211_CR23","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1002\/asi.10170","volume":"54","author":"TC Hoad","year":"2003","unstructured":"Hoad, T.C., Zobel, J.: Methods for identifying versioned and plagiarised documents. J. Am. Soc. Inf. Sci. Technol. 54(3), 203\u2013215 (2003)","journal-title":"J. Am. Soc. Inf. Sci. Technol."},{"key":"211_CR24","unstructured":"HaCohen-Kerner, Y., Tayeb, A., Ben-Dror, N.: Detection of simple plagiarism in computer science papers. In: Proceedings of the 23rd International Conference on Computational Linguistics (COLING), pp. 421\u2013429. Beijing (2010)"},{"key":"211_CR25","unstructured":"Kasprzak, J., Brandejs, M.: Improving the reliability of the plagiarism detection system lab. In: Proceedings of the Uncovering Plagiarism, Authorship and Social Software Misuse (PAN) at CLEF\u20192010. Padua (2010)"},{"key":"211_CR26","unstructured":"Lyon, C., Malcolm, J., Dickerson, B.: Detecting short passages of similar text in large document collections. In: Proceedings of the Empirical Methods in Natural Language Processing Conference 2001, pp. 118\u2013125. Pittsburgh (2001)"},{"key":"211_CR27","doi-asserted-by":"crossref","unstructured":"Mariani, J., Paroubek, P., Francopoulo, G., Delaborde, M.: Rediscovering 25\u00a0years of discoveries in spoken language processing: a preliminary ISCA archive analysis. In: Proceedings of Interspeech 2013, pp. 4632\u20134669. Lyon (2013)","DOI":"10.21437\/Interspeech.2013-745"},{"key":"211_CR28","doi-asserted-by":"crossref","first-page":"231","DOI":"10.1162\/tacl_a_00179","volume":"2","author":"A Moro","year":"2014","unstructured":"Moro, A., Raganato, A., Navigli, R.: Entity linking meets word sense disambiguation: a unified approach. Trans. Assoc. Comput. Linguist. 2, 231\u2013244 (2014)","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"211_CR29","unstructured":"Nawab R.M.A., Stevenson, M., Clough, P.: Detecting text reuse with modified and weighted n-grams. In: Proceedings of the First Joint Conference on Lexical and Computational Semantics, pp. 54\u201358. Montr\u00e9al (2012)"},{"key":"211_CR30","unstructured":"Potthast, M., Stein, B., Barron-Cedeno, A., Rosso, P.: An evaluation framework for plagiarism detection. In: Proceedings of the 23rd International Conference on Computational Linguistics (COLING), pp. 997\u20131005. Beijing (2010)"},{"issue":"4","key":"211_CR31","doi-asserted-by":"publisher","first-page":"919","DOI":"10.1007\/s10579-012-9211-2","volume":"47","author":"DR Radev","year":"2013","unstructured":"Radev, D.R., Muthukrishnan, P., Qazvinian, V., Abu-Jbara, A.: The ACL anthology network corpus. Lang. Resour. Eval. 47(4), 919\u2013944 (2013)","journal-title":"Lang. Resour. Eval."},{"issue":"8","key":"211_CR32","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1145\/179606.179731","volume":"37","author":"P Samuelson","year":"1994","unstructured":"Samuelson, P.: Self-plagiarism or fair use? Commun. ACM 37(8), 21\u201325 (1994)","journal-title":"Commun. ACM"},{"issue":"1","key":"211_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10579-011-9136-1","volume":"45","author":"E Stamatatos","year":"2011","unstructured":"Stamatatos, E., Koppel, M.: Plagiarism and authorship analysis: introduction to the special issue. Lang. Resour. Eval. 45(1), 1\u20135 (2011)","journal-title":"Lang. Resour. Eval."},{"issue":"12","key":"211_CR34","doi-asserted-by":"publisher","first-page":"2512","DOI":"10.1002\/asi.21630","volume":"62","author":"E Stamatatos","year":"2011","unstructured":"Stamatatos, E.: Plagiarism detection using stopword n-grams. J. Am. Soc. Inf. Sci. Technol. 62(12), 2512\u20132527 (2011)","journal-title":"J. Am. Soc. Inf. Sci. Technol."},{"issue":"1","key":"211_CR35","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1007\/s10579-010-9115-y","volume":"45","author":"B Stein","year":"2011","unstructured":"Stein, B., Lipka, N., Prettenhofer, P.: Intrinsic plagiarism analysis. Lang. Resour. Eval. 45(1), 63\u201382 (2011)","journal-title":"Lang. Resour. Eval."},{"key":"211_CR36","unstructured":"Vilnat, A., Paroubek, P., de la Clergerie, E.V., Francopoulo, G., Gu\u00e9not, M.-L.: PASSAGE syntactic representation: a minimal common ground for evaluation. In: Proceedings of LREC 2010, pp. 2478\u20132485. Valletta (2010)"}],"container-title":["International Journal on Digital Libraries"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00799-017-0211-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00799-017-0211-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00799-017-0211-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,22]],"date-time":"2023-08-22T18:57:40Z","timestamp":1692730660000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00799-017-0211-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,3,21]]},"references-count":36,"journal-issue":{"issue":"2-3","published-print":{"date-parts":[[2018,9]]}},"alternative-id":["211"],"URL":"https:\/\/doi.org\/10.1007\/s00799-017-0211-0","relation":{},"ISSN":["1432-5012","1432-1300"],"issn-type":[{"type":"print","value":"1432-5012"},{"type":"electronic","value":"1432-1300"}],"subject":[],"published":{"date-parts":[[2017,3,21]]},"assertion":[{"value":"5 October 2016","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 March 2017","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 March 2017","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 March 2017","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}