{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,17]],"date-time":"2026-03-17T19:44:58Z","timestamp":1773776698888,"version":"3.50.1"},"publisher-location":"Berlin, Heidelberg","reference-count":12,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783642327896","type":"print"},{"value":"9783642327902","type":"electronic"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-32790-2_23","type":"book-chapter","created":{"date-parts":[[2012,8,6]],"date-time":"2012-08-06T07:45:48Z","timestamp":1344239148000},"page":"191-198","source":"Crossref","is-referenced-by-count":9,"title":["Application of Lemmatization and Summarization Methods in Topic Identification Module for Large Scale Language Modeling Data Filtering"],"prefix":"10.1007","author":[{"given":"Lucie","family":"Skorkovsk\u00e1","sequence":"first","affiliation":[]}],"member":"297","reference":[{"key":"23_CR1","first-page":"658","volume-title":"Proceedings of the 11th International Conference on Information Integration and Web-based Applications & Services, iiWAS 2009","author":"A.D. Asy\u2019arie","year":"2009","unstructured":"Asy\u2019arie, A.D., Pribadi, A.W.: Automatic news articles classification in indonesian language by using naive bayes classifier method. In: Proceedings of the 11th International Conference on Information Integration and Web-based Applications & Services, iiWAS 2009, pp. 658\u2013662. ACM, New York (2009)"},{"issue":"2","key":"23_CR2","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1145\/321510.321519","volume":"16","author":"H.P. Edmundson","year":"1969","unstructured":"Edmundson, H.P.: New methods in automatic extracting. J. ACM\u00a016(2), 264\u2013285 (1969)","journal-title":"J. ACM"},{"issue":"1","key":"23_CR3","first-page":"457","volume":"22","author":"G. Erkan","year":"2004","unstructured":"Erkan, G., Radev, D.R.: Lexrank: graph-based lexical centrality as salience in text summarization. J. Artif. Int. Res.\u00a022(1), 457\u2013479 (2004)","journal-title":"J. Artif. Int. Res."},{"key":"23_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"759","DOI":"10.1007\/978-3-540-74999-8_95","volume-title":"Evaluation of Multilingual and Multi-modal Information Retrieval","author":"P. Ircing","year":"2007","unstructured":"Ircing, P., M\u00fcller, L.: Benefit of Proper Language Processing for Czech Speech Retrieval in the CL-SR Task at CLEF 2006. In: Peters, C., Clough, P., Gey, F.C., Karlgren, J., Magnini, B., Oard, D.W., de Rijke, M., Stempfhuber, M. (eds.) CLEF 2006. LNCS, vol.\u00a04730, pp. 759\u2013765. Springer, Heidelberg (2007)"},{"key":"23_CR5","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"132","DOI":"10.1007\/11551874_17","volume-title":"Text, Speech and Dialogue","author":"J. Kanis","year":"2005","unstructured":"Kanis, J., M\u00fcller, L.: Automatic Lemmatizer Construction with Focus on OOV Words Lemmatization. In: Matou\u0161ek, V., Mautner, P., Pavelka, T. (eds.) TSD 2005. LNCS (LNAI), vol.\u00a03658, pp. 132\u2013139. Springer, Heidelberg (2005)"},{"key":"23_CR6","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1007\/978-3-642-15760-8_13","volume-title":"Text, Speech and Dialogue","author":"J. Kanis","year":"2010","unstructured":"Kanis, J., Skorkovsk\u00e1, L.: Comparison of Different Lemmatization Approaches through the Means of Information Retrieval Performance. In: Sojka, P., Hor\u00e1k, A., Kope\u010dek, I., Pala, K. (eds.) TSD 2010. LNCS, vol.\u00a06231, pp. 93\u2013100. Springer, Heidelberg (2010)"},{"key":"23_CR7","doi-asserted-by":"publisher","first-page":"68","DOI":"10.1145\/215206.215333","volume-title":"Proceedings of the 18th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, SIGIR 1995","author":"J. Kupiec","year":"1995","unstructured":"Kupiec, J., Pedersen, J., Chen, F.: A trainable document summarizer. In: Proceedings of the 18th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, SIGIR 1995, pp. 68\u201373. ACM, New York (1995)"},{"issue":"2","key":"23_CR8","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1147\/rd.22.0159","volume":"2","author":"H.P. Luhn","year":"1958","unstructured":"Luhn, H.P.: The automatic creation of literature abstracts. IBM J. Res. Dev.\u00a02(2), 159\u2013165 (1958)","journal-title":"IBM J. Res. Dev."},{"key":"23_CR9","doi-asserted-by":"crossref","unstructured":"Psutka, J., Ircing, P., Psutka, J.V., Radov\u00e1, V., Byrne, W., Haji\u010d, J., M\u00edrovsk\u00fd, J., Gustman, S.: Large vocabulary ASR for spontaneous Czech in the MALACH project. In: Proceedings of Eurospeech 2003, Geneva, pp. 1821\u20131824 (2003)","DOI":"10.21437\/Eurospeech.2003-551"},{"key":"23_CR10","doi-asserted-by":"crossref","unstructured":"Psutka, J., \u0160vec, J., Psutka, J.V., Van\u011bk, J., Pra\u017e\u00e1k, A., \u0160m\u00eddl, L., Ircing, P.: System for fast lexical and phonetic spoken term detection in a czech cultural heritage archive. EURASIP J. Audio, Speech and Music Processing 2011 (2011)","DOI":"10.1186\/1687-4722-2011-10"},{"key":"23_CR11","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"64","DOI":"10.1007\/978-3-642-23538-2_9","volume-title":"Text, Speech and Dialogue","author":"L. Skorkovsk\u00e1","year":"2011","unstructured":"Skorkovsk\u00e1, L., Ircing, P., Pra\u017e\u00e1k, A., Lehe\u010dka, J.: Automatic Topic Identification for Large Scale Language Modeling Data Filtering. In: Habernal, I., Matou\u0161ek, V. (eds.) TSD 2011. LNCS, vol.\u00a06836, pp. 64\u201371. Springer, Heidelberg (2011)"},{"key":"23_CR12","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"356","DOI":"10.1007\/978-3-642-23538-2_45","volume-title":"Text, Speech and Dialogue","author":"J. \u0160vec","year":"2011","unstructured":"\u0160vec, J., Hoidekr, J., Soutner, D., Vavru\u0161ka, J.: Web Text Data Mining for Building Large Scale Language Modelling Corpus. In: Habernal, I., Matou\u0161ek, V. (eds.) TSD 2011. LNCS, vol.\u00a06836, pp. 356\u2013363. Springer, Heidelberg (2011)"}],"container-title":["Lecture Notes in Computer Science","Text, Speech and Dialogue"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-32790-2_23.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,25]],"date-time":"2023-06-25T05:24:47Z","timestamp":1687670687000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-32790-2_23"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642327896","9783642327902"],"references-count":12,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-32790-2_23","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012]]}}}