{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T14:46:20Z","timestamp":1743086780249,"version":"3.40.3"},"publisher-location":"Cham","reference-count":26,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319999715"},{"type":"electronic","value":"9783319999722"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-319-99972-2_47","type":"book-chapter","created":{"date-parts":[[2018,8,28]],"date-time":"2018-08-28T06:14:23Z","timestamp":1535436863000},"page":"571-586","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Text Augmentation Techniques for Document Vector Generation from Russian News Articles"],"prefix":"10.1007","author":[{"given":"Christoffer","family":"Aminoff","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Aleksei","family":"Romanenko","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Onni","family":"Kosomaa","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jouko","family":"Vankka","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2018,8,29]]},"reference":[{"unstructured":"Van Asch, V.: Macro- and micro-averaged evaluation measures. Tech. Rep., (2013)","key":"47_CR1"},{"unstructured":"Bjerva, J., Plank, B., Bos, J.: Semantic tagging with deep residual networks. CoRR abs\/1609.07053 (2016). \nhttp:\/\/arxiv.org\/abs\/1609.07053","key":"47_CR2"},{"unstructured":"Bojanowski, P., Grave, E., Joulin, A., Mikolov, T.: Enriching word vectors with subword information. CoRR abs\/1607.04606 (2016). \nhttp:\/\/arxiv.org\/abs\/1607.04606","key":"47_CR3"},{"unstructured":"Bonatti, R., de Paula, A.G., Lamarca, V.S., Cozman, F.G.: Effect of part-of-speech and lemmatization filtering in email classification for automatic reply. In: AAAI Workshop: Knowledge Extraction from Text (2016)","key":"47_CR4"},{"unstructured":"Galke, L., Saleh, A., Scherp, A.: Word embeddings for practical information retrieval. In: Eibl, M., Gaedke, M. (eds.) INFORMATIK 2017, pp. 2155\u20132167. Gesellschaft f\u00fcr Informatik, Bonn (2017)","key":"47_CR5"},{"key":"47_CR6","series-title":"Advances in Intelligent Systems and Computing","doi-asserted-by":"publisher","first-page":"877","DOI":"10.1007\/978-3-319-00969-8_86","volume-title":"Proceedings of the 8th International Conference on Computer Recognition Systems CORES 2013","author":"M Hrala","year":"2013","unstructured":"Hrala, M., Kr\u00e1l, P.: Evaluation of the document classification approaches. In: Burduk, R., Jackowski, K., Kurzynski, M., Wozniak, M., Zolnierek, A. (eds.) CORES 2013. AISC, pp. 877\u2013885. Springer, Heidelberg (2013). \nhttps:\/\/doi.org\/10.1007\/978-3-319-00969-8_86"},{"key":"47_CR7","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1108\/eb026526","volume":"28","author":"KS Jones","year":"1972","unstructured":"Jones, K.S.: A statistical interpretation of term specificity and its application in retrieval. J. Doc. 28, 11\u201321 (1972)","journal-title":"J. Doc."},{"doi-asserted-by":"publisher","unstructured":"Korpusik, M., Huang, C., Price, M., Glass, J.: Distributional semantics for understanding spoken meal descriptions. In: 2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 6070\u20136074 (2016). \nhttps:\/\/doi.org\/10.1109\/ICASSP.2016.7472843","key":"47_CR8","DOI":"10.1109\/ICASSP.2016.7472843"},{"unstructured":"Kutuzov, A., Andreev, I.: Texts in, meaning out: neural language models in semantic similarity task for Russian. ArXiv e-prints, April 2015","key":"47_CR9"},{"issue":"4","key":"47_CR10","doi-asserted-by":"publisher","first-page":"721","DOI":"10.1109\/TPAMI.2008.110","volume":"31","author":"M Lan","year":"2009","unstructured":"Lan, M., Tan, C.L., Su, J., Lu, Y.: Supervised and traditional term weighting methods for automatic text categorization. IEEE Trans. Pattern Anal. Mach. Intell. 31(4), 721\u2013735 (2009). \nhttps:\/\/doi.org\/10.1109\/TPAMI.2008.110","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"unstructured":"Le, Q.V., Mikolov, T.: Distributed representations of sentences and documents. CoRR abs\/1405.4053 (2014). \nhttp:\/\/arxiv.org\/abs\/1405.4053","key":"47_CR11"},{"doi-asserted-by":"publisher","unstructured":"Liu, M., Yang, J.: An improvement of TFIDF weighting in text categorization. In: International Conference on Computer Technology and Science (ICCTS), vol. 47, pp. 44\u201347 (2012). \nhttps:\/\/doi.org\/10.7763\/IPCSIT.2012.V47.9","key":"47_CR12","DOI":"10.7763\/IPCSIT.2012.V47.9"},{"issue":"2","key":"47_CR13","doi-asserted-by":"publisher","first-page":"258","DOI":"10.1515\/jazcas-2017-0035","volume":"68","author":"O Lyashevskaya","year":"2017","unstructured":"Lyashevskaya, O., Bocharov, V., Sorokin, A., Shavrina, T., Granovsky, D., Alexeeva, S.: Text collections for evaluation of Russian morphological taggers. J. Linguist.\/Jazykovedn\u00fd casopis 68(2), 258\u2013267 (2017)","journal-title":"J. Linguist.\/Jazykovedn\u00fd casopis"},{"unstructured":"Mikolov, T., Chen, K., Corrado, G., Dean, J.: Efficient estimation of word representations in vector space. CoRR abs\/1301.3781 (2013). \nhttp:\/\/arxiv.org\/abs\/1301.3781","key":"47_CR14"},{"unstructured":"Mikolov, T., Sutskever, I., Chen, K., Corrado, G., Dean, J.: Distributed representations of words and phrases and their compositionality. CoRR abs\/1310.4546 (2013). \nhttp:\/\/arxiv.org\/abs\/1310.4546","key":"47_CR15"},{"issue":"3","key":"47_CR16","doi-asserted-by":"publisher","first-page":"409","DOI":"10.3233\/AIC-150698","volume":"29","author":"DQ Nguyen","year":"2016","unstructured":"Nguyen, D.Q., Nguyen, D.Q., Pham, D.D., Pham, S.B.: A robust transformation-based learning approach using ripple down rules for part-of-speech tagging. AI Commun. 29(3), 409\u2013422 (2016). \nhttps:\/\/doi.org\/10.3233\/AIC-150698","journal-title":"AI Commun."},{"key":"47_CR17","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa, F., et al.: Scikit-learn: machine learning in Python. J. Mach. Learn. Res. 12, 2825\u20132830 (2011)","journal-title":"J. Mach. Learn. Res."},{"unstructured":"Pennington, J., Socher, R., Manning, C.D.: Glove: global vectors for word representation. In: Empirical Methods in Natural Language Processing (EMNLP), pp. 1532\u20131543 (2014). \nhttp:\/\/www.aclweb.org\/anthology\/D14-1162","key":"47_CR18"},{"unstructured":"\u0158eh\u016f\u0159ek, R., Sojka, P.: Software framework for topic modelling with large corpora. In: Proceedings of the LREC 2010 Workshop on New Challenges for NLP Frameworks, pp. 45\u201350. ELRA, Valletta, May 2010. \nhttp:\/\/is.muni.cz\/publication\/884893\/en","key":"47_CR19"},{"issue":"5","key":"47_CR20","doi-asserted-by":"publisher","first-page":"513","DOI":"10.1016\/0306-4573(88)90021-0","volume":"24","author":"G Salton","year":"1988","unstructured":"Salton, G., Buckley, C.: Term-weighting approaches in automatic text retrieval. Inf. Process. Manag. 24(5), 513\u2013523 (1988). \nhttps:\/\/doi.org\/10.1016\/0306-4573(88)90021-0","journal-title":"Inf. Process. Manag."},{"unstructured":"Segalovich, I.: A fast morphological algorithm with unknown word guessing induced by a dictionary for a web search engine. In: MLMTA, pp. 273\u2013280 (2003). \nhttp:\/\/cache-mskstoredata09.cdn.yandex.net\/download.yandex.ru\/company\/iseg-las-vegas.pdf","key":"47_CR21"},{"issue":"10","key":"47_CR22","doi-asserted-by":"publisher","first-page":"1769","DOI":"10.1109\/TASLP.2018.2837384","volume":"26","author":"Lutfi Kerem Senel","year":"2018","unstructured":"Senel, L.K., Utlu, I., Yucesoy, V., Koc, A., Cukur, T.: Semantic structure and interpretability of word embeddings. IEEE\/ACM Trans. Audio Speech Lang. Process., 1 (2018). \nhttps:\/\/doi.org\/10.1109\/TASLP.2018.2837384","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"unstructured":"Shazeer, N., Doherty, R., Evans, C., Waterson, C.: Swivel: improving embeddings by noticing what\u2019s missing. CoRR abs\/1602.02215 (2016). \nhttp:\/\/arxiv.org\/abs\/1602.02215","key":"47_CR23"},{"unstructured":"Toman, M., Tesar, R., Jezek, K.: Influence of word normalization on text classification. In: Proceedings of InSciT, pp. 354\u2013358 (2006). \nhttp:\/\/www.kiv.zcu.cz\/research\/groups\/text\/publications\/inscit20060710.pdf","key":"47_CR24"},{"key":"47_CR25","series-title":"Communications in Computer and Information Science","doi-asserted-by":"publisher","first-page":"525","DOI":"10.1007\/978-3-319-46254-7_42","volume-title":"Information and Software Technologies","author":"V Venekoski","year":"2016","unstructured":"Venekoski, V., Puuska, S., Vankka, J.: Vector space representations of documents in classifying finnish social media texts. In: Dregvaite, G., Damasevicius, R. (eds.) ICIST 2016. CCIS, vol. 639, pp. 525\u2013535. Springer, Cham (2016). \nhttps:\/\/doi.org\/10.1007\/978-3-319-46254-7_42"},{"unstructured":"Wang, S., Manning, C.D.: Baselines and bigrams: simple, good sentiment and topic classification. In: Proceedings of the 50th Annual Meeting of the Association for Computational Linguistics: Short Papers, ACL 2012, vol. 2, pp. 90\u201394. Association for Computational Linguistics, Stroudsburg (2012). \nhttp:\/\/dl.acm.org\/citation.cfm?id=2390665.2390688","key":"47_CR26"}],"container-title":["Communications in Computer and Information Science","Information and Software Technologies"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-99972-2_47","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2018,10,17]],"date-time":"2018-10-17T08:12:59Z","timestamp":1539763979000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-99972-2_47"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783319999715","9783319999722"],"references-count":26,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-99972-2_47","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"ICIST","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Information and Software Technologies","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Vilnius","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Lithuania","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"6 October 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icist2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/icist.if.ktu.lt\/index.php\/ICIST","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}},{"value":"Open Journal System","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}},{"value":"124","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}},{"value":"48","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}},{"value":"39% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}},{"value":"0","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information"}}]}}