{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T13:56:57Z","timestamp":1742997417007,"version":"3.40.3"},"publisher-location":"Cham","reference-count":39,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783031208331"},{"type":"electronic","value":"9783031208348"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-20834-8_6","type":"book-chapter","created":{"date-parts":[[2022,11,17]],"date-time":"2022-11-17T20:03:58Z","timestamp":1668715438000},"page":"109-123","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Evaluation and Analysis of the NLP Model Zoo for Ukrainian Text Classification"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5454-5661","authenticated-orcid":false,"given":"Dmytro","family":"Panchenko","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3223-5130","authenticated-orcid":false,"given":"Daniil","family":"Maksymenko","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1089-3055","authenticated-orcid":false,"given":"Olena","family":"Turuta","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8867-993X","authenticated-orcid":false,"given":"Andriy","family":"Yerokhin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3895-0744","authenticated-orcid":false,"given":"Yana","family":"Daniiel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0970-8617","authenticated-orcid":false,"given":"Oleksii","family":"Turuta","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,11,18]]},"reference":[{"key":"6_CR1","unstructured":"Panchenko D., Maksymenko, D., Turuta, O., Luzan, M., Tytarenko, S., Turuta, O.: Ukrainian news corpus as text classification benchmark. In: Proceedings of the 17th International Conference on ICT in Education, Research and Industrial Applications. Integration, Harmonization and Knowledge Transfer. Volume II: Workshops, pp. 717\u2013726"},{"key":"6_CR2","unstructured":"https:\/\/www.kaggle.com\/c\/ukrainian-news-classification\/"},{"key":"6_CR3","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Proceedings of the 31st International Conference on Neural Information Processing Systems (NIPS 2017), pp. 6000\u20136010. Curran Associates Inc., Red Hook (2017)"},{"key":"6_CR4","unstructured":"Devlin, J., Chang, M.-W., Lee, K., Toutanova, K.: BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding (2019)"},{"key":"6_CR5","doi-asserted-by":"crossref","unstructured":"Lewis, M., et al.: BART: Denoising Sequence-to-Sequence Pre-training for Natural Language Generation, Translation, and Comprehension. CoRR, abs\/1910.13461 (2019)","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"6_CR6","doi-asserted-by":"crossref","unstructured":"Liu, Y., et al.: Multilingual denoising pre-training for neural machine translation (2020)","DOI":"10.1162\/tacl_a_00343"},{"key":"6_CR7","unstructured":"Tang, Y., et al.: Multilingual Translation with Extensible Multilingual Pretraining and Finetuning (2020)"},{"key":"6_CR8","unstructured":"Radchenko, V.: We Trained the Ukrainian Language Model. https:\/\/youscan.io\/blog\/ukrainian-language-model\/"},{"key":"6_CR9","doi-asserted-by":"publisher","unstructured":"Schweter, S.: Ukrainian ELECTRA model. https:\/\/github.com\/stefan-it\/ukrainian-electra. https:\/\/doi.org\/10.5281\/zenodo.4267880","DOI":"10.5281\/zenodo.4267880"},{"key":"6_CR10","unstructured":"Babenko, D.: Determining sentiment and important properties of Ukrainian-language user reviews: Master Thesis: manuscript rights\/Dmytro Babenko; Supervisor Vsevolod Dyomkin; Ukrainian Catholic University, Department of Computer Sciences. Lviv [s.n.] (2020). 35 p.: ill"},{"key":"6_CR11","unstructured":"Babenko, D., Dyomkin, V.: Determining Sentiment and Important Properties of Ukrainian Language User Reviews (2019). http:\/\/ceur-ws.org\/Vol-2566\/MS-AMLV-2019-paper39-p106.pdf"},{"key":"6_CR12","unstructured":"NER Annotation Corpus. https:\/\/lang.org.ua\/en\/corpora\/"},{"key":"6_CR13","unstructured":"https:\/\/mova.institute\/"},{"key":"6_CR14","doi-asserted-by":"crossref","unstructured":"Conneau, A., et al.: Unsupervised Cross-Lingual Representation Learning at Scale. CoRR, abs\/1911.02116 (2019)","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"6_CR15","unstructured":"https:\/\/commoncrawl.github.io\/cc-crawl-statistics\/plots\/languages"},{"key":"6_CR16","doi-asserted-by":"crossref","unstructured":"Conneau, A., et al.: XNLI: evaluating cross-lingual sentence representations. In: Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing. Association for Computational Linguistics (2018)","DOI":"10.18653\/v1\/D18-1269"},{"key":"6_CR17","doi-asserted-by":"crossref","unstructured":"Artetxe, M., Ruder, S., Yogatama, D.: On the cross-lingual transferability of monolingual representations. arXiv preprint arXiv:1910.11856 (2019)","DOI":"10.18653\/v1\/2020.acl-main.421"},{"key":"6_CR18","unstructured":"https:\/\/www.bbc.com\/ukrainian"},{"key":"6_CR19","unstructured":"https:\/\/nv.ua\/"},{"key":"6_CR20","unstructured":"https:\/\/www.pravda.com.ua\/"},{"key":"6_CR21","unstructured":"https:\/\/www.epravda.com.ua\/"},{"key":"6_CR22","unstructured":"https:\/\/www.eurointegration.com.ua\/"},{"key":"6_CR23","unstructured":"https:\/\/life.pravda.com.ua\/"},{"key":"6_CR24","unstructured":"https:\/\/www.unian.ua\/"},{"key":"6_CR25","doi-asserted-by":"crossref","unstructured":"Shen, Y., et al.: Improving Medical Short Text Classification with Semantic Expansion Using Word-Cluster Embedding. ArXiv abs\/1812.01885 (2018). n. pag","DOI":"10.1007\/978-981-13-1056-0_41"},{"key":"6_CR26","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1007\/s13042-010-0001-0","volume":"1","author":"Y Zhang","year":"2010","unstructured":"Zhang, Y., Jin, R., Zhou, Z.-H.: Understanding bag-of-words model: a statistical framework. Int. J. Mach. Learn. Cybern. 1, 43\u201352 (2010). https:\/\/doi.org\/10.1007\/s13042-010-0001-0","journal-title":"Int. J. Mach. Learn. Cybern."},{"key":"6_CR27","doi-asserted-by":"publisher","unstructured":"Kaufman, S., Rosset, S., Perlich, C.: Leakage in data mining: formulation, detection, and avoidance. In: Proceedings of the ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, vol. 6, pp. 556\u2013563 (2011). https:\/\/doi.org\/10.1145\/2020408.2020496","DOI":"10.1145\/2020408.2020496"},{"key":"6_CR28","unstructured":"Norvig, P.: How to Write a Spelling Corrector. http:\/\/norvig.com\/spell-correct.html"},{"key":"6_CR29","unstructured":"Shuyo, N.: Language Detection Library for Java (2010)"},{"key":"6_CR30","doi-asserted-by":"publisher","unstructured":"TF-IDF. In: Sammut C., Webb G.I. (eds.) Encyclopedia of Machine Learning, pp. 986\u2013987. Springer, Boston (2011). https:\/\/doi.org\/10.1007\/978-0-387-30164-8_832","DOI":"10.1007\/978-0-387-30164-8_832"},{"key":"6_CR31","doi-asserted-by":"crossref","unstructured":"Arkhipov, A.: Tuning multilingual transformers for language-specific named entity recognition. In: Proceedings of the 7th Workshop on Balto-Slavic Natural Language Processing, pp. 89\u201393. Association for Computational Linguistics (2019)","DOI":"10.18653\/v1\/W19-3712"},{"key":"6_CR32","unstructured":"Wang, C.: Baselines and bigrams: simple, good sentiment and topic classification. In: Proceedings of the 50th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), pp. 90\u201394. Association for Computational Linguistics (2012)"},{"key":"6_CR33","unstructured":"Liu, Y., et al.: RoBERTa: A Robustly Optimized BERT Pretraining Approach. CoRR, abs\/1907.11692 (2019)"},{"key":"6_CR34","unstructured":"Ortiz Su\u00e1rez, P., Sagot, B., Romary, L.: Asynchronous pipeline for processing huge corpora on medium to low resource infrastructures. In: 7th Workshop on the Challenges in the Management of Large Corpora (CMLC-7). Leibniz-Institut f\u00fcr Deutsche Sprache (2019)"},{"key":"6_CR35","unstructured":"Clark, K., Luong, M.-T., Le, Q.V., Manning, C.D.: ELECTRA: Pre-training Text Encoders as Discriminators Rather Than Generators. In: International Conference on Learning Representations (2020)"},{"key":"6_CR36","unstructured":"Lundberg, S.M., Lee, S.-I.: A unified approach to interpreting model predictions. In: Guyon, I., et al. (eds.): Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"key":"6_CR37","doi-asserted-by":"publisher","unstructured":"Yerokhin, A., Turuta, O., Babii, A., Nechyporenko, A., Mahdalina, I.: Usage of phase space diagram to finding significant features of rhinomanometric signals. In: XIth International Scientific and Technical Conference Computer Sciences and Information Technologies (CSIT), pp. 70\u201372 (2016). https:\/\/doi.org\/10.1109\/STC-CSIT.2016.7589871","DOI":"10.1109\/STC-CSIT.2016.7589871"},{"key":"6_CR38","doi-asserted-by":"crossref","unstructured":"Erdem, E., et al.: Neural natural language generation: a survey on multilinguality, multimodality, controllability and learning. J. Artif. Int. Res. 73 (2022)","DOI":"10.1613\/jair.1.12918"},{"key":"6_CR39","doi-asserted-by":"publisher","unstructured":"Dashenkov, D., Smelyakov, K., Turuta, O.: Methods of multilanguage question answering. In: 2021 IEEE 8th International Conference on Problems of Infocommunications, Science and Technology (PIC S &T), pp. 251\u2013255 (2011). https:\/\/doi.org\/10.1109\/PICST54195.2021.9772145","DOI":"10.1109\/PICST54195.2021.9772145"}],"container-title":["Communications in Computer and Information Science","Information and Communication Technologies in Education, Research, and Industrial Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-20834-8_6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,17]],"date-time":"2022-11-17T20:07:13Z","timestamp":1668715633000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-20834-8_6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031208331","9783031208348"],"references-count":39,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-20834-8_6","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"18 November 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICTERI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Information and Communication Technologies in Education, Research, and Industrial Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Kherson","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Ukraine","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 September 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2 October 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icteri2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/icteri.org\/icteri-2021\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"24","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"12","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"50% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1.6","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}