{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T19:13:56Z","timestamp":1772910836703,"version":"3.50.1"},"publisher-location":"Cham","reference-count":36,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031227912","type":"print"},{"value":"9783031227929","type":"electronic"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-22792-9_5","type":"book-chapter","created":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T01:22:43Z","timestamp":1672536163000},"page":"51-62","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["MACEDONIZER - The Macedonian Transformer Language Model"],"prefix":"10.1007","author":[{"given":"Jovana","family":"Dobreva","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tashko","family":"Pavlov","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kostadin","family":"Mishev","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Monika","family":"Simjanoska","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Stojancho","family":"Tudzarski","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dimitar","family":"Trajanov","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ljupcho","family":"Kocarev","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,1,1]]},"reference":[{"issue":"1","key":"5_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s12911-021-01394-0","volume":"21","author":"MA Al-Garadi","year":"2021","unstructured":"Al-Garadi, M.A., et al.: Text classification models for the automatic detection of nonmedical prescription medication use from social media. BMC Med. Inform. Decis. Mak. 21(1), 1\u201313 (2021)","journal-title":"BMC Med. Inform. Decis. Mak."},{"key":"5_CR2","unstructured":"Antoun, W., Baly, F., Hajj, H.: AraBERT: transformer-based model for Arabic language understanding. In: Proceedings of the 4th Workshop on Open-Source Arabic Corpora and Processing Tools, with a Shared Task on Offensive Language Detection, Marseille, France, pp. 9\u201315. European Language Resource Association (2020). https:\/\/aclanthology.org\/2020.osact-1.2"},{"key":"5_CR3","unstructured":"Araci, D.: FinBERT: financial sentiment analysis with pre-trained language models. CoRR abs\/1908.10063 (2019). http:\/\/arxiv.org\/abs\/1908.10063"},{"key":"5_CR4","doi-asserted-by":"crossref","unstructured":"Arkhipov, M., Trofimova, M., Kuratov, Y., Sorokin, A.: Tuning multilingual transformers for language-specific named entity recognition. In: Proceedings of the 7th Workshop on Balto-Slavic Natural Language Processing, pp. 89\u201393 (2019)","DOI":"10.18653\/v1\/W19-3712"},{"key":"5_CR5","unstructured":"Brown, T.B., et al.: Language models are few-shot learners. CoRR abs\/2005.14165 (2020). https:\/\/arxiv.org\/abs\/2005.14165"},{"key":"5_CR6","unstructured":"Carmo, D., Piau, M., Campiotti, I., Nogueira, R., de Alencar Lotufo, R.: PTT5: pretraining and validating the T5 model on Brazilian Portuguese data. CoRR abs\/2008.09144 (2020). https:\/\/arxiv.org\/abs\/2008.09144"},{"key":"5_CR7","doi-asserted-by":"publisher","unstructured":"Chung, H.W., Garrette, D., Tan, K.C., Riesa, J.: Improving multilingual models with language-clustered vocabularies. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 4536\u20134546. Association for Computational Linguistics (2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.367. https:\/\/aclanthology.org\/2020.emnlp-main.367","DOI":"10.18653\/v1\/2020.emnlp-main.367"},{"key":"5_CR8","unstructured":"Clark, K., Luong, M., Le, Q.V., Manning, C.D.: ELECTRA: pre-training text encoders as discriminators rather than generators. CoRR abs\/2003.10555 (2020). https:\/\/arxiv.org\/abs\/2003.10555"},{"key":"5_CR9","unstructured":"Conneau, A., et al.: Unsupervised cross-lingual representation learning at scale. CoRR abs\/1911.02116 (2019). http:\/\/arxiv.org\/abs\/1911.02116"},{"key":"5_CR10","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"301","DOI":"10.1007\/978-3-030-61534-5_27","volume-title":"Artificial Intelligence and Soft Computing","author":"S Dadas","year":"2020","unstructured":"Dadas, S., Pere\u0142kiewicz, M., Po\u015bwiata, R.: Pre-training polish transformer-based language models at scale. In: Rutkowski, L., Scherer, R., Korytkowski, M., Pedrycz, W., Tadeusiewicz, R., Zurada, J.M. (eds.) ICAISC 2020. LNCS (LNAI), vol. 12416, pp. 301\u2013314. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-61534-5_27"},{"key":"5_CR11","unstructured":"Devlin, J., Chang, M., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. CoRR abs\/1810.04805 (2018). http:\/\/arxiv.org\/abs\/1810.04805"},{"key":"5_CR12","unstructured":"Farahani, M., Gharachorloo, M., Farahani, M., Manthouri, M.: ParsBERT: transformer-based model for Persian language understanding. CoRR abs\/2005.12515 (2020). https:\/\/arxiv.org\/abs\/2005.12515"},{"key":"5_CR13","unstructured":"He, P., Liu, X., Gao, J., Chen, W.: DeBERTa: decoding-enhanced BERT with disentangled attention. CoRR abs\/2006.03654 (2020). https:\/\/arxiv.org\/abs\/2006.03654"},{"key":"5_CR14","unstructured":"Lample, G., Conneau, A.: Cross-lingual language model pretraining. CoRR abs\/1901.07291 (2019). http:\/\/arxiv.org\/abs\/1901.07291"},{"key":"5_CR15","unstructured":"Lan, Z., Chen, M., Goodman, S., Gimpel, K., Sharma, P., Soricut, R.: ALBERT: a lite BERT for self-supervised learning of language representations. CoRR abs\/1909.11942 (2019). http:\/\/arxiv.org\/abs\/1909.11942"},{"key":"5_CR16","unstructured":"Le, H., et al.: FlauBERT: unsupervised language model pre-training for French. CoRR abs\/1912.05372 (2019). http:\/\/arxiv.org\/abs\/1912.05372"},{"key":"5_CR17","unstructured":"Lewis, M., et al.: BART: denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension. CoRR abs\/1910.13461 (2019). http:\/\/arxiv.org\/abs\/1910.13461"},{"key":"5_CR18","doi-asserted-by":"publisher","unstructured":"Liu, Y., et al.: RoBERTa: a robustly optimized BERT pretraining approach (2019). https:\/\/doi.org\/10.48550\/ARXIV.1907.11692. https:\/\/arxiv.org\/abs\/1907.11692","DOI":"10.48550\/ARXIV.1907.11692"},{"key":"5_CR19","unstructured":"Livinska, H.V., Makarevych, O.: Feasibility of improving BERT for linguistic prediction on Ukrainian corpus. In: COLINS (2020)"},{"key":"5_CR20","unstructured":"Ljube\u0161i\u0107, N., Lauc, D.: Berti\u0107-the transformer language model for Bosnian, Croatian, Montenegrin and Serbian. In: Proceedings of the 8th Workshop on Balto-Slavic Natural Language Processing, pp. 37\u201342 (2021)"},{"key":"5_CR21","unstructured":"MacCartney, B.: Natural Language Inference. Stanford University (2009)"},{"key":"5_CR22","unstructured":"Martin, L., et al.: CamemBERT: a tasty French language model. CoRR abs\/1911.03894 (2019). http:\/\/arxiv.org\/abs\/1911.03894"},{"issue":"4","key":"5_CR23","doi-asserted-by":"publisher","first-page":"1093","DOI":"10.1016\/j.asej.2014.04.011","volume":"5","author":"W Medhat","year":"2014","unstructured":"Medhat, W., Hassan, A., Korashy, H.: Sentiment analysis algorithms and applications: a survey. Ain Shams Eng. J. 5(4), 1093\u20131113 (2014)","journal-title":"Ain Shams Eng. J."},{"key":"5_CR24","doi-asserted-by":"publisher","first-page":"131662","DOI":"10.1109\/ACCESS.2020.3009626","volume":"8","author":"K Mishev","year":"2020","unstructured":"Mishev, K., Gjorgjevikj, A., Vodenska, I., Chitkushev, L.T., Trajanov, D.: Evaluation of sentiment analysis in finance: from lexicons to transformers. IEEE Access 8, 131662\u2013131682 (2020)","journal-title":"IEEE Access"},{"issue":"1","key":"5_CR25","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1075\/li.30.1.03nad","volume":"30","author":"D Nadeau","year":"2007","unstructured":"Nadeau, D., Sekine, S.: A survey of named entity recognition and classification. Lingvisticae Investigationes 30(1), 3\u201326 (2007)","journal-title":"Lingvisticae Investigationes"},{"key":"5_CR26","unstructured":"Pikuliak, M., et al.: SlovakBERT: Slovak masked language model. CoRR abs\/2109.15254 (2021). https:\/\/arxiv.org\/abs\/2109.15254"},{"issue":"8","key":"5_CR27","first-page":"9","volume":"1","author":"A Radford","year":"2019","unstructured":"Radford, A., Wu, J., Child, R., Luan, D., Amodei, D., Sutskever, I., et al.: Language models are unsupervised multitask learners. OpenAI Blog 1(8), 9 (2019)","journal-title":"OpenAI Blog"},{"key":"5_CR28","unstructured":"Raffel, C., et al.: Exploring the limits of transfer learning with a unified text-to-text transformer. CoRR abs\/1910.10683 (2019). http:\/\/arxiv.org\/abs\/1910.10683"},{"issue":"1","key":"5_CR29","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41746-021-00455-y","volume":"4","author":"L Rasmy","year":"2021","unstructured":"Rasmy, L., Xiang, Y., Xie, Z., Tao, C., Zhi, D.: Med-BERT: pretrained contextualized embeddings on large-scale structured electronic health records for disease prediction. NPJ Digit. Med. 4(1), 1\u201313 (2021)","journal-title":"NPJ Digit. Med."},{"key":"5_CR30","unstructured":"Sanh, V., Debut, L., Chaumond, J., Wolf, T.: DistilBERT, a distilled version of BERT: smaller, faster, cheaper and lighter. CoRR abs\/1910.01108 (2019). http:\/\/arxiv.org\/abs\/1910.01108"},{"key":"5_CR31","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1007\/978-3-030-61377-8_28","volume-title":"Intelligent Systems","author":"F Souza","year":"2020","unstructured":"Souza, F., Nogueira, R., Lotufo, R.: BERTimbau: pretrained BERT models for Brazilian Portuguese. In: Cerri, R., Prati, R.C. (eds.) BRACIS 2020. LNCS (LNAI), vol. 12319, pp. 403\u2013417. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-61377-8_28"},{"key":"5_CR32","doi-asserted-by":"crossref","unstructured":"Ul\u010dar, M., Robnik-\u0160ikonja, M.: Finest BERT and crosloengual BERT: less is more in multilingual models. CoRR abs\/2006.07890 (2020). https:\/\/arxiv.org\/abs\/2006.07890","DOI":"10.1007\/978-3-030-58323-1_11"},{"key":"5_CR33","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, pp. 5998\u20136008 (2017)"},{"key":"5_CR34","doi-asserted-by":"crossref","unstructured":"de Vries, W., Nissim, M.: As good as new. How to successfully recycle English GPT-2 to make models for other languages. CoRR abs\/2012.05628 (2020). https:\/\/arxiv.org\/abs\/2012.05628","DOI":"10.18653\/v1\/2021.findings-acl.74"},{"key":"5_CR35","unstructured":"Yang, Z., Dai, Z., Yang, Y., Carbonell, J., Salakhutdinov, R.R., Le, Q.V.: XLNet: generalized autoregressive pretraining for language understanding. In: Advances in Neural Information Processing Systems, vol. 32 (2019)"},{"key":"5_CR36","doi-asserted-by":"crossref","unstructured":"Zhu, Y., et al.: Aligning books and movies: towards story-like visual explanations by watching movies and reading books. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 19\u201327 (2015)","DOI":"10.1109\/ICCV.2015.11"}],"container-title":["Communications in Computer and Information Science","ICT Innovations 2022. Reshaping the Future Towards a New Normal"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-22792-9_5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T02:05:19Z","timestamp":1672538719000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-22792-9_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031227912","9783031227929"],"references-count":36,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-22792-9_5","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"value":"1865-0929","type":"print"},{"value":"1865-0937","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"1 January 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICT Innovations","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on ICT Innovations","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Skopje","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"North Macedonia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"1 October 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ictinnovations2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.ictinnovations.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"42","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"14","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"33% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.5135","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1.2037","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2 extended abstracts are in the preface","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}