{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,11]],"date-time":"2025-09-11T21:17:06Z","timestamp":1757625426937,"version":"3.44.0"},"publisher-location":"Cham","reference-count":33,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783032025500"},{"type":"electronic","value":"9783032025517"}],"license":[{"start":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:00:00Z","timestamp":1755820800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:00:00Z","timestamp":1755820800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-02551-7_24","type":"book-chapter","created":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T05:27:20Z","timestamp":1755754040000},"page":"275-286","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Morphological Segmentation with\u00a0Neural Networks: Performance Effects of\u00a0Architecture, Data Size, and\u00a0Cross-Lingual Transfer in\u00a0Seven Languages"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-2832-3211","authenticated-orcid":false,"given":"Michal","family":"Olbrich","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8149-4054","authenticated-orcid":false,"given":"Zden\u011bk","family":"\u017dabokrtsk\u00fd","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,8,22]]},"reference":[{"key":"24_CR1","volume-title":"The CELEX Lexical Database (release 2)","author":"RH Baayen","year":"1995","unstructured":"Baayen, R.H., Piepenbrock, R., Gulikers, L.: The CELEX Lexical Database (release 2). University of Pennsylvania, Distributed by the linguistic data consortium (1995)"},{"doi-asserted-by":"crossref","unstructured":"Batsuren, K., et al.: The SIGMORPHON 2022 shared task on morpheme segmentation (2022). arXiv preprint arXiv:2206.07615","key":"24_CR2","DOI":"10.18653\/v1\/2022.sigmorphon-1.11"},{"doi-asserted-by":"crossref","unstructured":"Batsuren, K., Bella, G., Giunchiglia, F.: MorphyNet: a large multilingual database of derivational and inflectional morphology. In: Proceedings of the 18th Sigmorphon Workshop on Computational Research in Phonetics, Phonology, and Morphology, pp. 39\u201348 (2021)","key":"24_CR3","DOI":"10.18653\/v1\/2021.sigmorphon-1.5"},{"unstructured":"Batsuren, K., et\u00a0al.: UniMorph 4.0: universal morphology (2022). arXiv preprint arXiv:2205.03608","key":"24_CR4"},{"doi-asserted-by":"crossref","unstructured":"Bodn\u00e1r, J., \u017dabokrtsk\u00fd, Z., \u0160ev\u010d\u00edkov\u00e1, M.: Semi-supervised induction of morpheme boundaries in Czech using a word-formation network. In: International Conference on Text, Speech, and Dialogue, pp. 189\u2013196. Springer (2020)","key":"24_CR5","DOI":"10.1007\/978-3-030-58323-1_20"},{"unstructured":"Bolshakova, E.I., Sapin, A.S.: An Experimental Study of Neural Morpheme Segmentation Models for Russian Word Forms. In: CMCL, pp. 79\u201389 (2020)","key":"24_CR6"},{"key":"24_CR7","doi-asserted-by":"publisher","DOI":"10.7717\/peerj-cs.2465","volume":"10","author":"D Dr\u017e\u00edk","year":"2024","unstructured":"Dr\u017e\u00edk, D., Forgac, F.: Slovak morphological tokenizer using the byte-pair encoding algorithm. PeerJ Comput. Sci. 10, e2465 (2024)","journal-title":"PeerJ Comput. Sci."},{"issue":"2","key":"24_CR8","first-page":"23","volume":"12","author":"P Gage","year":"1994","unstructured":"Gage, P.: A new algorithm for data compression. C Users J. 12(2), 23\u201338 (1994)","journal-title":"C Users J."},{"doi-asserted-by":"crossref","unstructured":"Garipov, T., Morozov, D., Glazkova, A.: Generalization ability of CNN-based Morpheme Segmentation. In: 2023 Ivannikov Ispras Open Conference (ISPRAS), pp. 58\u201362. IEEE (2023)","key":"24_CR9","DOI":"10.1109\/ISPRAS60948.2023.10508171"},{"issue":"2","key":"24_CR10","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1007\/s11525-020-09355-5","volume":"30","author":"M Haspelmath","year":"2020","unstructured":"Haspelmath, M.: The morph as a minimal linguistic form. Morphology 30(2), 117\u2013134 (2020). https:\/\/doi.org\/10.1007\/s11525-020-09355-5","journal-title":"Morphology"},{"doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","key":"24_CR11","DOI":"10.1109\/CVPR.2016.90"},{"unstructured":"Hled\u00edkov\u00e1, H.: Verbs annotated for morphemic structure in Czech, English, German, Spanish (2024). http:\/\/hdl.handle.net\/11234\/1-5824. LINDAT\/CLARIAH-CZ digital library at the Institute of Formal and Applied Linguistics (\u00daFAL), Faculty of Mathematics and Physics, Charles University","key":"24_CR12"},{"issue":"8","key":"24_CR13","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9(8), 1735\u20131780 (1997)","journal-title":"Neural Comput."},{"issue":"1","key":"24_CR14","doi-asserted-by":"publisher","first-page":"1","DOI":"10.3366\/word.2023.0218","volume":"16","author":"R Huyghe","year":"2023","unstructured":"Huyghe, R., Varvara, R.: Affix rivalry: theoretical and methodological challenges. Word Struct. 16(1), 1\u201323 (2023)","journal-title":"Word Struct."},{"doi-asserted-by":"crossref","unstructured":"Kocmi, T., Bojar, O.: Trivial transfer learning for low-resource neural machine translation (2018). arXiv preprint arXiv:1809.00357","key":"24_CR15","DOI":"10.18653\/v1\/W18-6325"},{"unstructured":"Koehn, P.: Europarl: A parallel corpus for statistical machine translation. In: Proceedings of machine translation summit x: papers, pp. 79\u201386 (2005)","key":"24_CR16"},{"doi-asserted-by":"crossref","unstructured":"Kudo, T.: Subword regularization: Improving neural network translation models with multiple subword candidates (2018). arXiv preprint arXiv:1804.10959","key":"24_CR17","DOI":"10.18653\/v1\/P18-1007"},{"unstructured":"Kurimo, M., Virpioja, S., Turunen, V., Lagus, K.: Morpho challenge 2005-2010: Evaluations and results. In: Proceedings of the 11th Meeting of the ACL Special Interest Group on Computational Morphology and Phonology, pp. 87\u201395 (2010)","key":"24_CR18"},{"doi-asserted-by":"crossref","unstructured":"Libovick\u00fd, J., Helcl, J.: Lexically grounded subword segmentation (2024). arXiv preprint arXiv:2406.13560","key":"24_CR19","DOI":"10.18653\/v1\/2024.emnlp-main.421"},{"key":"24_CR20","doi-asserted-by":"publisher","first-page":"1008","DOI":"10.3758\/s13428-019-01297-z","volume":"52","author":"H Mailhot","year":"2020","unstructured":"Mailhot, H., Wilson, M.A., Macoir, J., Deacon, S.H., S\u00e1nchez-Guti\u00e9rrez, C.: MorphoLex-FR: a derivational morphological database for 38,840 French words. Behav. Res. Methods 52, 1008\u20131025 (2020)","journal-title":"Behav. Res. Methods"},{"issue":"4","key":"24_CR21","doi-asserted-by":"publisher","first-page":"71","DOI":"10.17323\/jle.2024.22237","volume":"10","author":"D Morozov","year":"2024","unstructured":"Morozov, D., Garipov, T., Lyashevskaya, O., Savchuk, S., Iomdin, B., Glazkova, A.: Automatic morpheme segmentation for russian: can an algorithm re-place experts? J. Lang. Educ. 10(4), 71\u201384 (2024)","journal-title":"J. Lang. Educ."},{"unstructured":"Olo\u0161tiak, M., Gen\u010di, J., Re\u0161ovsk\u00e1, S.: Retrogr\u00e1dny morfematick\u00fd slovn\u00edk sloven\u010diny. Filozofick\u00e1 fakulta Pre\u0161ovskej univerzity v Pre\u0161ove (2015)","key":"24_CR22"},{"unstructured":"Pelegrinov\u00e1, K., El\u0161\u00edk, V., \u010cech, R., Ma\u010dutek, J.: MorfoCzech 1.1 (2021). http:\/\/hdl.handle.net\/11234\/1-5202. LINDAT\/CLARIAH-CZ digital library at the Institute of Formal and Applied Linguistics (\u00daFAL), Faculty of Mathematics and Physics, Charles University","key":"24_CR23"},{"issue":"2","key":"24_CR24","first-page":"405","volume":"72","author":"K Pelegrinov\u00e1","year":"2021","unstructured":"Pelegrinov\u00e1, K., Ma\u010dutek, J., \u010cech, R.: The Menzerath-Altmann law as the relation between lengths of words and morphemes in Czech. Jazykovedny Casopis 72(2), 405\u2013414 (2021)","journal-title":"Jazykovedny Casopis"},{"doi-asserted-by":"crossref","unstructured":"Peters, B., Martins, A.F.: Beyond characters: Subword-level morpheme segmentation. In: Proceedings of the 19th SIGMORPHON Workshop on Computational Research in Phonetics, Phonology, and Morphology, pp. 131\u2013138 (2022)","key":"24_CR25","DOI":"10.18653\/v1\/2022.sigmorphon-1.14"},{"unstructured":"Pranji\u0107, M., Robnik-\u0160ikonja, M., Pollak, S.: Llmsegm: surface-level morphological segmentation using large language model. In: Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024), pp. 10665\u201310674 (2024)","key":"24_CR26"},{"doi-asserted-by":"crossref","unstructured":"Sennrich, R., Haddow, B., Birch, A.: Neural machine translation of rare words with subword units (2015). arXiv preprint arXiv:1508.07909","key":"24_CR27","DOI":"10.18653\/v1\/P16-1162"},{"unstructured":"Slav\u00ed\u010dkov\u00e1, E.: Retrogr\u00e1dn\u00ed morfematick\u00fd slovn\u00edk \u010de\u0161tiny. Academia (1975)","key":"24_CR28"},{"unstructured":"Svoboda, E., \u0160ev\u010d\u00edkov\u00e1, M.: Compounds in universal dependencies: a survey in five european languages. In: Proceedings of the 6th Workshop on Research in Computational Linguistic Typology and Multilingual NLP, pp. 88\u201399 (2024)","key":"24_CR29"},{"issue":"1","key":"24_CR30","doi-asserted-by":"publisher","first-page":"72","DOI":"10.3366\/word.2016.0087","volume":"9","author":"L Talamo","year":"2016","unstructured":"Talamo, L., Celata, C., Bertinetto, P.M.: DerIvaTario: Aa annotated lexicon of Italian derivatives. Word Struct. 9(1), 72\u2013102 (2016)","journal-title":"Word Struct."},{"unstructured":"Virpioja, S., Smit, P., Gr\u00f6nroos, S.A., Kurimo, M.: Morfessor 2.0: Python implementation and extensions for Morfessor Baseline (2013)","key":"24_CR31"},{"unstructured":"von\u00a0der Wense, K., Cotterell, R., Sch\u00fctze, H.: Neural morphological analysis: encoding-decoding canonical segments. In: Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing, pp. 961\u2013967 (2016)","key":"24_CR32"},{"unstructured":"\u017dabokrtsk\u00fd, Z., Bafna, N., Bodn\u00e1r, J., Kyj\u00e1nek, L., Svoboda, E., \u0160ev\u010d\u00edkov\u00e1, M., Vidra, J.: Towards universal segmentations: UniSegments 1.0. In: Proceedings of the Thirteenth Language Resources and Evaluation Conference, pp. 1137\u20131149 (2022)","key":"24_CR33"}],"container-title":["Lecture Notes in Computer Science","Text, Speech, and Dialogue"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-02551-7_24","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T18:04:43Z","timestamp":1757441083000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-02551-7_24"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,22]]},"ISBN":["9783032025500","9783032025517"],"references-count":33,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-02551-7_24","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025,8,22]]},"assertion":[{"value":"22 August 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"TSD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Text, Speech, and Dialogue","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Erlangen","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25 August 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 August 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"tsd2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/www.kiv.zcu.cz\/tsd2025\/index.php","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}