{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,2]],"date-time":"2025-10-02T23:41:32Z","timestamp":1759448492285,"version":"build-2065373602"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"34","license":[{"start":{"date-parts":[[2025,4,15]],"date-time":"2025-04-15T00:00:00Z","timestamp":1744675200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,4,15]],"date-time":"2025-04-15T00:00:00Z","timestamp":1744675200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Social Science Fund of Shaanxi Province","award":["2024K015"],"award-info":[{"award-number":["2024K015"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-025-20836-9","type":"journal-article","created":{"date-parts":[[2025,4,15]],"date-time":"2025-04-15T06:56:37Z","timestamp":1744700197000},"page":"42507-42522","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Bilingual and monolingual features enhanced morphological segmentation for spoken language neural machine translation"],"prefix":"10.1007","volume":"84","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6903-8774","authenticated-orcid":false,"given":"Chenggang","family":"Mi","sequence":"first","affiliation":[]},{"given":"Shaoliang","family":"Xie","sequence":"additional","affiliation":[]},{"given":"Qi","family":"Liu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,4,15]]},"reference":[{"key":"20836_CR1","doi-asserted-by":"publisher","unstructured":"Ataman D, Federico M (2018) Compositional representation of morphologically-rich input for neural machine translation. In: Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers). Association for Computational Linguistics, Melbourne, Australia, pp 305\u2013311. https:\/\/doi.org\/10.18653\/v1\/P18-2049. https:\/\/aclanthology.org\/P18-2049","DOI":"10.18653\/v1\/P18-2049"},{"key":"20836_CR2","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1515\/pralin-2017-0031","volume":"108","author":"D Ataman","year":"2017","unstructured":"Ataman D, Negri M, Turchi M et al (2017) Linguistically motivated vocabulary reduction for neural machine translation from turkish to english. Prague Bull Math Ling 108:331\u2013342","journal-title":"Prague Bull Math Ling"},{"key":"20836_CR3","doi-asserted-by":"publisher","unstructured":"Bauwens T, Delobelle P (2024) BPE-knockout: Pruning pre-existing BPE tokenisers with backwards-compatible morphological semi-supervision. In: Duh K, Gomez H, Bethard S (eds) Proceedings of the 2024 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (Volume 1: Long Papers). Association for Computational Linguistics, Mexico City, Mexico, pp 5810\u20135832. https:\/\/doi.org\/10.18653\/v1\/2024.naacl-long.324. https:\/\/aclanthology.org\/2024.naacl-long.324","DOI":"10.18653\/v1\/2024.naacl-long.324"},{"key":"20836_CR4","unstructured":"Bengio Y, Ducharme R, Vincent P (2000) A neural probabilistic language model. Adv Neural Inf Process Syst 13"},{"issue":"2","key":"20836_CR5","first-page":"263","volume":"19","author":"PF Brown","year":"1993","unstructured":"Brown PF, Della Pietra SA, Della Pietra VJ et al (1993) The mathematics of statistical machine translation: Parameter estimation. Comput Linguist 19(2):263\u2013311","journal-title":"Comput Linguist"},{"key":"20836_CR6","doi-asserted-by":"publisher","first-page":"330","DOI":"10.1109\/TASLP.2021.3138714","volume":"30","author":"K Chen","year":"2022","unstructured":"Chen K, Wang R, Utiyama M et al (2022) Integrating prior translation knowledge into neural machine translation. IEEE\/ACM Trans Audio Speech Lang Process 30:330\u2013339. https:\/\/doi.org\/10.1109\/TASLP.2021.3138714","journal-title":"IEEE\/ACM Trans Audio Speech Lang Process"},{"issue":"11","key":"20836_CR7","doi-asserted-by":"publisher","first-page":"4568","DOI":"10.1109\/TFUZZ.2022.3167129","volume":"30","author":"K Chen","year":"2022","unstructured":"Chen K, Yang M, Zhao T et al (2022) Data-driven fuzzy target-side representation for intelligent translation system. IEEE Transactions on Fuzzy Systems 30(11):4568\u20134577","journal-title":"IEEE Transactions on Fuzzy Systems"},{"key":"20836_CR8","doi-asserted-by":"publisher","unstructured":"Gaser M, Mager M, Hamed I et\u00a0al (2023) Exploring segmentation approaches for neural machine translation of code-switched Egyptian Arabic-English text. In: Vlachos A, Augenstein I (eds) Proceedings of the 17th Conference of the European Chapter of the Association for Computational Linguistics. Association for Computational Linguistics, Dubrovnik, Croatia, pp 3523\u20133538. https:\/\/doi.org\/10.18653\/v1\/2023.eacl-main.256. https:\/\/aclanthology.org\/2023.eacl-main.256","DOI":"10.18653\/v1\/2023.eacl-main.256"},{"key":"20836_CR9","unstructured":"Gr\u00f6nroos SA, Virpioja S, Smit P et\u00a0al (2014) Morfessor flatcat: An hmm-based method for unsupervised and semi-supervised learning of morphology. In: Proceedings of COLING 2014, the 25th International Conference on Computational Linguistics: Technical Papers, pp 1177\u20131185"},{"key":"20836_CR10","doi-asserted-by":"publisher","unstructured":"Gr\u00f6nroos SA, Virpioja S, Kurimo M (2018) Cognate-aware morphological segmentation for multilingual neural translation. In: Proceedings of the Third Conference on Machine Translation: Shared Task Papers. Association for Computational Linguistics, Belgium, Brussels, pp 386\u2013393. https:\/\/doi.org\/10.18653\/v1\/W18-6410. https:\/\/aclanthology.org\/W18-6410","DOI":"10.18653\/v1\/W18-6410"},{"issue":"8","key":"20836_CR11","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter S, Schmidhuber J (1997) Long short-term memory. Neural Comput 9(8):1735\u20131780","journal-title":"Neural Comput"},{"key":"20836_CR12","doi-asserted-by":"publisher","unstructured":"Hou J, Katinskaia A, Vu AD et\u00a0al (2023) Effects of sub-word segmentation on performance of transformer language models. In: Bouamor H, Pino J, Bali K (eds) Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing. Association for Computational Linguistics, Singapore, pp 7413\u2013742. https:\/\/doi.org\/10.18653\/v1\/2023.emnlp-main.459. https:\/\/aclanthology.org\/2023.emnlp-main.459","DOI":"10.18653\/v1\/2023.emnlp-main.459"},{"issue":"102","key":"20836_CR13","first-page":"022","volume":"102","author":"H Huang","year":"2024","unstructured":"Huang H, Wu S, Chen K et al (2024) Multi-view fusion for universal translation quality estimation. Inf Fus 102(102):022","journal-title":"Inf Fus"},{"key":"20836_CR14","doi-asserted-by":"publisher","unstructured":"Huck M, Riess S, Fraser A (2017) Target-side word segmentation strategies for neural machine translation. In: Proceedings of the Second Conference on Machine Translation. Association for Computational Linguistics, Copenhagen, Denmark, pp 56\u20136. https:\/\/doi.org\/10.18653\/v1\/W17-4706, https:\/\/aclanthology.org\/W17-4706","DOI":"10.18653\/v1\/W17-4706"},{"key":"20836_CR15","doi-asserted-by":"publisher","unstructured":"Jean S, Cho K (2020) Log-linear reformulation of the noisy channel model for document-level neural machine translation. In: Proceedings of the Fourth Workshop on Structured Prediction for NLP. Association for Computational Linguistics, Online, pp 95\u201310. https:\/\/doi.org\/10.18653\/v1\/2020.spnlp-1.11. https:\/\/aclanthology.org\/2020.spnlp-1.11","DOI":"10.18653\/v1\/2020.spnlp-1.11"},{"key":"20836_CR16","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511815829","volume-title":"Statistical machine translation","author":"P Koehn","year":"2009","unstructured":"Koehn P (2009) Statistical machine translation. Cambridge University Press"},{"key":"20836_CR17","unstructured":"Lafferty JD, McCallum A, Pereira FCN (2001) Conditional random fields: Probabilistic models for segmenting and labeling sequence data. In: Proceedings of the Eighteenth International Conference on Machine Learning. Morgan Kaufmann Publishers Inc., San Francisco, CA, USA, ICML \u201901, pp 282\u2013289"},{"key":"20836_CR18","doi-asserted-by":"publisher","unstructured":"Meyer F, Buys J (2024) A systematic analysis of subwords and cross-lingual transfer in multilingual translation. In: Duh K, Gomez H, Bethard S (eds) Findings of the Association for Computational Linguistics: NAACL 2024. Association for Computational Linguistics, Mexico City, Mexico, pp 2194\u2013220. https:\/\/doi.org\/10.18653\/v1\/2024.findings-naacl.141. https:\/\/aclanthology.org\/2024.findings-naacl.141","DOI":"10.18653\/v1\/2024.findings-naacl.141"},{"key":"20836_CR19","doi-asserted-by":"publisher","unstructured":"Nguyen T, Chiang D (2018) Improving lexical choice in neural machine translation. In: Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers). Association for Computational Linguistics, New Orleans, Louisiana, pp 334\u201334. https:\/\/doi.org\/10.18653\/v1\/N18-1031. https:\/\/aclanthology.org\/N18-1031","DOI":"10.18653\/v1\/N18-1031"},{"key":"20836_CR20","doi-asserted-by":"crossref","unstructured":"Papineni K, Roukos S, Ward T et\u00a0al (2002) Bleu: a method for automatic evaluation of machine translation. In: Proceedings of the 40th annual meeting of the Association for Computational Linguistics, pp 311\u2013318","DOI":"10.3115\/1073083.1073135"},{"key":"20836_CR21","doi-asserted-by":"publisher","unstructured":"Saleva J, Lignos C (2021) The effectiveness of morphology-aware segmentation in low-resource neural machine translation. In: Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Student Research Workshop. Association for Computational Linguistics, Online, pp 164\u201317. https:\/\/doi.org\/10.18653\/v1\/2021.eacl-srw.22. https:\/\/aclanthology.org\/2021.eacl-srw.22","DOI":"10.18653\/v1\/2021.eacl-srw.22"},{"key":"20836_CR22","unstructured":"Scherrer Y, Gr\u00f6nroos SA, Virpioja S (2020) The University of Helsinki and aalto university submissions to the WMT 2020 news and low-resource translation tasks. In: Proceedings of the Fifth Conference on Machine Translation. Association for Computational Linguistics, Online, pp 1129\u20131138. https:\/\/aclanthology.org\/2020.wmt-1.134"},{"key":"20836_CR23","doi-asserted-by":"publisher","unstructured":"Sennrich R, Haddow B, Birch A (2016) Neural machine translation of rare words with subword units. In: Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers). Association for Computational Linguistics, Berlin, Germany, pp 1715\u20131725. https:\/\/doi.org\/10.18653\/v1\/P16-1162. https:\/\/aclanthology.org\/P16-1162","DOI":"10.18653\/v1\/P16-1162"},{"key":"20836_CR24","doi-asserted-by":"publisher","unstructured":"Sreedhar MN, Wan X, Cheng Y et\u00a0al (2023) Local byte fusion for neural machine translation. In: Rogers A, Boyd-Graber J, Okazaki N (eds) Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers). Association for Computational Linguistics, Toronto, Canada, pp 7199\u2013721. https:\/\/doi.org\/10.18653\/v1\/2023.acl-long.397. https:\/\/aclanthology.org\/2023.acl-long.397","DOI":"10.18653\/v1\/2023.acl-long.397"},{"key":"20836_CR25","doi-asserted-by":"crossref","unstructured":"Stolcke A (2002) Srilm-an extensible language modeling toolkit. In: Seventh international conference on spoken language processing","DOI":"10.21437\/ICSLP.2002-303"},{"key":"20836_CR26","doi-asserted-by":"publisher","unstructured":"Tawfik A, Emam M, Essam K et\u00a0al (2019) Morphology-aware word-segmentation in dialectal Arabic adaptation of neural machine translation. In: Proceedings of the Fourth Arabic Natural Language Processing Workshop. Association for Computational Linguistics, Florence, Italy, pp 11\u201317. https:\/\/doi.org\/10.18653\/v1\/W19-4602. https:\/\/aclanthology.org\/W19-4602","DOI":"10.18653\/v1\/W19-4602"},{"key":"20836_CR27","doi-asserted-by":"crossref","unstructured":"Tiedemann J (2009) News from opus-a collection of multilingual parallel corpora with tools and interfaces. In: Recent advances in natural language processing, pp 237\u2013248","DOI":"10.1075\/cilt.309.19tie"},{"issue":"8","key":"20836_CR28","doi-asserted-by":"publisher","first-page":"5929","DOI":"10.1007\/s10462-020-09838-1","volume":"53","author":"G Van Houdt","year":"2020","unstructured":"Van Houdt G, Mosquera C, N\u00e1poles G (2020) A review on the long short-term memory model. Artif Intell Rev 53(8):5929\u20135955","journal-title":"Artif Intell Rev"},{"key":"20836_CR29","doi-asserted-by":"crossref","unstructured":"Zeng X, Chao LS, Wong DF et\u00a0al (2014) Toward better chinese word segmentation for smt via bilingual constraints. In: Proceedings of the 52nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp 1360\u20131369","DOI":"10.3115\/v1\/P14-1128"},{"issue":"4","key":"20836_CR30","doi-asserted-by":"publisher","first-page":"2527","DOI":"10.1007\/s11277-018-5274-8","volume":"102","author":"S Zhu","year":"2018","unstructured":"Zhu S (2018) A neural attention based model for morphological segmentation. Wirel Pers Commun 102(4):2527\u2013253. https:\/\/doi.org\/10.1007\/s11277-018-5274-8","journal-title":"Wirel Pers Commun"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-025-20836-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-025-20836-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-025-20836-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,2]],"date-time":"2025-10-02T23:08:38Z","timestamp":1759446518000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-025-20836-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,15]]},"references-count":30,"journal-issue":{"issue":"34","published-online":{"date-parts":[[2025,10]]}},"alternative-id":["20836"],"URL":"https:\/\/doi.org\/10.1007\/s11042-025-20836-9","relation":{},"ISSN":["1573-7721"],"issn-type":[{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2025,4,15]]},"assertion":[{"value":"15 June 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 April 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 April 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 April 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"On behalf of all authors, the corresponding author states that there is no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of Interest"}}]}}