{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T07:54:13Z","timestamp":1743062053588,"version":"3.40.3"},"publisher-location":"Cham","reference-count":46,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030687861"},{"type":"electronic","value":"9783030687878"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-68787-8_24","type":"book-chapter","created":{"date-parts":[[2021,2,20]],"date-time":"2021-02-20T17:55:55Z","timestamp":1613843755000},"page":"326-338","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["A Comparison of Character-Based Neural Machine Translations Techniques Applied to Spelling Normalization"],"prefix":"10.1007","author":[{"given":"Miguel","family":"Domingo","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Francisco","family":"Casacuberta","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,2,21]]},"reference":[{"key":"24_CR1","unstructured":"Bahdanau, D., Cho, K., Bengio, Y.: Neural machine translation by jointly learning to align and translate. arXiv:1409.0473 (2015)"},{"key":"24_CR2","unstructured":"Baron, A., Rayson, P.: VARD2: a tool for dealing with spelling variation in historical corpora. In: Postgraduate Conference in Corpus Linguistics (2008)"},{"key":"24_CR3","unstructured":"Bollmann, M.: Normalization of historical texts with neural network models. Ph.D. thesis, Sprachwissenschaftliches Institut, Ruhr-Universit\u00e4t (2018)"},{"key":"24_CR4","unstructured":"Bollmann, M., S\u00f8gaard, A.: Improving historical spelling normalization with bi-directional LSTMs and multi-task learning. In: Proceedings of the International Conference on the Computational Linguistics, pp. 131\u2013139 (2016)"},{"issue":"2","key":"24_CR5","first-page":"263","volume":"19","author":"PF Brown","year":"1993","unstructured":"Brown, P.F., Pietra, V.J.D., Pietra, S.A.D., Mercer, R.L.: The mathematics of statistical machine translation: parameter estimation. Comput. Linguist. 19(2), 263\u2013311 (1993)","journal-title":"Comput. Linguist."},{"key":"24_CR6","doi-asserted-by":"crossref","unstructured":"Chatterjee, R., Farajian, M.A., Negri, M., Turchi, M., Srivastava, A., Pal, S.: Multi-source neural automatic post-editing: FBK\u2019s participation in the WMT 2017 APE shared task. In: Proceedings of the Second Conference on Machine Translation, pp. 630\u2013638 (2017)","DOI":"10.18653\/v1\/W17-4773"},{"key":"24_CR7","doi-asserted-by":"crossref","unstructured":"Chung, J., Cho, K., Bengio, Y.: A character-level decoder without explicit segmentation for neural machine translation. In: Proceedings of the Annual Meeting of the Association for Computational Linguistics, pp. 1693\u20131703 (2016)","DOI":"10.18653\/v1\/P16-1160"},{"key":"24_CR8","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1007\/s10590-017-9196-0","volume":"31","author":"MR Costa-Juss\u00e0","year":"2017","unstructured":"Costa-Juss\u00e0, M.R., Ald\u00f3n, D., Fonollosa, J.A.: Chinese-Spanish neural machine translation enhanced with character and word bitmap fonts. Mach. Transl. 31, 35\u201347 (2017)","journal-title":"Mach. Transl."},{"key":"24_CR9","doi-asserted-by":"crossref","unstructured":"Costa-Juss\u00e0, M.R., Fonollosa, J.A.: Character-based neural machine translation. In: Proceedings of the Annual Meeting of the Association for Computational Linguistics, pp. 357\u2013361 (2016)","DOI":"10.18653\/v1\/P16-2058"},{"key":"24_CR10","unstructured":"Domingo, M., Casacuberta, F.: Spelling normalization of historical documents by using a machine translation approach. In: Proceedings of the Annual Conference of the European Association for Machine Translation, pp. 129\u2013137 (2018)"},{"key":"24_CR11","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1007\/978-3-030-30754-7_7","volume-title":"New Trends in Image Analysis and Processing \u2013 ICIAP 2019","author":"M Domingo","year":"2019","unstructured":"Domingo, M., Casacuberta, F.: Enriching character-based neural machine translation with modern documents for achieving an orthography consistency in historical documents. In: Cristani, M., Prati, A., Lanz, O., Messelodi, S., Sebe, N. (eds.) ICIAP 2019. LNCS, vol. 11808, pp. 59\u201369. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-30754-7_7"},{"key":"24_CR12","unstructured":"Domingo, M., et al.: A user study of the incremental learning in NMT. In: Proceedings of the European Association for Machine Translation, pp. 319\u2013328 (2020)"},{"key":"24_CR13","volume-title":"Works of Miguel de Cervantes in Old- and Modern-Spelling","author":"F Jehle","year":"2001","unstructured":"Jehle, F.: Works of Miguel de Cervantes in Old- and Modern-Spelling. Indiana University Purdue University, Fort Wayne (2001)"},{"key":"24_CR14","unstructured":"Gehring, J., Auli, M., Grangier, D., Yarats, D., Dauphin, Y.N.: Convolutional sequence to sequence learning. arXiv:1705.03122 (2017)"},{"issue":"10","key":"24_CR15","doi-asserted-by":"publisher","first-page":"2451","DOI":"10.1162\/089976600300015015","volume":"12","author":"FA Gers","year":"2000","unstructured":"Gers, F.A., Schmidhuber, J., Cummins, F.: Learning to forget: continual prediction with LSTM. Neural Comput. 12(10), 2451\u20132471 (2000)","journal-title":"Neural Comput."},{"key":"24_CR16","unstructured":"H\u00e4m\u00e4l\u00e4inen, M., S\u00e4ily, T., Rueter, J., Tiedemann, J., M\u00e4kel\u00e4, E.: Normalizing early English letters to present-day English spelling. In: Proceedings of the Workshop on Computational Linguistics for Cultural Heritage, Social Sciences, Humanities and Literature, pp. 87\u201396 (2018)"},{"key":"24_CR17","unstructured":"Kingma, D.P., Ba, J.: Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"key":"24_CR18","doi-asserted-by":"crossref","unstructured":"Klein, G., Kim, Y., Deng, Y., Senellart, J., Rush, A.M.: OpenNMT: open-source toolkit for neural machine translation. In: Proceedings of the Association for Computational Linguistics: System Demonstration, pp. 67\u201372 (2017)","DOI":"10.18653\/v1\/P17-4012"},{"key":"24_CR19","doi-asserted-by":"crossref","unstructured":"Koehn, P., et al.: Moses: open source toolkit for statistical machine translation. In: Proceedings of the Annual Meeting of the Association for Computational Linguistics, pp. 177\u2013180 (2007)","DOI":"10.3115\/1557769.1557821"},{"key":"24_CR20","doi-asserted-by":"crossref","unstructured":"Koehn, P., Och, F.J., Marcu, D.: Statistical phrase-based translation. In: Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics on Human Language Technology, pp. 48\u201354 (2003)","DOI":"10.3115\/1073445.1073462"},{"key":"24_CR21","unstructured":"Korchagina, N.: Normalizing medieval German texts: from rules to deep learning. In: Proceedings of the Nordic Conference on Computational Linguistics Workshop on Processing Historical Language, pp. 12\u201317 (2017)"},{"key":"24_CR22","doi-asserted-by":"crossref","unstructured":"Laing, M.: The linguistic analysis of medieval vernacular texts: two projects at Edinburgh. In: Rissanen, M., Kytd, M., Wright, S. (eds.) Corpora Across the Centuries: Proceedings of the First International Colloquium on English Diachronic Corpora, vol. 25427, pp. 121\u2013141. St Catharine\u2019s College, Cambridge (1993)","DOI":"10.1163\/9789004657311_017"},{"key":"24_CR23","unstructured":"Ling, W., Trancoso, I., Dyer, C., Black, A.W.: Character-based neural machine translation. arXiv preprint arXiv:1511.04586 (2015)"},{"key":"24_CR24","unstructured":"Lison, P., Tiedemann, J.: Opensubtitles 2016: extracting large parallel corpora from movie and tv subtitles. In: Proceedings of the International Conference on Language Resources Association, pp. 923\u2013929 (2016)"},{"key":"24_CR25","unstructured":"Ljube\u0161i\u0107, N., Zupan, K., Fi\u0161er, D., Erjavec, T.: Dataset of normalised Slovene text KonvNormSl 1.0. Slovenian language resource repository CLARIN. SI (2016). http:\/\/hdl.handle.net\/11356\/1068"},{"key":"24_CR26","unstructured":"Ljube\u0161ic, N., Zupan, K., Fi\u0161er, D., Erjavec, T.: Normalising Slovene data: historical texts vs. user-generated content. In: Proceedings of the Conference on Natural Language Processing, pp. 146\u2013155 (2016)"},{"key":"24_CR27","unstructured":"Nakov, P., Tiedemann, J.: Combining word-level and character-level models for machine translation between closely-related languages. In: Proceedings of the Annual Meeting of the Association for Computational Linguistics, pp. 301\u2013305 (2012)"},{"key":"24_CR28","doi-asserted-by":"crossref","unstructured":"Och, F.J.: Minimum error rate training in statistical machine translation. In: Proceedings of the Annual Meeting of the Association for Computational Linguistics, pp. 160\u2013167 (2003)","DOI":"10.3115\/1075096.1075117"},{"key":"24_CR29","doi-asserted-by":"crossref","unstructured":"Och, F.J., Ney, H.: Discriminative training and maximum entropy models for statistical machine translation. In: Proceedings of the Annual Meeting of the Association for Computational Linguistics, pp. 295\u2013302 (2002)","DOI":"10.3115\/1073083.1073133"},{"key":"24_CR30","doi-asserted-by":"crossref","unstructured":"Papineni, K., Roukos, S., Ward, T., Zhu, W.J.: BLEU: a method for automatic evaluation of machine translation. In: Proceedings of the Annual Meeting of the Association for Computational Linguistics, pp. 311\u2013318 (2002)","DOI":"10.3115\/1073083.1073135"},{"key":"24_CR31","unstructured":"Porta, J., Sancho, J.L., G\u00f3mez, J.: Edit transducers for spelling variation in old Spanish. In: Proceedings of the Workshop on Computational Historical Linguistics, pp. 70\u201379 (2013)"},{"key":"24_CR32","doi-asserted-by":"crossref","unstructured":"Post, M.: A call for clarity in reporting BLEU scores. In: Proceedings of the Third Conference on Machine Translation, pp. 186\u2013191 (2018)","DOI":"10.18653\/v1\/W18-6319"},{"key":"24_CR33","unstructured":"Riezler, S., Maxwell, J.T.: On some pitfalls in automatic evaluation and significance testing for MT. In: Proceedings of the Workshop on Intrinsic and Extrinsic Evaluation Measures for Machine Translation and\/or Summarization, pp. 57\u201364 (2005)"},{"key":"24_CR34","doi-asserted-by":"publisher","first-page":"400","DOI":"10.1214\/aoms\/1177729586","volume":"22","author":"H Robbins","year":"1951","unstructured":"Robbins, H., Monro, S.: A stochastic approximation method. Ann. Math. Stat. 22, 400\u2013407 (1951)","journal-title":"Ann. Math. Stat."},{"issue":"6088","key":"24_CR35","doi-asserted-by":"publisher","first-page":"533","DOI":"10.1038\/323533a0","volume":"323","author":"DE Rumelhart","year":"1986","unstructured":"Rumelhart, D.E., Hinton, G.E., Williams, R.J.: Learning representations by back-propagating errors. Nature 323(6088), 533\u2013536 (1986)","journal-title":"Nature"},{"key":"24_CR36","unstructured":"Scherrer, Y., Erjavec, T.: Modernizing historical Slovene words with character-based SMT. In: Proceedings of the Workshop on Balto-Slavic Natural Language Processing, pp. 58\u201362 (2013)"},{"key":"24_CR37","doi-asserted-by":"crossref","unstructured":"Sennrich, R., Haddow, B., Birch, A.: Neural machine translation of rare words with subword units. In: Proceedings of the Annual Meeting of the Association for Computational Linguistics, pp. 1715\u20131725 (2016)","DOI":"10.18653\/v1\/P16-1162"},{"key":"24_CR38","unstructured":"Snover, M., Dorr, B., Schwartz, R., Micciulla, L., Makhoul, J.: A study of translation edit rate with targeted human annotation. In: Proceedings of the Association for Machine Translation in the Americas, pp. 223\u2013231 (2006)"},{"key":"24_CR39","doi-asserted-by":"crossref","unstructured":"Stolcke, A.: SRILM - an extensible language modeling toolkit. In: Proceedings of the International Conference on Spoken Language Processing, pp. 257\u2013286 (2002)","DOI":"10.21437\/ICSLP.2002-303"},{"key":"24_CR40","unstructured":"Sutskever, I., Vinyals, O., Le, Q.V.: Sequence to sequence learning with neural networks. In: Proceedings of the Advances in Neural Information Processing Systems, vol. 27, pp. 3104\u20133112 (2014)"},{"key":"24_CR41","doi-asserted-by":"crossref","unstructured":"Szegedy, C., et al.: Going deeper with convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1\u20139 (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"24_CR42","unstructured":"Tang, G., Cap, F., Pettersson, E., Nivre, J.: An evaluation of neural machine translation models on historical spelling normalization. In: Proceedings of the International Conference on Computational Linguistics, pp. 1320\u20131331 (2018)"},{"key":"24_CR43","unstructured":"Tiedemann, J.: Character-based PSMT for closely related languages. In: Proceedings of the Annual Conference of the European Association for Machine Translation, pp. 12\u201319 (2009)"},{"key":"24_CR44","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, pp. 5998\u20136008 (2017)"},{"key":"24_CR45","unstructured":"Wu, Y., et al.: Google\u2019s neural machine translation system: bridging the gap between human and machine translation. arXiv:1609.08144 (2016)"},{"key":"24_CR46","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1007\/3-540-45751-8_2","volume-title":"KI 2002: Advances in Artificial Intelligence","author":"R Zens","year":"2002","unstructured":"Zens, R., Och, F.J., Ney, H.: Phrase-based statistical machine translation. In: Jarke, M., Lakemeyer, G., Koehler, J. (eds.) KI 2002. LNCS (LNAI), vol. 2479, pp. 18\u201332. Springer, Heidelberg (2002). https:\/\/doi.org\/10.1007\/3-540-45751-8_2"}],"container-title":["Lecture Notes in Computer Science","Pattern Recognition. ICPR International Workshops and Challenges"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-68787-8_24","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,24]],"date-time":"2024-08-24T15:16:22Z","timestamp":1724512582000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-68787-8_24"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030687861","9783030687878"],"references-count":46,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-68787-8_24","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"21 February 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICPR","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Pattern Recognition","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"10 January 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"11 January 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ICPR2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.icpr2020.it\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}