{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:24:04Z","timestamp":1750220644197,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":30,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,12,18]],"date-time":"2020-12-18T00:00:00Z","timestamp":1608249600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,12,18]]},"DOI":"10.1145\/3443279.3443310","type":"proceedings-article","created":{"date-parts":[[2021,2,1]],"date-time":"2021-02-01T22:50:44Z","timestamp":1612219844000},"page":"149-156","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":10,"title":["Character-Level Transformer-Based Neural Machine Translation"],"prefix":"10.1145","author":[{"given":"Nikolay","family":"Banar","sequence":"first","affiliation":[{"name":"CliPS, University of Antwerp, ACDC, University of Antwerp Antwerp, Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Walter","family":"Daelemans","sequence":"additional","affiliation":[{"name":"CliPS, University of Antwerp, Antwerp, Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mike","family":"Kestemont","sequence":"additional","affiliation":[{"name":"CliPS, University of Antwerp, ACDC, University of Antwerp Antwerp, Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2021,2]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Proceedings of the International Conference on Learning Representations, ICLR 2015","author":"Bahdanau D.","year":"2015","unstructured":"D. Bahdanau , K. Cho , and Y. Bengio . Neural machine translation by jointly learning to align and translate . In Proceedings of the International Conference on Learning Representations, ICLR 2015 , 2015 . D. Bahdanau, K. Cho, and Y. Bengio. Neural machine translation by jointly learning to align and translate. In Proceedings of the International Conference on Learning Representations, ICLR 2015, 2015."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.5220\/0009167205220529"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1008"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1461"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/W14-4012"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1160"},{"key":"e_1_3_2_1_8_1","first-page":"357","volume-title":"Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","author":"Fonollosa M. R.","year":"2016","unstructured":"M. R. Costa-juss\u00e0 and J. A. Fonollosa . Character-based neural machine translation . In Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers) , pages 357 -- 361 , 2016 . M. R. Costa-juss\u00e0 and J. A. Fonollosa. Character-based neural machine translation. In Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), pages 357--361, 2016."},{"key":"e_1_3_2_1_9_1","first-page":"249","volume-title":"Proceedings of the thirteenth international conference on artificial intelligence and statistics","author":"Glorot X.","year":"2010","unstructured":"X. Glorot and Y. Bengio . Understanding the difficulty of training deep feedforward neural networks . In Proceedings of the thirteenth international conference on artificial intelligence and statistics , pages 249 -- 256 , 2010 . X. Glorot and Y. Bengio. Understanding the difficulty of training deep feedforward neural networks. In Proceedings of the thirteenth international conference on artificial intelligence and statistics, pages 249--256, 2010."},{"key":"e_1_3_2_1_10_1","volume-title":"Character-based nmt with transformer. arXiv preprint arXiv:1911.04997","author":"Gupta R.","year":"2019","unstructured":"R. Gupta , L. Besacier , M. Dymetman , and M. Gall\u00e9 . Character-based nmt with transformer. arXiv preprint arXiv:1911.04997 , 2019 . R. Gupta, L. Besacier, M. Dymetman, and M. Gall\u00e9. Character-based nmt with transformer. arXiv preprint arXiv:1911.04997, 2019."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00065"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.5555\/3016100.3016285"},{"key":"e_1_3_2_1_14_1","volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","author":"Kingma D. P.","year":"2014","unstructured":"D. P. Kingma and J. Ba . Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980 , 2014 . D. P. Kingma and J. Ba. Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980, 2014."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P17-4012"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.5555\/1557769.1557821"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00067"},{"key":"e_1_3_2_1_18_1","volume-title":"Character-based neural machine translation. arXiv preprint arXiv:1511.04586","author":"Ling W.","year":"2015","unstructured":"W. Ling , I. Trancoso , C. Dyer , and A. W. Black . Character-based neural machine translation. arXiv preprint arXiv:1511.04586 , 2015 . W. Ling, I. Trancoso, C. Dyer, and A. W. Black. Character-based neural machine translation. arXiv preprint arXiv:1511.04586, 2015."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1100"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D15-1166"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W18-6450"},{"key":"e_1_3_2_1_22_1","first-page":"311","volume-title":"Proceedings of the 40th annual meeting on association for computational linguistics","author":"Papineni K.","year":"2002","unstructured":"K. Papineni , S. Roukos , T. Ward , and W.-J. Zhu . Bleu : a method for automatic evaluation of machine translation . In Proceedings of the 40th annual meeting on association for computational linguistics , pages 311 -- 318 . Association for Computational Linguistics , 2002 . K. Papineni, S. Roukos, T. Ward, and W.-J. Zhu. Bleu: a method for automatic evaluation of machine translation. In Proceedings of the 40th annual meeting on association for computational linguistics, pages 311--318. Association for Computational Linguistics, 2002."},{"key":"e_1_3_2_1_23_1","first-page":"8026","volume-title":"Advances in Neural Information Processing Systems","author":"Paszke A.","year":"2019","unstructured":"A. Paszke , S. Gross , F. Massa , A. Lerer , J. Bradbury , G. Chanan , T. Killeen , Z. Lin , N. Gimelshein , L. Antiga , : An imperative style, high-performance deep learning library . In Advances in Neural Information Processing Systems , pages 8026 -- 8037 , 2019 . A. Paszke, S. Gross, F. Massa, A. Lerer, J. Bradbury, G. Chanan, T. Killeen, Z. Lin, N. Gimelshein, L. Antiga, et al. Pytorch: An imperative style, high-performance deep learning library. In Advances in Neural Information Processing Systems, pages 8026--8037, 2019."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.2478\/pralin-2018-0002"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W15-3049"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-1162"},{"key":"e_1_3_2_1_27_1","first-page":"2377","volume-title":"Advances in neural information processing systems","author":"Srivastava R. K.","year":"2015","unstructured":"R. K. Srivastava , K. Greff , and J. Schmidhuber . Training very deep networks . In Advances in neural information processing systems , pages 2377 -- 2385 , 2015 . R. K. Srivastava, K. Greff, and J. Schmidhuber. Training very deep networks. In Advances in neural information processing systems, pages 2377--2385, 2015."},{"key":"e_1_3_2_1_28_1","first-page":"3104","volume-title":"Advances in neural information processing systems","author":"Sutskever I.","year":"2014","unstructured":"I. Sutskever , O. Vinyals , and Q. V. Le . Sequence to sequence learning with neural networks . In Advances in neural information processing systems , pages 3104 -- 3112 , 2014 . I. Sutskever, O. Vinyals, and Q. V. Le. Sequence to sequence learning with neural networks. In Advances in neural information processing systems, pages 3104--3112, 2014."},{"key":"e_1_3_2_1_29_1","first-page":"5998","volume-title":"Advances in neural information processing systems","author":"Vaswani A.","year":"2017","unstructured":"A. Vaswani , N. Shazeer , N. Parmar , J. Uszkoreit , L. Jones , A. N. Gomez , \u0141. Kaiser, and I. Polosukhin . Attention is all you need . In Advances in neural information processing systems , pages 5998 -- 6008 , 2017 . A. Vaswani, N. Shazeer, N. Parmar, J. Uszkoreit, L. Jones, A. N. Gomez, \u0141. Kaiser, and I. Polosukhin. Attention is all you need. In Advances in neural information processing systems, pages 5998--6008, 2017."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W16-2342"}],"event":{"name":"NLPIR 2020: 4th International Conference on Natural Language Processing and Information Retrieval","sponsor":["FernUniversit\u00e4t in Hagen"],"location":"Seoul Republic of Korea","acronym":"NLPIR 2020"},"container-title":["Proceedings of the 4th International Conference on Natural Language Processing and Information Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3443279.3443310","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3443279.3443310","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T22:02:12Z","timestamp":1750197732000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3443279.3443310"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,12,18]]},"references-count":30,"alternative-id":["10.1145\/3443279.3443310","10.1145\/3443279"],"URL":"https:\/\/doi.org\/10.1145\/3443279.3443310","relation":{},"subject":[],"published":{"date-parts":[[2020,12,18]]},"assertion":[{"value":"2021-02-01","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}