{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T15:54:50Z","timestamp":1775145290435,"version":"3.50.1"},"reference-count":42,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2022,1,13]],"date-time":"2022-01-13T00:00:00Z","timestamp":1642032000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,1,13]],"date-time":"2022-01-13T00:00:00Z","timestamp":1642032000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Mach Learn"],"published-print":{"date-parts":[[2022,3]]},"DOI":"10.1007\/s10994-021-06073-9","type":"journal-article","created":{"date-parts":[[2022,1,13]],"date-time":"2022-01-13T00:03:47Z","timestamp":1642032227000},"page":"1181-1203","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":28,"title":["End-to-end entity-aware neural machine translation"],"prefix":"10.1007","volume":"111","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7126-0139","authenticated-orcid":false,"given":"Shufang","family":"Xie","sequence":"first","affiliation":[]},{"given":"Yingce","family":"Xia","sequence":"additional","affiliation":[]},{"given":"Lijun","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Yiqing","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Yang","family":"Fan","sequence":"additional","affiliation":[]},{"given":"Tao","family":"Qin","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,1,13]]},"reference":[{"key":"6073_CR1","doi-asserted-by":"crossref","unstructured":"Bojar, O., Chatterjee, R., Federmann, C., Graham, Y., Haddow, B., Huang, S., Huck, M., Koehn, P., Liu, Q., Logacheva, V., Monz, C., Negri, M., Post, M., Rubino, R., Specia, L., & Turchi, M. (2017). Findings of the 2017 conference on machine translation (WMT17). In: Proceedings of the Second Conference on Machine Translation, pp. 169\u2013214. Copenhagen, Denmark.","DOI":"10.18653\/v1\/W17-4717"},{"key":"6073_CR2","doi-asserted-by":"crossref","unstructured":"Burtsev, M., Seliverstov, A., Airapetyan, R., Arkhipov, M., Baymurzina, D., Bushkov, N., Gureenkova, O., Khakhulin, T., Kuratov, Y., Kuznetsov, D., Litinsky, A., Logacheva, V., Lymar, A., Malykh, V., Petrov, M., Polulyakh, V., Pugachev, L., Sorokin, A., Vikhreva, M., & Zaynutdinov, M. (2018). DeepPavlov: Open-source library for dialogue systems. In: Proceedings of ACL 2018, System Demonstrations, pp. 122\u2013127. Melbourne, Australia.","DOI":"10.18653\/v1\/P18-4021"},{"key":"6073_CR3","unstructured":"Cettolo, M., Girardi, C., & Federico, M. (2012). WIT3: Web inventory of transcribed and translated talks. In: Proceedings of the 16th Annual conference of the European Association for Machine Translation, pp. 261\u2013268. Trento, Italy"},{"key":"6073_CR4","doi-asserted-by":"crossref","unstructured":"Clinchant, S., Jung, K.W., & Nikoulina, V. (2019). On the use of bert for neural machine translation. arXiv preprint arXiv:1909.12744.","DOI":"10.18653\/v1\/D19-5611"},{"key":"6073_CR5","unstructured":"Devlin, J., Chang, M.W., Lee, K., & Toutanova, K. (2019). BERT: Pre-training of deep bidirectional transformers for language understanding. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), pp. 4171\u20134186. Minneapolis, Minnesota."},{"key":"6073_CR6","unstructured":"Dyer, C., Chahuneau, V., & Smith, N.A. (2013). A simple, fast, and effective reparameterization of IBM model 2. In: Proceedings of the 2013 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 644\u2013648. Atlanta, Georgia."},{"key":"6073_CR7","doi-asserted-by":"crossref","unstructured":"Finkel, J.R., Grenager, T., & Manning, C. (2005). Incorporating non-local information into information extraction systems by Gibbs sampling. In: Proceedings of the 43rd Annual Meeting of the Association for Computational Linguistics (ACL\u201905), pp. 363\u2013370. Ann Arbor, Michigan.","DOI":"10.3115\/1219840.1219885"},{"key":"6073_CR8","unstructured":"Fonollosa, J.A.R., Casas, N., & Costa-juss\u00e0, M. (2019). Joint source-target self attention with locality constraints. ArXiv preprint arXiv:1905.06596"},{"key":"6073_CR9","unstructured":"Hassan, H., Aue, A., Chen, C., Chowdhary, V., Clark, J., Federmann, C., Huang, X., Junczys-Dowmunt, M., Lewis, W., & Li, M., et\u00a0al. (2018). Achieving human parity on automatic chinese to english news translation. arXiv preprint arXiv:1803.05567"},{"key":"6073_CR10","doi-asserted-by":"crossref","unstructured":"Kim, Y.J., Junczys-Dowmunt, M., Hassan, H., Fikri\u00a0Aji, A., Heafield, K., Grundkiewicz, R., & Bogoychev, N. (2019). From research to production and back: Ludicrously fast neural machine translation. In: Proceedings of the 3rd Workshop on Neural Generation and Translation, pp. 280\u2013288. Hong Kong.","DOI":"10.18653\/v1\/D19-5632"},{"key":"6073_CR11","unstructured":"Kingma, D.P., & Ba, J. (2015). Adam: A method for stochastic optimization. In: 3rd International Conference on Learning Representations, ICLR 2015."},{"key":"6073_CR12","unstructured":"Koehn, P. (2004). Statistical significance tests for machine translation evaluation. In: Proceedings of the 2004 Conference on EMNLP, pp. 388\u2013395. Barcelona, Spain."},{"key":"6073_CR13","doi-asserted-by":"crossref","unstructured":"Li, X., Yan, J., Zhang, J., & Zong, C. (2018). Neural name translation improves neural machine translation. In: China Workshop on Machine Translation, pp. 93\u2013100. Springer.","DOI":"10.1007\/978-981-13-3083-4_9"},{"key":"6073_CR14","doi-asserted-by":"crossref","unstructured":"Li, Z., Wang, X., Aw, A.T., Chng, E.S., & Li, H. (2018). Named-entity tagging and domain adaptation for better customized translation. In: Proceedings of the Seventh Named Entities Workshop, pp. 41\u201346.","DOI":"10.18653\/v1\/W18-2407"},{"key":"6073_CR15","doi-asserted-by":"crossref","unstructured":"Lin, T., Goyal, P., Girshick, R.B., He, K., & Doll\u00e1r, P. (2017). Focal loss for dense object detection. In: IEEE International Conference on Computer Vision, pp. 2999\u20133007. IEEE Computer Society.","DOI":"10.1109\/ICCV.2017.324"},{"key":"6073_CR16","unstructured":"Liu, Y., Ott, M., Goyal, N., Du, J., Joshi, M., Chen, D., Levy, O., Lewis, M., Zettlemoyer, L., & Stoyanov, V. (2019). Roberta: A robustly optimized bert pretraining approach. arXiv preprint arXiv:1907.11692"},{"key":"6073_CR17","doi-asserted-by":"crossref","unstructured":"Lu, Y., Zhang, J., & Zong, C. (2018). Exploiting knowledge graph in neural machine translation. In: China Workshop on Machine Translation, pp. 27\u201338. Springer.","DOI":"10.1007\/978-981-13-3083-4_3"},{"key":"6073_CR18","doi-asserted-by":"crossref","unstructured":"Luo, Y., Xiao, F., & Zhao, H. (2020). Hierarchical contextualized representation for named entity recognition. The Thirty-Fourth AAAI Conference on Artificial Intelligence (pp. 8441\u20138448). AAAI Press.","DOI":"10.1609\/aaai.v34i05.6363"},{"key":"6073_CR19","unstructured":"Luong, T., Cho, K., & Manning, C.D. (2016). Neural machine translation. In: Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics: Tutorial Abstracts. Berlin, Germany."},{"key":"6073_CR20","doi-asserted-by":"crossref","unstructured":"Michel, P., & Neubig, G. (2018). MTNT: A testbed for machine translation of noisy text. In: Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, pp. 543\u2013553.","DOI":"10.18653\/v1\/D18-1050"},{"key":"6073_CR21","unstructured":"Modrzejewski, M., Exel, M., Buschbeck, B., Ha, T.L., & Waibel, A. (2020). Incorporating external annotation to improve named entity translation in NMT. In: Proceedings of the 22nd Annual Conference of the European Association for Machine Translation, pp. 45\u201351. Lisboa, Portugal."},{"key":"6073_CR22","unstructured":"Neubig, G. (2011). The kyoto free translation task"},{"key":"6073_CR23","doi-asserted-by":"crossref","unstructured":"Niehues, J., & Cho, E. (2017). Exploiting linguistic resources for neural machine translation using multi-task learning. In: Proceedings of the Second Conference on Machine Translation, pp. 80\u201389.","DOI":"10.18653\/v1\/W17-4708"},{"key":"6073_CR24","doi-asserted-by":"crossref","unstructured":"Ott, M., Edunov, S., Baevski, A., Fan, A., Gross, S., Ng, N., Grangier, D., & Auli, M. (2019). fairseq: A fast, extensible toolkit for sequence modeling. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics (Demonstrations), pp. 48\u201353.","DOI":"10.18653\/v1\/N19-4009"},{"key":"6073_CR25","doi-asserted-by":"crossref","unstructured":"Post, M. (2018). A call for clarity in reporting BLEU scores. In: Proceedings of the Third Conference on Machine Translation: Research Papers, pp. 186\u2013191. Brussels, Belgium.","DOI":"10.18653\/v1\/W18-6319"},{"key":"6073_CR26","unstructured":"Post, M., Ding, S., Martindale, M., & Wu, W. (2019). An exploration of placeholding in neural machine translation. In: Proceedings of Machine Translation Summit XVII Volume 1: Research Track, pp. 182\u2013192."},{"key":"6073_CR27","unstructured":"Pryzant, R., Chung, Y., Jurafsky, D., & Britz, D. (2018). JESC: Japanese-English subtitle corpus. In: Proceedings of the Eleventh International Conference on Language Resources and Evaluation."},{"key":"6073_CR28","doi-asserted-by":"crossref","unstructured":"Sennrich, R., & Haddow, B. (2016). Linguistic input features improve neural machine translation. In: Proceedings of the First Conference on Machine Translation, pp. 83\u201391. Berlin, Germany.","DOI":"10.18653\/v1\/W16-2209"},{"key":"6073_CR29","doi-asserted-by":"crossref","unstructured":"Sennrich, R., Haddow, B., & Birch, A. (2016). Neural machine translation of rare words with subword units. In: Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 1715\u20131725. Berlin, Germany.","DOI":"10.18653\/v1\/P16-1162"},{"key":"6073_CR30","doi-asserted-by":"crossref","unstructured":"Shavarani, H.S., Sarkar, A.: Better neural machine translation by extracting linguistic information from bert. arXiv preprint arXiv:2104.02831 (2021)","DOI":"10.18653\/v1\/2021.eacl-main.241"},{"key":"6073_CR31","doi-asserted-by":"crossref","unstructured":"Song, K., Zhang, Y., Yu, H., Luo, W., Wang, K., & Zhang, M. (2019). Code-switching for enhancing NMT with pre-specified translation. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics, pp. 449\u2013459. Minneapolis, Minnesota.","DOI":"10.18653\/v1\/N19-1044"},{"key":"6073_CR32","unstructured":"Ugawa, A., Tamura, A., Ninomiya, T., Takamura, H., & Okumura, M. (2018). Neural machine translation incorporating named entity. In: Proceedings of the 27th International Conference on Computational Linguistics, pp. 3240\u20133250. Santa Fe, New Mexico, USA."},{"key":"6073_CR33","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, L., Polosukhin, I.: Attention is all you need. In: Advances in Neural Information Processing Systems, pp. 5998\u20136008 (2017)"},{"key":"6073_CR34","doi-asserted-by":"crossref","unstructured":"Wang, C., Cho, K., Gu, J.: Neural machine translation with byte-level subwords. arXiv preprint arXiv:1909.03341 (2019)","DOI":"10.1609\/aaai.v34i05.6451"},{"key":"6073_CR35","doi-asserted-by":"crossref","unstructured":"Wang, Y., Cheng, S., Jiang, L., Yang, J., Chen, W., Li, M., Shi, L., Wang, Y., & Yang, H. (2017). Sogou neural machine translation systems for WMT17. In: Proceedings of the Second Conference on Machine Translation, pp. 410\u2013415. Copenhagen, Denmark.","DOI":"10.18653\/v1\/W17-4742"},{"key":"6073_CR36","volume-title":"Ontonotes release 5.0 ldc2013t19","author":"R Weischedel","year":"2013","unstructured":"Weischedel, R., Palmer, M., Marcus, M., Hovy, E., Pradhan, S., Ramshaw, L., et al. (2013). Ontonotes release 5.0 ldc2013t19. Philadelphia, PA: Linguistic Data Consortium."},{"key":"6073_CR37","unstructured":"Wu, F., Fan, A., Baevski, A., Dauphin, Y.N., & Auli, M. (2019). Pay less attention with lightweight and dynamic convolutions. In: 7th International Conference on Learning Representations, ICLR 2019."},{"key":"6073_CR38","unstructured":"Wu, Y., Schuster, M., Chen, Z., Le, Q.V., Norouzi, M., Macherey, W., Krikun, M., Cao, Y., Gao, Q., Macherey, K., et\u00a0al.: Google\u2019s neural machine translation system: Bridging the gap between human and machine translation. arXiv:1609.08144 (2016)"},{"key":"6073_CR39","doi-asserted-by":"crossref","unstructured":"Yang, J., Wang, M., Zhou, H., Zhao, C., Zhang, W., Yu, Y., & Li, L. (2020). Towards making the most of bert in neural machine translation. In: Proceedings of the AAAI Conference on Artificial Intelligence, pp. 9378\u20139385.","DOI":"10.1609\/aaai.v34i05.6479"},{"key":"6073_CR40","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Xiang, L., Zhu, J., Zhang, J., Zhou, Y., & Zong, C. (2020). Knowledge graph enhanced neural machine translation via multi-task learning on sub-entity granularity. In: Proceedings of the 28th International Conference on Computational Linguistics, pp. 4495\u20134505.","DOI":"10.18653\/v1\/2020.coling-main.397"},{"key":"6073_CR41","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Zhang, J., Zhou, Y., Zong, C.: Knowledge graphs enhanced neural machine translation. In: IJCAI, pp. 4039\u20134045 (2020)","DOI":"10.24963\/ijcai.2020\/559"},{"key":"6073_CR42","unstructured":"Zhu, J., Xia, Y., Wu, L., He, D., Qin, T., Zhou, W., Li, H., Liu, T.: Incorporating BERT into neural machine translation. In: 8th International Conference on Learning Representations, ICLR 2020, Addis Ababa, Ethiopia, April 26\u201330, 2020 (2020)"}],"container-title":["Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-021-06073-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10994-021-06073-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-021-06073-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,13]],"date-time":"2023-01-13T01:02:54Z","timestamp":1673571774000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10994-021-06073-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,1,13]]},"references-count":42,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2022,3]]}},"alternative-id":["6073"],"URL":"https:\/\/doi.org\/10.1007\/s10994-021-06073-9","relation":{},"ISSN":["0885-6125","1573-0565"],"issn-type":[{"value":"0885-6125","type":"print"},{"value":"1573-0565","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,1,13]]},"assertion":[{"value":"13 May 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 August 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 September 2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 January 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declaration"}},{"value":"The authors declare that they have no Conflicts of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}