{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,23]],"date-time":"2024-09-23T04:31:27Z","timestamp":1727065887019},"reference-count":40,"publisher":"Association for Natural Language Processing","issue":"2","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Journal of Natural Language Processing"],"published-print":{"date-parts":[[2023]]},"DOI":"10.5715\/jnlp.30.401","type":"journal-article","created":{"date-parts":[[2023,6,14]],"date-time":"2023-06-14T22:14:08Z","timestamp":1686780848000},"page":"401-431","source":"Crossref","is-referenced-by-count":2,"title":["Generic Mechanism for Reducing Repetitions in Encoder-decoder Models"],"prefix":"10.5715","volume":"30","author":[{"given":"Ying","family":"Zhang","sequence":"first","affiliation":[{"name":"Tokyo Institute of Technology"}]},{"given":"Hidetaka","family":"Kamigaito","sequence":"additional","affiliation":[{"name":"NARA Institute of Science and Technology (NAIST)"}]},{"given":"Tatsuya","family":"Aoki","sequence":"additional","affiliation":[{"name":"Tokyo Institute of Technology"}]},{"given":"Hiroya","family":"Takamura","sequence":"additional","affiliation":[{"name":"National Institute of Advanced Industrial Science and Technology (AIST)"}]},{"given":"Manabu","family":"Okumura","sequence":"additional","affiliation":[{"name":"Tokyo Institute of Technology"}]}],"member":"3685","reference":[{"key":"1","unstructured":"Bahdanau, D., Cho, K. H., and Bengio, Y. (2015). \u201cNeural Machine Translation by Jointly Learning to Align and Translate.\u201d In <i>3rd International Conference on Learning Representations, ICLR 2015<\/i>."},{"key":"2","doi-asserted-by":"crossref","unstructured":"Bengio, Y. et al. (2009). \u201cLearning Deep Architectures for AI.\u201d <i>Foundations and Trends\u00ae in Machine Learning<\/i>, 2 (1), pp. 1\u2013127.","DOI":"10.1561\/2200000006"},{"key":"3","doi-asserted-by":"crossref","unstructured":"Bojar, O., Buck, C., Federmann, C., Haddow, B., Koehn, P., Leveling, J., Monz, C., Pecina, P., Post, M., Saint-Amand, H., Soricut, R., Specia, L., and Tamchyna, A. (2014). \u201cFindings of the 2014 Workshop on Statistical Machine Translation.\u201d In <i>Proceedings of the 9th Workshop on Statistical Machine Translation<\/i>, pp. 12\u201358, Baltimore, Maryland, USA. Association for Computational Linguistics.","DOI":"10.3115\/v1\/W14-3302"},{"key":"4","doi-asserted-by":"crossref","unstructured":"Brier, G. W. (1950). \u201cVerification of Forecasts Expressed in Terms of Probability.\u201d <i>Monthly Weather Review<\/i>, 78 (1), pp. 1\u20133.","DOI":"10.1175\/1520-0493(1950)078<0001:VOFEIT>2.0.CO;2"},{"key":"5","unstructured":"Cettolo, M., Niehues, J., St\u00fcker, S., Bentivogli, L., and Federico, M. (2014). \u201cReport on the 11th IWSLT Evaluation Campaign, IWSLT 2014.\u201d In <i>Proceedings of the International Workshop on Spoken Language Translation, Hanoi, Vietnam<\/i>, p. 57."},{"key":"6","doi-asserted-by":"crossref","unstructured":"Cho, K., van Merri\u00ebnboer, B., Bahdanau, D., and Bengio, Y. (2014). \u201cOn the Properties of Neural Machine Translation: Encoder\u2013Decoder Approaches.\u201d In <i>Proceedings of SSST-8, Eighth Workshop on Syntax, Semantics and Structure in Statistical Translation<\/i>, pp. 103\u2013111, Doha, Qatar. Association for Computational Linguistics.","DOI":"10.3115\/v1\/W14-4012"},{"key":"7","doi-asserted-by":"crossref","unstructured":"Denkowski, M. and Lavie, A. (2014). \u201cMeteor Universal: Language Specific Translation Evaluation for Any Target Language.\u201d In <i>Proceedings of the 9th Workshop on Statistical Machine Translation<\/i>, pp. 376\u2013380, Baltimore, Maryland, USA. Association for Computational Linguistics.","DOI":"10.3115\/v1\/W14-3348"},{"key":"8","doi-asserted-by":"crossref","unstructured":"Fan, A., Lewis, M., and Dauphin, Y. (2018). \u201cHierarchical Neural Story Generation.\u201d In <i>Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)<\/i>, pp. 889\u2013898, Melbourne, Australia. Association for Computational Linguistics.","DOI":"10.18653\/v1\/P18-1082"},{"key":"9","unstructured":"Fonollosa, J. A., Casas, N., and Costa-juss\u00e0, M. R. (2019). \u201cJoint Source-Target Self Attention with Locality Constraints.\u201d <i>arXiv preprint arXiv:1905.06596<\/i>."},{"key":"10","doi-asserted-by":"crossref","unstructured":"Fu, Z., Lam, W., So, A. M.-C., and Shi, B. (2021). \u201cA Theoretical Analysis of the Repetition Problem in Text Generation.\u201d <i>Proceedings of the AAAI Conference on Artificial Intelligence<\/i>, 35 (14), pp. 12848\u201312856.","DOI":"10.1609\/aaai.v35i14.17520"},{"key":"11","unstructured":"Gehring, J., Auli, M., Grangier, D., Yarats, D., and Dauphin, Y. N. (2017). \u201cConvolutional Sequence to Sequence Learning.\u201d In <i>Proceedings of the 34th International Conference on Machine Learning - Volume 70<\/i>, ICML\u201917, pp. 1243\u20131252. JMLR.org."},{"key":"12","doi-asserted-by":"crossref","unstructured":"Hochreiter, S. and Schmidhuber, J. (1997). \u201cLong Short-Term Memory.\u201d <i>Neural Computation<\/i>, 9 (8), pp. 1735\u20131780.","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"13","unstructured":"Holtzman, A., Buys, J., Du, L., Forbes, M., and Choi, Y. (2020). \u201cThe Curious Case of Neural Text Degeneration.\u201d In <i>International Conference on Learning Representations<\/i>."},{"key":"14","unstructured":"Kiyono, S., Takase, S., Suzuki, J., Okazaki, N., Inui, K., and Nagata, M. (2018). \u201cReducing Odd Generation from Neural Headline Generation.\u201d In <i>Proceedings of the 32nd Pacific Asia Conference on Language, Information and Computation<\/i>, Hong Kong. Association for Computational Linguistics."},{"key":"15","doi-asserted-by":"crossref","unstructured":"Lewis, M., Liu, Y., Goyal, N., Ghazvininejad, M., Mohamed, A., Levy, O., Stoyanov, V., and Zettlemoyer, L. (2020). \u201cBART: Denoising Sequence-to-Sequence Pre-training for Natural Language Generation, Translation, and Comprehension.\u201d In <i>Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics<\/i>, pp. 7871\u20137880, Online. Association for Computational Linguistics.","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"16","doi-asserted-by":"crossref","unstructured":"Li, P., Lam, W., Bing, L., and Wang, Z. (2017). \u201cDeep Recurrent Generative Decoder for Abstractive Text Summarization.\u201d In <i>Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing<\/i>, pp. 2091\u20132100, Copenhagen, Denmark. Association for Computational Linguistics.","DOI":"10.18653\/v1\/D17-1222"},{"key":"17","doi-asserted-by":"crossref","unstructured":"Liu, T., Luo, F., Xia, Q., Ma, S., Chang, B., and Sui, Z. (2019). \u201cHierarchical Encoder with Auxiliary Supervision for Neural Table-to-Text Generation: Learning Better Representation for Tables.\u201d In <i>Proceedings of the Thirty-Third AAAI Conference on Artificial Intelligence and Thirty-First Innovative Applications of Artificial Intelligence Conference and 9th AAAI Symposium on Educational Advances in Artificial Intelligence<\/i>, AAAI\u201919\/IAAI\u201919\/EAAI\u201919. AAAI Press.","DOI":"10.1609\/aaai.v33i01.33016786"},{"key":"18","doi-asserted-by":"crossref","unstructured":"Luo, L., Xu, J., Lin, J., Zeng, Q., and Sun, X. (2018). \u201cAn Auto-Encoder Matching Model for Learning Utterance-Level Semantic Dependency in Dialogue Generation.\u201d In <i>Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing<\/i>, pp. 702\u2013707, Brussels, Belgium. Association for Computational Linguistics.","DOI":"10.18653\/v1\/D18-1075"},{"key":"19","unstructured":"Luong, M.-T., Le, Q. V., Sutskever, I., Vinyals, O., and Kaiser, L. (2015a). \u201cMulti-task Sequence to Sequence Learning.\u201d <i>arXiv preprint arXiv:1511.06114<\/i>."},{"key":"20","doi-asserted-by":"crossref","unstructured":"Luong, T., Pham, H., and Manning, C. D. (2015b). \u201cEffective Approaches to Attention-based Neural Machine Translation.\u201d In <i>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing<\/i>, pp. 1412\u20131421, Lisbon, Portugal. Association for Computational Linguistics.","DOI":"10.18653\/v1\/D15-1166"},{"key":"21","doi-asserted-by":"crossref","unstructured":"Ma, S., Sun, X., Lin, J., and Wang, H. (2018). \u201cAutoencoder as Assistant Supervisor: Improving Text Representation for Chinese Social Media Text Summarization.\u201d In <i>Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)<\/i>, pp. 725\u2013731, Melbourne, Australia. Association for Computational Linguistics.","DOI":"10.18653\/v1\/P18-2115"},{"key":"22","doi-asserted-by":"crossref","unstructured":"Mi, H., Sankaran, B., Wang, Z., and Ittycheriah, A. (2016). \u201cCoverage Embedding Models for Neural Machine Translation.\u201d In <i>Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing<\/i>, pp. 955\u2013960, Austin, Texas. Association for Computational Linguistics.","DOI":"10.18653\/v1\/D16-1096"},{"key":"23","unstructured":"Mikolov, T., Sutskever, I., Chen, K., Corrado, G. S., and Dean, J. (2013). \u201cDistributed Representations of Words and Phrases and Their Compositionality.\u201d In <i>Advances in Neural Information Processing Systems<\/i>, pp. 3111\u20133119."},{"key":"24","doi-asserted-by":"crossref","unstructured":"Miller, A., Feng, W., Batra, D., Bordes, A., Fisch, A., Lu, J., Parikh, D., and Weston, J. (2017). \u201cParlAI: A Dialog Research Software Platform.\u201d In <i>Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing: System Demonstrations<\/i>, pp. 79\u201384, Copenhagen, Denmark. Association for Computational Linguistics.","DOI":"10.18653\/v1\/D17-2014"},{"key":"25","doi-asserted-by":"crossref","unstructured":"Ott, M., Edunov, S., Baevski, A., Fan, A., Gross, S., Ng, N., Grangier, D., and Auli, M. (2019). \u201cfairseq: A Fast, Extensible Toolkit for Sequence Modeling.\u201d In <i>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics (Demonstrations)<\/i>, pp. 48\u201353, Minneapolis, Minnesota. Association for Computational Linguistics.","DOI":"10.18653\/v1\/N19-4009"},{"key":"26","doi-asserted-by":"crossref","unstructured":"Papineni, K., Roukos, S., Ward, T., and Zhu, W.-J. (2002). \u201cBleu: a Method for Automatic Evaluation of Machine Translation.\u201d In <i>Proceedings of the 40th Annual Meeting of the Association for Computational Linguistics<\/i>, pp. 311\u2013318, Philadelphia, Pennsylvania, USA. Association for Computational Linguistics.","DOI":"10.3115\/1073083.1073135"},{"key":"27","doi-asserted-by":"crossref","unstructured":"Pasunuru, R. and Bansal, M. (2018). \u201cGame-Based Video-Context Dialogue.\u201d In <i>Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing<\/i>, pp. 125\u2013136, Brussels, Belgium. Association for Computational Linguistics.","DOI":"10.18653\/v1\/D18-1012"},{"key":"28","unstructured":"Radford, A., Narasimhan, K., Salimans, T., and Sutskever, I. (2018). \u201cImproving Language Understanding by Generative Pre-training.\u201d."},{"key":"29","doi-asserted-by":"crossref","unstructured":"See, A., Liu, P. J., and Manning, C. D. (2017). \u201cGet To The Point: Summarization with Pointer-Generator Networks.\u201d In <i>Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)<\/i>, pp. 1073\u20131083, Vancouver, Canada. Association for Computational Linguistics.","DOI":"10.18653\/v1\/P17-1099"},{"key":"30","doi-asserted-by":"crossref","unstructured":"Sennrich, R., Haddow, B., and Birch, A. (2016). \u201cNeural Machine Translation of Rare Words with Subword Units.\u201d In <i>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)<\/i>, pp. 1715\u20131725, Berlin, Germany. Association for Computational Linguistics.","DOI":"10.18653\/v1\/P16-1162"},{"key":"31","unstructured":"Sutskever, I., Vinyals, O., and Le, Q. V. (2014). \u201cSequence to Sequence Learning with Neural Networks.\u201d In Ghahramani, Z., Welling, M., Cortes, C., Lawrence, N., and Weinberger, K. (Eds.), <i>Advances in Neural Information Processing Systems<\/i>, Vol. 27. Curran Associates, Inc."},{"key":"32","doi-asserted-by":"crossref","unstructured":"Suzuki, J. and Nagata, M. (2017). \u201cCutting-off Redundant Repeating Generations for Neural Abstractive Summarization.\u201d In <i>Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics: Volume 2, Short Papers<\/i>, pp. 291\u2013297, Valencia, Spain. Association for Computational Linguistics.","DOI":"10.18653\/v1\/E17-2047"},{"key":"33","doi-asserted-by":"crossref","unstructured":"Tu, Z., Lu, Z., Liu, Y., Liu, X., and Li, H. (2016). \u201cModeling Coverage for Neural Machine Translation.\u201d In <i>Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)<\/i>, pp. 76\u201385, Berlin, Germany. Association for Computational Linguistics.","DOI":"10.18653\/v1\/P16-1008"},{"key":"34","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A. N., Kaiser, L., and Polosukhin, I. (2017). \u201cAttention is All you Need.\u201d In <i>Advances in Neural Information Processing Systems<\/i>, Vol. 30, pp. 5998\u20136008. Curran Associates, Inc."},{"key":"35","doi-asserted-by":"crossref","unstructured":"Wolf, T., Debut, L., Sanh, V., Chaumond, J., Delangue, C., Moi, A., Cistac, P., Rault, T., Louf, R., Funtowicz, M., Davison, J., Shleifer, S., von Platen, P., Ma, C., Jernite, Y., Plu, J., Xu, C., Scao, T. L., Gugger, S., Drame, M., Lhoest, Q., and Rush, A. M. (2020). \u201cTransformers: State-of-the-Art Natural Language Processing.\u201d In <i>Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations<\/i>, pp. 38\u201345, Online. Association for Computational Linguistics.","DOI":"10.18653\/v1\/2020.emnlp-demos.6"},{"key":"36","unstructured":"Wolf, T., Sanh, V., Chaumond, J., and Delangue, C. (2019). \u201cTransferTransfo: A Transfer Learning Approach for Neural Network Based Conversational Agents.\u201d <i>CoRR<\/i>, abs\/1901.08149."},{"key":"37","unstructured":"Wu, Y., Schuster, M., Chen, Z., Le, Q. V., Norouzi, M., Macherey, W., Krikun, M., Cao, Y., Gao, Q., Macherey, K., et al. (2016). \u201cGoogle\u2019s Neural Machine Translation System: Bridging the Gap between Human and Machine Translation.\u201d <i>arXiv preprint arXiv:1609.08144<\/i>."},{"key":"38","unstructured":"Xu, J., Liu, X., Yan, J., Cai, D., Li, H., and Li, J. (2022). \u201cLearning to Break the Loop: Analyzing and Mitigating Repetitions for Neural Text Generation.\u201d <i>arXiv preprint arXiv:2206.02369<\/i>."},{"key":"39","doi-asserted-by":"crossref","unstructured":"Zhang, S., Dinan, E., Urbanek, J., Szlam, A., Kiela, D., and Weston, J. (2018). \u201cPersonalizing Dialogue Agents: I Have a Dog, Do You Have Pets Too?\u201d In <i>Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)<\/i>, pp. 2204\u20132213, Melbourne, Australia. Association for Computational Linguistics.","DOI":"10.18653\/v1\/P18-1205"},{"key":"40","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Kamigaito, H., Aoki, T., Takamura, H., and Okumura, M. (2021). \u201cGeneric Mechanism for Reducing Repetitions in Encoder-Decoder Models.\u201d In <i>Proceedings of the International Conference on Recent Advances in Natural Language Processing (RANLP 2021)<\/i>, pp. 1606\u20131615, Held Online. INCOMA Ltd.","DOI":"10.26615\/978-954-452-072-4_180"}],"container-title":["Journal of Natural Language Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.jstage.jst.go.jp\/article\/jnlp\/30\/2\/30_401\/_pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,17]],"date-time":"2023-06-17T04:27:58Z","timestamp":1686976078000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.jstage.jst.go.jp\/article\/jnlp\/30\/2\/30_401\/_article"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"references-count":40,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2023]]}},"URL":"https:\/\/doi.org\/10.5715\/jnlp.30.401","relation":{},"ISSN":["1340-7619","2185-8314"],"issn-type":[{"value":"1340-7619","type":"print"},{"value":"2185-8314","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]}}}