{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T13:22:02Z","timestamp":1709385722393},"reference-count":33,"publisher":"Institute of Electronics, Information and Communications Engineers (IEICE)","issue":"3","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEICE Trans. Inf. &amp; Syst."],"published-print":{"date-parts":[[2020,3,1]]},"DOI":"10.1587\/transinf.2019edp7065","type":"journal-article","created":{"date-parts":[[2020,2,29]],"date-time":"2020-02-29T22:10:43Z","timestamp":1583014243000},"page":"674-683","source":"Crossref","is-referenced-by-count":1,"title":["Leveraging Neural Caption Translation with Visually Grounded Paraphrase Augmentation"],"prefix":"10.1587","volume":"E103.D","author":[{"given":"Johanes","family":"EFFENDI","sequence":"first","affiliation":[{"name":"Augmented Human Communication Lab., Nara Institute of Science and Technology"},{"name":"RIKEN, Center for Advanced Intelligence Project AIP"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sakriani","family":"SAKTI","sequence":"additional","affiliation":[{"name":"Augmented Human Communication Lab., Nara Institute of Science and Technology"},{"name":"RIKEN, Center for Advanced Intelligence Project AIP"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Katsuhito","family":"SUDOH","sequence":"additional","affiliation":[{"name":"Augmented Human Communication Lab., Nara Institute of Science and Technology"},{"name":"RIKEN, Center for Advanced Intelligence Project AIP"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Satoshi","family":"NAKAMURA","sequence":"additional","affiliation":[{"name":"Augmented Human Communication Lab., Nara Institute of Science and Technology"},{"name":"RIKEN, Center for Advanced Intelligence Project AIP"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"532","reference":[{"key":"1","unstructured":"[1] G. Hirst, \u201cParaphrasing paraphrased,\u201d Invited talk at the ACL International Workshop on Paraphrasing, 2003."},{"key":"2","unstructured":"[2] C. Chu, M. Otani, and Y. Nakashima, \u201ciParaphrasing: Extracting visually grounded paraphrases via an image,\u201d Proc. 27th International Conference on Computational Linguistics, pp.3479-3492, Association for Computational Linguistics, 2018."},{"key":"3","doi-asserted-by":"crossref","unstructured":"[3] O. Vinyals, A. Toshev, S. Bengio, and D. Erhan, \u201cShow and tell: A neural image caption generator,\u201d 2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp.3156-3164, 2015. 10.1109\/cvpr.2015.7298935","DOI":"10.1109\/CVPR.2015.7298935"},{"key":"4","doi-asserted-by":"publisher","unstructured":"[4] Q. Wu, D. Teney, P. Wang, C. Shen, A.R. Dick, and A. van den Hengel, \u201cVisual question answering: A survey of methods and datasets,\u201d Computer Vision and Image Understanding, vol.163, pp.21-40, 2017. 10.1016\/j.cviu.2017.05.001","DOI":"10.1016\/j.cviu.2017.05.001"},{"key":"5","unstructured":"[5] I. Calixto, Q. Liu, and N. Campbell, \u201cDoubly-attentive decoder for multi-modal neural machine translation,\u201d Proc. of 2017 Annual Conference of the Association for Computational Linguistics (ACL), pp.1913-1924, Vancouver, Canada, 2017."},{"key":"6","doi-asserted-by":"crossref","unstructured":"[6] D. Elliott, S. Frank, K. Sima&apos;an, and L. Specia, \u201cMulti30k: Multilingual english-german image descriptions,\u201d Proc. 5th Workshop on Vision and Language, pp.70-74, 2016. 10.18653\/v1\/w16-3210","DOI":"10.18653\/v1\/W16-3210"},{"key":"7","doi-asserted-by":"crossref","unstructured":"[7] T.Y. Lin, M. Maire, S. Belongie, J. Hays, P. Perona, D. Ramanan, P. Doll\u00e1r, and C.L. Zitnick, \u201cMicrosoft COCO: Common objects in context,\u201d European Conference on Computer Vision (ECCV), pp.740-755, Springer, 2014. 10.1007\/978-3-319-10602-1_48","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"8","unstructured":"[8] A. Prakash, S.A. Hasan, K. Lee, V. Datla, A. Qadir, J. Liu, and O. Farri, \u201cNeural paraphrase generation with stacked residual lstm networks,\u201d Proc. COLING 2016, the 26th International Conference on Computational Linguistics: Technical Papers, Osaka, Japan, pp.2923-2934, The COLING 2016 Organizing Committee, Dec. 2016."},{"key":"9","doi-asserted-by":"publisher","unstructured":"[9] R. Bhagat and E. Hovy, \u201cWhat is a paraphrase?,\u201d Computational Linguistics, vol.39, no.3, pp.463-472, 2013. 10.1162\/coli_a_00166","DOI":"10.1162\/COLI_a_00166"},{"key":"10","unstructured":"[10] G.D.S. Huang and D. Graff, Multiple-Translation Chinese Corpus, Linguistic Data Consortium, University of Pennsylvania, 2002."},{"key":"11","unstructured":"[11] W. B. Dolan and B.Chris, \u201cAutomatically constructing a corpus of sentential paraphrases,\u201d Proc. Third International Workshop on Paraphrasing, IWP2005, 2005"},{"key":"12","doi-asserted-by":"publisher","unstructured":"[12] P. Resnik, O. Buzek, Y. Kronrod, C. Hu, A.J. Quinn, and B.B.Bederson, \u201cUsing targeted paraphrasing and monolingual crowdsourcing to improve translation,\u201d ACM Transactions on Intelligent Systems and Technology (TIST), vol.4, no.3, p.38, 2013. 10.1145\/2483669.2483671","DOI":"10.1145\/2483669.2483671"},{"key":"13","unstructured":"[13] B.A. Plummer, L. Wang, C.M. Cervantes, J.C. Caicedo, J.Hockenmaier, and S. Lazebnik, \u201cFlickr30k entities: Collecting region-to-phrase correspondences for richer image-to-sentence models,\u201d CoRR, vol.abs\/1505.04870, 2015."},{"key":"14","doi-asserted-by":"crossref","unstructured":"[14] D. Elliott, S. Frank, L. Barrault, F. Bougares, and L. Specia, \u201cFindings of the Second Shared Task on Multimodal Machine Translation and Multilingual Image Description,\u201d Proc. Second Conference on Machine Translation (WMT), Copenhagen, Denmark, Sept. 2017. 10.18653\/v1\/w17-4718","DOI":"10.18653\/v1\/W17-4718"},{"key":"15","unstructured":"[15] C. Dyer, V. Chahuneau, and N.A. Smith, \u201cA simple, fast, and effective reparameterization of IBM model 2,\u201d Proc. Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (HLT-NAACL &apos;13),Atlanta, GA, USA, 2013."},{"key":"16","doi-asserted-by":"crossref","unstructured":"[16] K. Toutanova, D. Klein, C.D. Manning, and Y. Singer, \u201cFeature-rich part-of-speech tagging with a cyclic dependency network,\u201d Proc. 2003 Conference of the North American Chapter of the Association for Computational Linguistics on Human Language Technology (HLT-NAACL &apos;03), Stroudsburg, PA, USA, pp.173-180, 2003. 10.3115\/1073445.1073478","DOI":"10.3115\/1073445.1073478"},{"key":"17","unstructured":"[17] J. Devlin, M.W. Chang, K. Lee, and K. Toutanova, \u201cBERT: Pre-training of deep bidirectional transformers for language understanding,\u201d arXiv preprint arXiv:1810.04805, 2018."},{"key":"18","unstructured":"[18] D. Bahdanau, K. Cho, and Y. Bengio, \u201cNeural machine translation by jointly learning to align and translate,\u201d CoRR, vol.abs\/1409.0473, 2014."},{"key":"19","doi-asserted-by":"publisher","unstructured":"[19] E. Nichols, F. Bond, D.S. Appling, and Y. Matsumoto, \u201cParaphrasing training data for statistical machine translation,\u201d Journal of Natural Language Processing, vol.17, no.3, pp.3_101-3_122, 2010. 10.5715\/jnlp.17.3_101","DOI":"10.5715\/jnlp.17.3_101"},{"key":"20","unstructured":"[20] B. Zoph and K. Knight, \u201cMulti-source neural translation,\u201d CoRR, vol.abs\/1601.00710, 2016."},{"key":"21","unstructured":"[21] E. Garmash and C. Monz, \u201cEnsemble learning for multi-source neural machine translation,\u201d Proc. COLING, pp.1409-1418, 2016."},{"key":"22","unstructured":"[22] A.L.J. Clark, C. Dyer, and N. Smith, \u201cBetter hypothesis testing for statistical machine translation: Controlling for optimizer instability,\u201d Proc. 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies, pp.176-181, Oregon, USA, 2011."},{"key":"23","doi-asserted-by":"crossref","unstructured":"[23] K. Papineni, S. Roukos, T. Ward, and W.J. Zhu, \u201cBLEU: A method for automatic evaluation of machine translation,\u201d Proc. 40th Annual Meeting on Association for Computational Linguistics, Association for Computational Linguistics, 2002.","DOI":"10.3115\/1073083.1073135"},{"key":"24","doi-asserted-by":"crossref","unstructured":"[24] A. Lavie and A. Agarwal, \u201cMETEOR: An automatic metric for MT evaluation with high levels of correlation with human judgments,\u201d Proc. Second Workshop on Statistical Machine Translation, pp.228-231, 2007.","DOI":"10.3115\/1626355.1626389"},{"key":"25","unstructured":"[25] D.P. Kingma and J. Ba, \u201cAdam: A method for stochastic optimization,\u201d CoRR, vol.abs\/1412.6980, 2014."},{"key":"26","unstructured":"[26] A. Graves, \u201cGenerating sequences with recurrent neural networks,\u201d CoRR, vol.abs\/1308.0850, 2013."},{"key":"27","unstructured":"[27] S. Tokui, K. Oono, S. Hido, and J. Clayton, \u201cChainer: A next-generation open source framework for deep learning,\u201d Proc. Workshop on Machine Learning Systems (LearningSys) in the 29th Annual Conference on Neural Information Processing Systems (NIPS), 2015."},{"key":"28","doi-asserted-by":"crossref","unstructured":"[28] J. Zhang, M. Utiyama, E. Sumita, G. Neubig, and S. Nakamura,\u201cNICT-NAIST system for WMT17 multimodal translation task,\u201d Proc. Conference of Machine Translation (WMT), 2017.","DOI":"10.18653\/v1\/W17-4753"},{"key":"29","doi-asserted-by":"crossref","unstructured":"[29] P.S. Madhyastha, J. Wang, and L. Specia, \u201cSheffield multimt: Using object posterior predictions for multimodal machine translation,\u201d Proc. Second Conference on Machine Translation (WMT), Volume 2: Shared Task Papers, Copenhagen, Denmark, pp.470-476, Association for Computational Linguistics, Sept. 2017. 10.18653\/v1\/w17-4752","DOI":"10.18653\/v1\/W17-4752"},{"key":"30","doi-asserted-by":"crossref","unstructured":"[30] I. Calixto, K.D. Chowdhury, and Q. Liu, \u201cDCU system report on the WMT 2017 multi-modal machine translation task,\u201d Proc. Conference of Machine Translation (WMT), 2017. 10.18653\/v1\/w17-4747","DOI":"10.18653\/v1\/W17-4747"},{"key":"31","doi-asserted-by":"crossref","unstructured":"[31] M. Ma, D. Li, K. Zhao, and L. Huang, \u201cOSU multimodal machine translation system report,\u201d Proc. Second Conference on Machine Translation, Volume 2: Shared Task Papers, Copenhagen, Denmark, pp.465-469, Association for Computational Linguistics, Sept. 2017. 10.18653\/v1\/w17-4751","DOI":"10.18653\/v1\/W17-4751"},{"key":"32","unstructured":"[32] J. Helcl and J. Libovick\u00fd, \u201cCUNI system for the WMT17 multimodal translation task,\u201d CoRR, vol.abs\/1707.04550, 2017."},{"key":"33","unstructured":"[33] A. Vaswani, N. Shazeer, N. Parmar, J. Uszkoreit, L. Jones, A.N. Gomez, L. Kaiser, and I. Polosukhin, \u201cAttention is all you need,\u201d Advances in Neural Information Processing Systems 30, ed. I. Guyon, U.V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S.Vishwanathan, and R. Garnett, pp.5998-6008, Curran Associates, 2017."}],"container-title":["IEICE Transactions on Information and Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.jstage.jst.go.jp\/article\/transinf\/E103.D\/3\/E103.D_2019EDP7065\/_pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,3,7]],"date-time":"2020-03-07T03:26:34Z","timestamp":1583551594000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.jstage.jst.go.jp\/article\/transinf\/E103.D\/3\/E103.D_2019EDP7065\/_article"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,3,1]]},"references-count":33,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2020]]}},"URL":"https:\/\/doi.org\/10.1587\/transinf.2019edp7065","relation":{},"ISSN":["0916-8532","1745-1361"],"issn-type":[{"value":"0916-8532","type":"print"},{"value":"1745-1361","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,3,1]]}}}