{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,3]],"date-time":"2026-07-03T08:19:49Z","timestamp":1783066789232,"version":"3.54.6"},"publisher-location":"New York, NY, USA","reference-count":39,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,11,3]],"date-time":"2019-11-03T00:00:00Z","timestamp":1572739200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,11,3]]},"DOI":"10.1145\/3357384.3358046","type":"proceedings-article","created":{"date-parts":[[2019,11,4]],"date-time":"2019-11-04T14:11:35Z","timestamp":1572876695000},"page":"1643-1652","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":6,"title":["Generative Question Refinement with Deep Reinforcement Learning in Retrieval-based QA System"],"prefix":"10.1145","author":[{"given":"Ye","family":"Liu","sequence":"first","affiliation":[{"name":"University of Illinois at Chicago, Chicago, IL, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Chenwei","family":"Zhang","sequence":"additional","affiliation":[{"name":"Amazon, Seattle, WA, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xiaohui","family":"Yan","sequence":"additional","affiliation":[{"name":"Poisson Lab, Huawei Technologies, Shenzhen, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yi","family":"Chang","sequence":"additional","affiliation":[{"name":"Jilin University, Jilin, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Philip S.","family":"Yu","sequence":"additional","affiliation":[{"name":"University of Illinois at Chicago, Chicago, IL, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2019,11,3]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"An actor-critic algorithm for sequence prediction. arXiv preprint arXiv:1607.07086","author":"Bahdanau Dzmitry","year":"2016"},{"key":"e_1_3_2_1_2_1","volume-title":"Neural machine translation by jointly learning to align and translate. arXiv preprint arXiv:1409.0473","author":"Bahdanau Dzmitry","year":"2014"},{"key":"e_1_3_2_1_3_1","volume-title":"Proceedings of the ACL workshop on intrinsic and extrinsic evaluation measures for machine translation and\/or summarization . 65--72","author":"Banerjee Satanjeev","year":"2005"},{"key":"e_1_3_2_1_4_1","volume-title":"Reinforcement learning. Neural systems for control","author":"Barto Andrew G","year":"1998"},{"key":"e_1_3_2_1_5_1","volume-title":"Massive exploration of neural machine translation architectures. arXiv preprint arXiv:1703.03906","author":"Britz Denny","year":"2017"},{"key":"e_1_3_2_1_6_1","volume-title":"Ask the Right Questions: Active Question Reformulation with Reinforcement Learning. ICLR","author":"Buck Christian","year":"2018"},{"key":"e_1_3_2_1_7_1","volume-title":"Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805","author":"Devlin Jacob","year":"2018"},{"key":"e_1_3_2_1_8_1","volume-title":"Learning to paraphrase for question answering. arXiv preprint arXiv:1708.06022","author":"Dong Li","year":"2017"},{"key":"e_1_3_2_1_9_1","volume-title":"Identifying Well-formed Natural Language Questions. arXiv preprint arXiv:1808.09419","author":"Faruqui Manaal","year":"2018"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2015.7404872"},{"key":"e_1_3_2_1_11_1","volume-title":"Generating sequences with recurrent neural networks. arXiv preprint arXiv:1308.0850","author":"Graves Alex","year":"2013"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.5555\/1005332.1044710"},{"key":"e_1_3_2_1_13_1","volume-title":"Long short-term memory. Neural computation","author":"Hochreiter Sepp","year":"1997"},{"key":"e_1_3_2_1_14_1","volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","author":"Kingma Diederik P","year":"2014"},{"key":"e_1_3_2_1_15_1","volume-title":"Paraphrase generation with deep reinforcement learning. arXiv preprint arXiv:1711.00279","author":"Li Zichao","year":"2017"},{"key":"e_1_3_2_1_16_1","volume-title":"Neural symbolic machines: Learning semantic parsers on freebase with weak supervision. arXiv preprint arXiv:1611.00020","author":"Liang Chen","year":"2016"},{"key":"e_1_3_2_1_17_1","volume-title":"Rouge: A package for automatic evaluation of summaries. Text Summarization Branches Out","author":"Lin Chin-Yew","year":"2004"},{"key":"e_1_3_2_1_18_1","volume-title":"Effective approaches to attention-based neural machine translation. arXiv preprint arXiv:1508.04025","author":"Luong Minh-Thang","year":"2015"},{"key":"e_1_3_2_1_19_1","unstructured":"Tomas Mikolov Ilya Sutskever Kai Chen Greg S Corrado and Jeff Dean. 2013. Distributed representations of words and phrases and their compositionality. In Advances in neural information processing systems. 3111--3119.  Tomas Mikolov Ilya Sutskever Kai Chen Greg S Corrado and Jeff Dean. 2013. Distributed representations of words and phrases and their compositionality. In Advances in neural information processing systems. 3111--3119."},{"key":"e_1_3_2_1_20_1","volume-title":"Playing atari with deep reinforcement learning. arXiv preprint arXiv:1312.5602","author":"Mnih Volodymyr","year":"2013"},{"key":"e_1_3_2_1_21_1","volume-title":"et almbox","author":"Nallapati Ramesh","year":"2016"},{"key":"e_1_3_2_1_22_1","volume-title":"Learning to Coordinate Multiple Reinforcement Learning Agents for Diverse Query Reformulation. arXiv preprint arXiv:1809.10658","author":"Nogueira Rodrigo","year":"2018"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"crossref","unstructured":"Rodrigo Nogueira and Kyunghyun Cho. 2017. Task-Oriented Query Reformulation with Reinforcement Learning. In EMNLP . 574--583.  Rodrigo Nogueira and Kyunghyun Cho. 2017. Task-Oriented Query Reformulation with Reinforcement Learning. In EMNLP . 574--583.","DOI":"10.18653\/v1\/D17-1061"},{"key":"e_1_3_2_1_24_1","volume-title":"MEMEN: multi-layer embedding with memory networks for machine comprehension. arXiv preprint arXiv:1707.09098","author":"Pan Boyuan","year":"2017"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"crossref","unstructured":"Kishore Papineni Salim Roukos Todd Ward and Wei-Jing Zhu. 2002. BLEU: a method for automatic evaluation of machine translation. In ACL. ACL 311--318.  Kishore Papineni Salim Roukos Todd Ward and Wei-Jing Zhu. 2002. BLEU: a method for automatic evaluation of machine translation. In ACL. ACL 311--318.","DOI":"10.3115\/1073083.1073135"},{"key":"e_1_3_2_1_26_1","volume-title":"Glove: Global vectors for word representation. In EMNLP. 1532--1543.","author":"Pennington Jeffrey","year":"2014"},{"key":"e_1_3_2_1_27_1","volume-title":"Sequence level training with recurrent neural networks. ICLR","author":"Ranzato Marc'Aurelio","year":"2016"},{"key":"e_1_3_2_1_28_1","volume-title":"International Conference on Machine Learning . 1889--1897","author":"Schulman John","year":"2015"},{"key":"e_1_3_2_1_29_1","volume-title":"Proximal policy optimization algorithms. arXiv preprint arXiv:1707.06347","author":"Schulman John","year":"2017"},{"key":"e_1_3_2_1_30_1","volume-title":"Query-reduction networks for question answering. arXiv preprint arXiv:1606.04582","author":"Seo Minjoon","year":"2016"},{"key":"e_1_3_2_1_31_1","unstructured":"Ilya Sutskever Oriol Vinyals and Quoc V Le. 2014. Sequence to sequence learning with neural networks. In NIPS. 3104--3112.  Ilya Sutskever Oriol Vinyals and Quoc V Le. 2014. Sequence to sequence learning with neural networks. In NIPS. 3104--3112."},{"key":"e_1_3_2_1_32_1","unstructured":"Richard S Sutton David A McAllester Satinder P Singh and Yishay Mansour. 2000. Policy gradient methods for reinforcement learning with function approximation. In NIPS . 1057--1063.  Richard S Sutton David A McAllester Satinder P Singh and Yishay Mansour. 2000. Policy gradient methods for reinforcement learning with function approximation. In NIPS . 1057--1063."},{"key":"e_1_3_2_1_33_1","volume-title":"LSTM-based deep learning models for non-factoid answer selection. arXiv preprint arXiv:1511.04108","author":"Tan Ming","year":"2015"},{"key":"e_1_3_2_1_34_1","volume-title":"Proximal Policy Optimization and its Dynamic Version for Sequence Generation. arXiv preprint arXiv:1808.07982","author":"Tuan Yi-Lin","year":"2018"},{"key":"e_1_3_2_1_35_1","volume-title":"No metrics are perfect: Adversarial reward learning for visual storytelling. arXiv preprint arXiv:1804.09160","author":"Wang Xin","year":"2018"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1080\/09540099108946587"},{"key":"e_1_3_2_1_37_1","volume-title":"Neural language correction with character-based attention. arXiv preprint arXiv:1603.09727","author":"Xie Ziang","year":"2016"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N16-1042"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"crossref","unstructured":"Xingxing Zhang and Mirella Lapata. 2017. Sentence Simplification with Deep Reinforcement Learning. In EMNLP. 584--594.  Xingxing Zhang and Mirella Lapata. 2017. Sentence Simplification with Deep Reinforcement Learning. In EMNLP. 584--594.","DOI":"10.18653\/v1\/D17-1062"}],"event":{"name":"CIKM '19: The 28th ACM International Conference on Information and Knowledge Management","location":"Beijing China","acronym":"CIKM '19","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGIR ACM Special Interest Group on Information Retrieval"]},"container-title":["Proceedings of the 28th ACM International Conference on Information and Knowledge Management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3357384.3358046","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3357384.3358046","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T23:44:18Z","timestamp":1750203858000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3357384.3358046"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,11,3]]},"references-count":39,"alternative-id":["10.1145\/3357384.3358046","10.1145\/3357384"],"URL":"https:\/\/doi.org\/10.1145\/3357384.3358046","relation":{},"subject":[],"published":{"date-parts":[[2019,11,3]]},"assertion":[{"value":"2019-11-03","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}