{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T05:19:45Z","timestamp":1755926385126,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":39,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,11,3]],"date-time":"2019-11-03T00:00:00Z","timestamp":1572739200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,11,3]]},"DOI":"10.1145\/3357384.3358046","type":"proceedings-article","created":{"date-parts":[[2019,11,4]],"date-time":"2019-11-04T14:11:35Z","timestamp":1572876695000},"page":"1643-1652","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":6,"title":["Generative Question Refinement with Deep Reinforcement Learning in Retrieval-based QA System"],"prefix":"10.1145","author":[{"given":"Ye","family":"Liu","sequence":"first","affiliation":[{"name":"University of Illinois at Chicago, Chicago, IL, USA"}]},{"given":"Chenwei","family":"Zhang","sequence":"additional","affiliation":[{"name":"Amazon, Seattle, WA, USA"}]},{"given":"Xiaohui","family":"Yan","sequence":"additional","affiliation":[{"name":"Poisson Lab, Huawei Technologies, Shenzhen, China"}]},{"given":"Yi","family":"Chang","sequence":"additional","affiliation":[{"name":"Jilin University, Jilin, China"}]},{"given":"Philip S.","family":"Yu","sequence":"additional","affiliation":[{"name":"University of Illinois at Chicago, Chicago, IL, USA"}]}],"member":"320","published-online":{"date-parts":[[2019,11,3]]},"reference":[{"volume-title":"An actor-critic algorithm for sequence prediction. arXiv preprint arXiv:1607.07086","year":"2016","author":"Bahdanau Dzmitry","key":"e_1_3_2_1_1_1"},{"volume-title":"Neural machine translation by jointly learning to align and translate. arXiv preprint arXiv:1409.0473","year":"2014","author":"Bahdanau Dzmitry","key":"e_1_3_2_1_2_1"},{"volume-title":"Proceedings of the ACL workshop on intrinsic and extrinsic evaluation measures for machine translation and\/or summarization . 65--72","year":"2005","author":"Banerjee Satanjeev","key":"e_1_3_2_1_3_1"},{"volume-title":"Reinforcement learning. Neural systems for control","year":"1998","author":"Barto Andrew G","key":"e_1_3_2_1_4_1"},{"volume-title":"Massive exploration of neural machine translation architectures. arXiv preprint arXiv:1703.03906","year":"2017","author":"Britz Denny","key":"e_1_3_2_1_5_1"},{"volume-title":"Ask the Right Questions: Active Question Reformulation with Reinforcement Learning. ICLR","year":"2018","author":"Buck Christian","key":"e_1_3_2_1_6_1"},{"volume-title":"Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805","year":"2018","author":"Devlin Jacob","key":"e_1_3_2_1_7_1"},{"volume-title":"Learning to paraphrase for question answering. arXiv preprint arXiv:1708.06022","year":"2017","author":"Dong Li","key":"e_1_3_2_1_8_1"},{"volume-title":"Identifying Well-formed Natural Language Questions. arXiv preprint arXiv:1808.09419","year":"2018","author":"Faruqui Manaal","key":"e_1_3_2_1_9_1"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2015.7404872"},{"volume-title":"Generating sequences with recurrent neural networks. arXiv preprint arXiv:1308.0850","year":"2013","author":"Graves Alex","key":"e_1_3_2_1_11_1"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.5555\/1005332.1044710"},{"volume-title":"Long short-term memory. Neural computation","year":"1997","author":"Hochreiter Sepp","key":"e_1_3_2_1_13_1"},{"volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","year":"2014","author":"Kingma Diederik P","key":"e_1_3_2_1_14_1"},{"volume-title":"Paraphrase generation with deep reinforcement learning. arXiv preprint arXiv:1711.00279","year":"2017","author":"Li Zichao","key":"e_1_3_2_1_15_1"},{"volume-title":"Neural symbolic machines: Learning semantic parsers on freebase with weak supervision. arXiv preprint arXiv:1611.00020","year":"2016","author":"Liang Chen","key":"e_1_3_2_1_16_1"},{"volume-title":"Rouge: A package for automatic evaluation of summaries. Text Summarization Branches Out","year":"2004","author":"Lin Chin-Yew","key":"e_1_3_2_1_17_1"},{"volume-title":"Effective approaches to attention-based neural machine translation. arXiv preprint arXiv:1508.04025","year":"2015","author":"Luong Minh-Thang","key":"e_1_3_2_1_18_1"},{"key":"e_1_3_2_1_19_1","unstructured":"Tomas Mikolov Ilya Sutskever Kai Chen Greg S Corrado and Jeff Dean. 2013. Distributed representations of words and phrases and their compositionality. In Advances in neural information processing systems. 3111--3119.  Tomas Mikolov Ilya Sutskever Kai Chen Greg S Corrado and Jeff Dean. 2013. Distributed representations of words and phrases and their compositionality. In Advances in neural information processing systems. 3111--3119."},{"volume-title":"Playing atari with deep reinforcement learning. arXiv preprint arXiv:1312.5602","year":"2013","author":"Mnih Volodymyr","key":"e_1_3_2_1_20_1"},{"volume-title":"et almbox","year":"2016","author":"Nallapati Ramesh","key":"e_1_3_2_1_21_1"},{"volume-title":"Learning to Coordinate Multiple Reinforcement Learning Agents for Diverse Query Reformulation. arXiv preprint arXiv:1809.10658","year":"2018","author":"Nogueira Rodrigo","key":"e_1_3_2_1_22_1"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"crossref","unstructured":"Rodrigo Nogueira and Kyunghyun Cho. 2017. Task-Oriented Query Reformulation with Reinforcement Learning. In EMNLP . 574--583.  Rodrigo Nogueira and Kyunghyun Cho. 2017. Task-Oriented Query Reformulation with Reinforcement Learning. In EMNLP . 574--583.","DOI":"10.18653\/v1\/D17-1061"},{"volume-title":"MEMEN: multi-layer embedding with memory networks for machine comprehension. arXiv preprint arXiv:1707.09098","year":"2017","author":"Pan Boyuan","key":"e_1_3_2_1_24_1"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"crossref","unstructured":"Kishore Papineni Salim Roukos Todd Ward and Wei-Jing Zhu. 2002. BLEU: a method for automatic evaluation of machine translation. In ACL. ACL 311--318.  Kishore Papineni Salim Roukos Todd Ward and Wei-Jing Zhu. 2002. BLEU: a method for automatic evaluation of machine translation. In ACL. ACL 311--318.","DOI":"10.3115\/1073083.1073135"},{"volume-title":"Glove: Global vectors for word representation. In EMNLP. 1532--1543.","year":"2014","author":"Pennington Jeffrey","key":"e_1_3_2_1_26_1"},{"volume-title":"Sequence level training with recurrent neural networks. ICLR","year":"2016","author":"Ranzato Marc'Aurelio","key":"e_1_3_2_1_27_1"},{"volume-title":"International Conference on Machine Learning . 1889--1897","year":"2015","author":"Schulman John","key":"e_1_3_2_1_28_1"},{"volume-title":"Proximal policy optimization algorithms. arXiv preprint arXiv:1707.06347","year":"2017","author":"Schulman John","key":"e_1_3_2_1_29_1"},{"volume-title":"Query-reduction networks for question answering. arXiv preprint arXiv:1606.04582","year":"2016","author":"Seo Minjoon","key":"e_1_3_2_1_30_1"},{"key":"e_1_3_2_1_31_1","unstructured":"Ilya Sutskever Oriol Vinyals and Quoc V Le. 2014. Sequence to sequence learning with neural networks. In NIPS. 3104--3112.  Ilya Sutskever Oriol Vinyals and Quoc V Le. 2014. Sequence to sequence learning with neural networks. In NIPS. 3104--3112."},{"key":"e_1_3_2_1_32_1","unstructured":"Richard S Sutton David A McAllester Satinder P Singh and Yishay Mansour. 2000. Policy gradient methods for reinforcement learning with function approximation. In NIPS . 1057--1063.  Richard S Sutton David A McAllester Satinder P Singh and Yishay Mansour. 2000. Policy gradient methods for reinforcement learning with function approximation. In NIPS . 1057--1063."},{"volume-title":"LSTM-based deep learning models for non-factoid answer selection. arXiv preprint arXiv:1511.04108","year":"2015","author":"Tan Ming","key":"e_1_3_2_1_33_1"},{"volume-title":"Proximal Policy Optimization and its Dynamic Version for Sequence Generation. arXiv preprint arXiv:1808.07982","year":"2018","author":"Tuan Yi-Lin","key":"e_1_3_2_1_34_1"},{"volume-title":"No metrics are perfect: Adversarial reward learning for visual storytelling. arXiv preprint arXiv:1804.09160","year":"2018","author":"Wang Xin","key":"e_1_3_2_1_35_1"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1080\/09540099108946587"},{"volume-title":"Neural language correction with character-based attention. arXiv preprint arXiv:1603.09727","year":"2016","author":"Xie Ziang","key":"e_1_3_2_1_37_1"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N16-1042"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"crossref","unstructured":"Xingxing Zhang and Mirella Lapata. 2017. Sentence Simplification with Deep Reinforcement Learning. In EMNLP. 584--594.  Xingxing Zhang and Mirella Lapata. 2017. Sentence Simplification with Deep Reinforcement Learning. In EMNLP. 584--594.","DOI":"10.18653\/v1\/D17-1062"}],"event":{"name":"CIKM '19: The 28th ACM International Conference on Information and Knowledge Management","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Beijing China","acronym":"CIKM '19"},"container-title":["Proceedings of the 28th ACM International Conference on Information and Knowledge Management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3357384.3358046","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3357384.3358046","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T23:44:18Z","timestamp":1750203858000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3357384.3358046"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,11,3]]},"references-count":39,"alternative-id":["10.1145\/3357384.3358046","10.1145\/3357384"],"URL":"https:\/\/doi.org\/10.1145\/3357384.3358046","relation":{},"subject":[],"published":{"date-parts":[[2019,11,3]]},"assertion":[{"value":"2019-11-03","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}