{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T15:29:16Z","timestamp":1775230156483,"version":"3.50.1"},"reference-count":28,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,4]]},"DOI":"10.1109\/icassp.2018.8461705","type":"proceedings-article","created":{"date-parts":[[2018,9,21]],"date-time":"2018-09-21T18:24:48Z","timestamp":1537554288000},"page":"5829-5833","source":"Crossref","is-referenced-by-count":17,"title":["Sequence-to-Sequence Asr Optimization Via Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Andros","family":"Tjandra","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sakriani","family":"Sakti","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Satoshi","family":"Nakamura","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1007\/BF00992696","article-title":"Simple statistical gradient-following algorithms for connectionist reinforcement learning","volume":"8","author":"ronald j","year":"1992","journal-title":"Machine Learning"},{"key":"ref11","author":"sutton","year":"1998","journal-title":"Introduction to Reinforcement Learning"},{"key":"ref12","article-title":"Minimum risk training for neural machine translation","volume":"1","author":"shen","year":"2016","journal-title":"Proceedings of the 54th Annual Meeting of the Associationfor Computational Linguistics ACL"},{"key":"ref13","first-page":"1471","article-title":"Vari-ance reduction techniques for gradient estimates in reinforcement learning","volume":"5","author":"evan","year":"2004","journal-title":"Journal of Machine Learning Research"},{"key":"ref14","first-page":"ii","article-title":"Neural variational inference and learning in belief networks","volume":"32","author":"mnih","year":"2014","journal-title":"Proceedings of the 31st International Conference on International Conference on Machine Learning"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.3115\/1075527.1075614"},{"key":"ref16","article-title":"The Kaldi speech recognition toolkit","author":"daniel","year":"2011","journal-title":"2011 IEEE Workshop on Automatic Speech Recognition &amp; Understanding"},{"key":"ref17","author":"awni y","year":"2014","journal-title":"First-pass large vocabulary continuous speech recognition using bi-directional recurrent dnns"},{"key":"ref18","author":"bing","year":"2015","journal-title":"Empirical evaluation of rectified activations in convolutional network"},{"key":"ref19","volume":"385","author":"alex","year":"2012","journal-title":"Supervised Sequence Labelling with Recurrent Neural Networks"},{"key":"ref28","author":"matt","year":"2017","journal-title":"Optimizing expected word error rate via sampling for speech recognition"},{"key":"ref4","first-page":"3156","article-title":"Show and tell: A neural image caption generator","author":"oriol","year":"2015","journal-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref27","author":"marc","year":"2015","journal-title":"Sequence level training with recurrent neural networks"},{"key":"ref3","first-page":"2048","article-title":"Show, attend and tell: Neural image caption generation with visual attention","author":"kelvin","year":"2015","journal-title":"International Conference on Machine Learning"},{"key":"ref6","first-page":"4960","article-title":"Listen, attend and spell: A neural network for large vocabulary conversational speech recognition","author":"william","year":"2016","journal-title":"Acoustics Speech and Signal Processing (ICASSP) 2016 IEEE International Conference on"},{"key":"ref5","first-page":"4945","article-title":"End-to-end attention-based large vocabulary speech recognition","author":"dzmitry","year":"2016","journal-title":"Proc ICASSP 2016"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"270","DOI":"10.1162\/neco.1989.1.2.270","article-title":"A learning algorithm for continually running fully recurrent neural networks","volume":"1","author":"ronald j","year":"1989","journal-title":"Neural Computation"},{"key":"ref7","first-page":"309","article-title":"Attention-based wav2text with feature transfer learning","author":"andros","year":"2017","journal-title":"2017 IEEE Automatic Speech Recognition and Understanding Workshop ASRU 2017"},{"key":"ref2","author":"dzmitry","year":"2014","journal-title":"Neural machine translation by jointly learning to align and translate"},{"key":"ref9","author":"yonghui","year":"2016","journal-title":"Googlc's neural machine translation system Bridging the gap between human and machine translation"},{"key":"ref1","first-page":"3104","article-title":"Sequence to sequence learning with neural networks","author":"ilya","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref20","author":"diederik","year":"2014","journal-title":"Adam A method for stochastic optimization"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"volodymyr","year":"2015","journal-title":"Nature"},{"key":"ref21","article-title":"Joint CTC-attention based end-to-end speech recognition using multitask learning","author":"suyoun","year":"2017","journal-title":"Acoustics Speech and Signal Processing (ICASSP) 2017 IEEE International Conference"},{"key":"ref24","first-page":"579","article-title":"Reinforcement learning in robotics: A survey","author":"jens","year":"2012","journal-title":"Reinforcement Learning"},{"key":"ref23","doi-asserted-by":"crossref","first-page":"484","DOI":"10.1038\/nature16961","article-title":"Mastering the game of go with deep neural networks and tree search","volume":"529","author":"david","year":"2016","journal-title":"Nature"},{"key":"ref26","author":"jiwei","year":"2016","journal-title":"Deep Reinforcement Learning for Dialogue Generation"},{"key":"ref25","first-page":"956","article-title":"Reinforcement learning for spoken dialogue systems","author":"satinder","year":"2000","journal-title":"Advances in neural information processing systems"}],"event":{"name":"ICASSP 2018 - 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Calgary, AB","start":{"date-parts":[[2018,4,15]]},"end":{"date-parts":[[2018,4,20]]}},"container-title":["2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8450881\/8461260\/08461705.pdf?arnumber=8461705","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,23]],"date-time":"2020-08-23T22:26:52Z","timestamp":1598221612000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8461705\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/icassp.2018.8461705","relation":{},"subject":[],"published":{"date-parts":[[2018,4]]}}}