{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T19:45:01Z","timestamp":1776887101300,"version":"3.51.2"},"reference-count":29,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,4]]},"DOI":"10.1109\/icassp.2018.8461785","type":"proceedings-article","created":{"date-parts":[[2018,9,21]],"date-time":"2018-09-21T22:24:48Z","timestamp":1537568688000},"page":"5754-5758","source":"Crossref","is-referenced-by-count":91,"title":["Towards End-to-end Spoken Language Understanding"],"prefix":"10.1109","author":[{"given":"Dmitriy","family":"Serdyuk","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yongqiang","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christian","family":"Fuegen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anuj","family":"Kumar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Baiyang","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yoshua","family":"Bengio","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","author":"bahdanau","year":"2014","journal-title":"Neural machine translation by jointly learning to align and translate"},{"key":"ref11","author":"gehring","year":"2017","journal-title":"Convolutional sequence to sequence learning"},{"key":"ref12","article-title":"Show, attend and tell: Neural image caption generation with visual attention","author":"xu","year":"2015","journal-title":"ICML"},{"key":"ref13","author":"van den oord","year":"2016","journal-title":"WaveNet A Generative Model for 
Raw Audio"},{"key":"ref14","article-title":"Deep speech 2: End-to-end speech recognition in English and Mandarin","author":"amodei","year":"2016","journal-title":"ICML"},{"key":"ref15","article-title":"Listen, attend and spell: A neural network for large vocabulary conversational speech recognition","author":"chan","year":"2016","journal-title":"ICASSP"},{"key":"ref16","author":"soltau","year":"2016","journal-title":"Neural speech recognizer Acoustic-to-word lstm model for large vocabulary speech recognition"},{"key":"ref17","article-title":"Attention-based models for speech recognition","author":"chorowski","year":"2015","journal-title":"NIPS"},{"key":"ref18","article-title":"End-to-end attention-based large vocabulary speech recognition","author":"bahdanau","year":"2016","journal-title":"ICASSP"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-312"},{"key":"ref28","article-title":"Natural language processing (almost) from scratch","author":"collobert","year":"2011","journal-title":"JMLR"},{"key":"ref4","article-title":"Easy contextual intent prediction and slot detection","author":"bhargava","year":"2013","journal-title":"ICASSP"},{"key":"ref27","article-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift","author":"ioffe","year":"2015","journal-title":"ICML"},{"key":"ref3","article-title":"Recurrent neural networks for language understanding","author":"yao","year":"2014","journal-title":"InterSpeech"},{"key":"ref6","article-title":"Application of deep belief networks for natural language understanding","author":"ruhi","year":"2014","journal-title":"IEEE\/ACM Transactions on Audio Speech and Language Processing"},{"key":"ref29","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v29i1.9513","article-title":"Recurrent convolutional neural networks for text classification","author":"lai","year":"2015","journal-title":"AAAI"},{"key":"ref5","article-title":"Recurrent neural network and 
LSTM models for lexical utterance classification","author":"ravuri","year":"2015","journal-title":"InterSpeech"},{"key":"ref8","article-title":"A reranking approach for recognition and classification of speech input in conversational dialogue systems","author":"morbini","year":"2012","journal-title":"SLT"},{"key":"ref7","article-title":"Towards deeper understanding: Deep convex networks for semantic utterance classification","author":"tur","year":"2012","journal-title":"ICASSP"},{"key":"ref2","article-title":"Contextual domain classification in spoken language understanding systems using recurrent neural network","author":"xu","year":"2014","journal-title":"ICASSP"},{"key":"ref9","article-title":"Sequence to sequence learning with neural networks","author":"sutskever","year":"2014","journal-title":"NIPS"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1002\/9781119992691"},{"key":"ref20","article-title":"Long short-term memory recurrent neural network architectures for large scale acoustic modeling","author":"sak","year":"2014","journal-title":"InterSpeech"},{"key":"ref22","author":"graves","year":"2012","journal-title":"Sequence transduction with recurrent neural networks"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref24","author":"chung","year":"2014","journal-title":"Empirical evaluation of gated recurrent neural networks on sequence modeling"},{"key":"ref23","author":"battenberg","year":"2017","journal-title":"Exploring neural transducers for end-to-end speech recognition"},{"key":"ref26","author":"kingma","year":"2014","journal-title":"Adam A method for stochastic optimization"},{"key":"ref25","article-title":"The ATIS spoken language systems pilot corpus","author":"hemphill","year":"1990","journal-title":"DARPA Speech and Natural Language Workshop"}],"event":{"name":"ICASSP 2018 - 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Calgary, 
AB","start":{"date-parts":[[2018,4,15]]},"end":{"date-parts":[[2018,4,20]]}},"container-title":["2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8450881\/8461260\/08461785.pdf?arnumber=8461785","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,2]],"date-time":"2022-09-02T10:49:40Z","timestamp":1662115780000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8461785\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/icassp.2018.8461785","relation":{},"subject":[],"published":{"date-parts":[[2018,4]]}}}