{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T20:11:22Z","timestamp":1772050282853,"version":"3.50.1"},"reference-count":30,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,5]]},"DOI":"10.1109\/icassp40776.2020.9053889","type":"proceedings-article","created":{"date-parts":[[2020,4,9]],"date-time":"2020-04-09T20:21:13Z","timestamp":1586463673000},"page":"6124-6128","source":"Crossref","is-referenced-by-count":182,"title":["Quartznet: Deep Automatic Speech Recognition with 1D Time-Channel Separable Convolutions"],"prefix":"10.1109","author":[{"given":"Samuel","family":"Kriman","sequence":"first","affiliation":[]},{"given":"Stanislav","family":"Beliaev","sequence":"additional","affiliation":[]},{"given":"Boris","family":"Ginsburg","sequence":"additional","affiliation":[]},{"given":"Jocelyn","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Oleksii","family":"Kuchaiev","sequence":"additional","affiliation":[]},{"given":"Vitaly","family":"Lavrukhin","sequence":"additional","affiliation":[]},{"given":"Ryan","family":"Leary","sequence":"additional","affiliation":[]},{"given":"Jason","family":"Li","sequence":"additional","affiliation":[]},{"given":"Yang","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref30","article-title":"Towards better decoding and language model integration in sequence to sequence models","author":"chorowski","year":"2016"},{"key":"ref10","article-title":"Learning visual representations at scale","author":"vanhoucke","year":"2014","journal-title":"ICLRE"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2460"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003730"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1819"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/1143844.1143891"},{"key":"ref15","article-title":"Letter-based speech recognition with gated convnets","author":"liptchinsky","year":"2017"},{"key":"ref16","article-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift","author":"ioffe","year":"2015"},{"key":"ref17","article-title":"Layer normalization","author":"ba","year":"2016"},{"key":"ref18","article-title":"Instance normalization: The missing ingredient for fast stylization","author":"ulyanov","year":"2016"},{"key":"ref19","first-page":"319","article-title":"Group normalization","author":"wu","year":"2018","journal-title":"Lecture Notes in Computer Science"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2414"},{"key":"ref4","article-title":"SqueezeNet: AlexNet-level accuracy with 50x fewer parameters and <1MB model","author":"iandola","year":"2016"},{"key":"ref27","article-title":"Mixed precision training","author":"micikevicius","year":"2017"},{"key":"ref3","article-title":"NeMo: a toolkit for building AI applications using neural modules","author":"kuchaiev","year":"2019"},{"key":"ref6","article-title":"EfficientNet: Rethinking model scaling for convolutional neural networks","author":"tan","year":"2019","journal-title":"ICML"},{"key":"ref29","article-title":"Towards end-to-end speech recognition with recurrent neural networks","author":"graves","year":"2014","journal-title":"ICML"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00716"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref7","article-title":"MobileNets: Efficient convolutional neural networks for mobile vision applications","author":"howard","year":"2017"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.3115\/1075527.1075614"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.195"},{"key":"ref1","first-page":"5206","article-title":"Librispeech: an ASR corpus based on public domain audio books","author":"panayotov","year":"2015","journal-title":"ICASSP"},{"key":"ref20","article-title":"Common Voice","year":"2019"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2680"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1285"},{"key":"ref24","article-title":"Improved regularization of convolutional neural networks with cutout","author":"devries","year":"2017"},{"key":"ref23","article-title":"Audio augmentation for speech recognition","author":"ko","year":"2015","journal-title":"InterSpeech"},{"key":"ref26","article-title":"Fully convolutional speech recognition","author":"zeghidour","year":"2018"},{"key":"ref25","article-title":"Stochastic gradient methods with layer-wise adaptive moments for training of deep networks","author":"ginsburg","year":"2019"}],"event":{"name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Barcelona, Spain","start":{"date-parts":[[2020,5,4]]},"end":{"date-parts":[[2020,5,8]]}},"container-title":["ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9040208\/9052899\/09053889.pdf?arnumber=9053889","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,28]],"date-time":"2022-06-28T00:16:36Z","timestamp":1656375396000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9053889\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,5]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/icassp40776.2020.9053889","relation":{},"subject":[],"published":{"date-parts":[[2020,5]]}}}