{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,22]],"date-time":"2024-10-22T20:05:17Z","timestamp":1729627517401,"version":"3.28.0"},"reference-count":28,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,3]]},"DOI":"10.1109\/icassp.2016.7472808","type":"proceedings-article","created":{"date-parts":[[2016,6,24]],"date-time":"2016-06-24T01:58:30Z","timestamp":1466733510000},"page":"5895-5899","source":"Crossref","is-referenced-by-count":16,"title":["Filterbank learning using Convolutional Restricted Boltzmann Machine for speech recognition"],"prefix":"10.1109","author":[{"given":"Hardik B.","family":"Sailor","sequence":"first","affiliation":[]},{"given":"Hemant A.","family":"Patil","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553453"},{"key":"ref11","first-page":"1096","article-title":"Unsupervised feature learning for audio classification using convolutional deep belief networks","author":"lee","year":"2009","journal-title":"23rd Annual Conference on Neural Information Processing Systems"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1162\/0899766052530839"},{"key":"ref13","first-page":"890","article-title":"Acoustic modeling with deep neural networks using raw time signal for LVCSR","author":"tuske","year":"2014","journal-title":"InterSpeech"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178781"},{"key":"ref15","first-page":"26","article-title":"Convolutional neural networks for acoustic modeling of raw time signal in LVCSR","author":"golik","year":"2015","journal-title":"InterSpeech"},{"key":"ref16","first-page":"1","article-title":"Learning the speech front-end with raw waveform CLDNNs","author":"sainath","year":"2015","journal-title":"InterSpeech"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2013.6707746"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/89.326615"},{"key":"ref19","first-page":"807","article-title":"Rectified linear units improve restricted Boltzmann machines","author":"nair","year":"2010","journal-title":"Proceedings of the 27th International Conference on Machine Learning (ICML)"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2009.5459469"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"436","DOI":"10.1038\/nature14539","article-title":"Deep learning","volume":"521","author":"bengio","year":"2015","journal-title":"Nature"},{"key":"ref27","article-title":"The kaldi speech recognition toolkit","author":"povey","year":"2011","journal-title":"2011 IEEE Workshop on Automatic Speech Recognition & Understanding"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.50"},{"key":"ref6","first-page":"1631","article-title":"Speech feature extraction using independent component analysis","volume":"3","author":"lee","year":"2000","journal-title":"IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP)"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1111\/cogs.12049"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2008.4518709"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1038\/nn831"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2013.2252316"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5947700"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2207989"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1162\/089976602760128018"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178847"},{"key":"ref21","first-page":"305","article-title":"Auditory features based on gammatone filters for robust speech recognition","author":"qi","year":"2013","journal-title":"2013 IEEE International Symposium on Circuits and Systems (ISCAS)"},{"key":"ref24","first-page":"27403","article-title":"DARPA TIMIT acoustic-phonetic continuous speech corpus CD-ROM. NIST speech disc 1\u20131.1","volume":"93","year":"1993","journal-title":"NASA STI\/Recon Technical Report N"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/18.119739"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/29.46546"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.3115\/1075527.1075614"}],"event":{"name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2016,3,20]]},"location":"Shanghai","end":{"date-parts":[[2016,3,25]]}},"container-title":["2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7465907\/7471614\/07472808.pdf?arnumber=7472808","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,24]],"date-time":"2017-06-24T17:00:13Z","timestamp":1498323613000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7472808\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,3]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/icassp.2016.7472808","relation":{},"subject":[],"published":{"date-parts":[[2016,3]]}}}