{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,16]],"date-time":"2025-11-16T07:23:27Z","timestamp":1763277807910,"version":"3.28.0"},"reference-count":22,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,4]]},"DOI":"10.1109\/icassp.2018.8461551","type":"proceedings-article","created":{"date-parts":[[2018,9,21]],"date-time":"2018-09-21T22:24:48Z","timestamp":1537568688000},"page":"5529-5533","source":"Crossref","is-referenced-by-count":11,"title":["Dnn-Based Voice Activity Detection Using Auxiliary Speech Models in Noisy Environments"],"prefix":"10.1109","author":[{"given":"Yuuki","family":"Tachioka","sequence":"first","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2064307"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-589"},{"key":"ref12","article-title":"Recognize and separate approach for speech denoising using nonnegative matrix factorization","author":"sohrab","year":"2015","journal-title":"Proceedings of EUSIPCO"},{"key":"ref13","first-page":"1760","article-title":"Text-informed speech enhancement with deep neural networks","author":"kinoshita","year":"2015","journal-title":"Proceedings of Interspeech"},{"key":"ref14","doi-asserted-by":"crossref","first-page":"788","DOI":"10.1038\/44565","article-title":"Learning the parts of objects by nonnegative matrix factorization","volume":"401","author":"lee","year":"1999","journal-title":"Nature"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2006.876726"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1093\/ietisy\/e88-d.3.553"},{"key":"ref17","first-page":"1217","article-title":"Phoneme-dependent NMF for speech enhancement in monaural mixtures","author":"raj","year":"2011","journal-title":"Proceedings of Interspeech"},{"key":"ref18","doi-asserted-by":"crossref","first-page":"2461","DOI":"10.21437\/Interspeech.2017-61","article-title":"Cou-pled initialization of multi-channel non-negative matrix factorization based on spatial and spectral information","author":"tachioka","year":"2017","journal-title":"Proceedings of Interspeech"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2013.2252615"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1093\/ietisy\/e91-d.3.467"},{"key":"ref3","first-page":"1","article-title":"Voice activity detection based on density ratio estimation and system combination","author":"tachioka","year":"2013","journal-title":"Proceedings of APSIPA"},{"key":"ref6","first-page":"1","article-title":"Deep belief networks based voice activity detection","volume":"21","author":"zhang","year":"2013","journal-title":"IEEE Transactions on Audio Speech and Language Processing"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178829"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639096"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/97.736233"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1002\/j.1538-7305.1975.tb02840.x"},{"key":"ref9","article-title":"Feedback connection for deep neural network-based acoustic modeling","author":"tran","year":"2017","journal-title":"Proceedings of ICASSP"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1250\/ast.30.363"},{"key":"ref22","first-page":"436","article-title":"The NTT CHiME-3 system: Advances in speech enhancement and recognition for mobile multi-microphone devices","author":"yoshioka","year":"0","journal-title":"Proc of ASRU 2015"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1984.1164453"}],"event":{"name":"ICASSP 2018 - 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2018,4,15]]},"location":"Calgary, AB","end":{"date-parts":[[2018,4,20]]}},"container-title":["2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8450881\/8461260\/08461551.pdf?arnumber=8461551","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,8,23]],"date-time":"2020-08-23T22:36:43Z","timestamp":1598222203000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8461551\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4]]},"references-count":22,"URL":"https:\/\/doi.org\/10.1109\/icassp.2018.8461551","relation":{},"subject":[],"published":{"date-parts":[[2018,4]]}}}