{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,22]],"date-time":"2024-10-22T18:30:42Z","timestamp":1729621842831,"version":"3.28.0"},"reference-count":13,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,3]]},"DOI":"10.1109\/icassp.2016.7472716","type":"proceedings-article","created":{"date-parts":[[2016,6,23]],"date-time":"2016-06-23T21:58:30Z","timestamp":1466719110000},"page":"5435-5439","source":"Crossref","is-referenced-by-count":6,"title":["Divergence estimation based on deep neural networks and its use for language identification"],"prefix":"10.1109","author":[{"given":"Yosuke","family":"Kashiwagi","sequence":"first","affiliation":[]},{"given":"Congying","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Daisuke","family":"Saito","sequence":"additional","affiliation":[]},{"given":"Nobuaki","family":"Minematsu","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","first-page":"2653","article-title":"Vocal tract normalization equals linear transformation in cepstral space","author":"pitz","year":"2001","journal-title":"InterSpeech"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/s00354-009-0091-y"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2010.2047340"},{"key":"ref13","first-page":"158","article-title":"Speaker-basis accent clustering using invariant structure analysis and the speech accent archive","author":"minematsu","year":"2014","journal-title":"Proc Odyssay"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2109382"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"1527","DOI":"10.1162\/neco.2006.18.7.1527","article-title":"A fast learning algorithm for deep belief nets","volume":"18","author":"geoffrey","year":"2006","journal-title":"Neural Computation"},{"key":"ref6","first-page":"1910","article-title":"Learning small-size DNN with output-distribution-based criteria","author":"li","year":"2014","journal-title":"Proc INTERSPEECH"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2082532"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2014.7078568"},{"journal-title":"NIST LRE Group","article-title":"The 2007 nist languag recognition evaluation plan (Ire07)","year":"2007","key":"ref7"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"1300","DOI":"10.1109\/TASL.2009.2032950","article-title":"GMM-SVM kernel with a Bhattacharyya-based distance for speaker recognition","volume":"18","author":"huai you","year":"2010","journal-title":"Audio Speech and Language Processing IEEE Transactions on"},{"key":"ref1","first-page":"317","article-title":"Approximating the Kullback Leibler divergence between gaussian mixture models","volume":"4","author":"john","year":"2007","journal-title":"Acoustics Speech and Signal Processing 2007 ICASSP 2007 IEEE International Conference on"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2004.1326053"}],"event":{"name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2016,3,20]]},"location":"Shanghai","end":{"date-parts":[[2016,3,25]]}},"container-title":["2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7465907\/7471614\/07472716.pdf?arnumber=7472716","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,24]],"date-time":"2017-06-24T13:00:27Z","timestamp":1498309227000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7472716\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,3]]},"references-count":13,"URL":"https:\/\/doi.org\/10.1109\/icassp.2016.7472716","relation":{},"subject":[],"published":{"date-parts":[[2016,3]]}}}