{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T08:20:26Z","timestamp":1729671626370,"version":"3.28.0"},"reference-count":25,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,11]]},"DOI":"10.23919\/apsipa.2018.8659595","type":"proceedings-article","created":{"date-parts":[[2019,3,18]],"date-time":"2019-03-18T23:11:49Z","timestamp":1552950709000},"page":"1478-1482","source":"Crossref","is-referenced-by-count":2,"title":["Deep Speaker Embeddings with Convolutional Neural Network on Supervector for Text-Independent Speaker Recognition"],"prefix":"10.23919","author":[{"given":"Danwei","family":"Cai","sequence":"first","affiliation":[]},{"given":"Zexin","family":"Cai","sequence":"additional","affiliation":[]},{"given":"Ming","family":"Li","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"crossref","first-page":"1487","DOI":"10.21437\/Interspeech.2017-1608","article-title":"End-to-end text-independent speaker verification with triplet loss on short utterances","author":"zhang","year":"2017","journal-title":"Proc of Interspeech"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-452"},{"key":"ref12","first-page":"165","article-title":"Deep neural network-based speaker embeddings for end-to-end speaker verification","author":"snyder","year":"2016","journal-title":"Proc of SLT"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"74","DOI":"10.21437\/Odyssey.2018-11","article-title":"Exploring the encoding layer and loss function in end-to-end speaker and language recognition system","author":"cai","year":"2018","journal-title":"Proc Odyssey"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462025"},{"key":"ref15","article-title":"Insights into end-to-end learning scheme for language identification","author":"cai","year":"2018","journal-title":"Proc ICASSP"},{"key":"ref16","first-page":"1120","article-title":"Speaker verification and spoken language identification using a generalized i-vector framework with phonetic tokenizations and tandem features","author":"li","year":"2014","journal-title":"Proc of Interspeech"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s11265-015-1019-z"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"249","DOI":"10.21437\/Interspeech.2011-53","article-title":"Analysis of i-vector length normalization in speaker recognition systems","author":"garcia-romero","year":"2011","journal-title":"Proc of Interspeech"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.21236\/ADA613971"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1006\/dspr.1999.0361"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6854363"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2010.2064307"},{"key":"ref8","first-page":"171","article-title":"End-to-end attention based text-dependent speaker verification","author":"zhang","year":"2016","journal-title":"Proc of SLT"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472652"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2009.08.009"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-620"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1991.150355"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2015.7404779"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.123"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.3115\/1075812.1075885"},{"key":"ref24","first-page":"69","article-title":"The fisher corpus: a resource for the next generations of speech-to-text","volume":"4","author":"cieri","year":"2004","journal-title":"Proc Int Conf on Lang Resources and Evaluation"},{"journal-title":"The NIST year 2010 speaker rccognition evaluation plan","year":"0","key":"ref23"},{"key":"ref25","article-title":"The bosaris toolkit: Theory, algorithms and code for surviving the new DCF","author":"brmmer","year":"2011","journal-title":"NIST SRE Analysis Workshop"}],"event":{"name":"2018 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","start":{"date-parts":[[2018,11,12]]},"location":"Honolulu, HI, USA","end":{"date-parts":[[2018,11,15]]}},"container-title":["2018 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8648538\/8659446\/08659595.pdf?arnumber=8659595","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,14]],"date-time":"2023-09-14T16:47:24Z","timestamp":1694710044000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8659595\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,11]]},"references-count":25,"URL":"https:\/\/doi.org\/10.23919\/apsipa.2018.8659595","relation":{},"subject":[],"published":{"date-parts":[[2018,11]]}}}