{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,14]],"date-time":"2026-02-14T10:31:07Z","timestamp":1771065067263,"version":"3.50.1"},"reference-count":61,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2017,12,1]],"date-time":"2017-12-01T00:00:00Z","timestamp":1512086400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE\/ACM Trans. Audio Speech Lang. Process."],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1109\/taslp.2017.2751747","type":"journal-article","created":{"date-parts":[[2017,11,23]],"date-time":"2017-11-23T19:08:05Z","timestamp":1511464085000},"page":"2301-2312","source":"Crossref","is-referenced-by-count":16,"title":["Crosslingual and Multilingual Speech Recognition Based on the Speech Manifold"],"prefix":"10.1109","volume":"25","author":[{"given":"Reza","family":"Sahraeian","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dirk","family":"Van Compernolle","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1049\/ip-i-2.1992.0018"},{"key":"ref38","author":"fant","year":"1970","journal-title":"Acoustic Theory of Speech Production"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2006.1660002"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2167610"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2008.4518596"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1006\/csla.2000.0148"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2007.899533"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1162\/089976603321780317"},{"key":"ref35","first-page":"1","article-title":"Algorithms for manifold learning","author":"cayton","year":"2005"},{"key":"ref34","article-title":"A geometric perspective on speech sounds","author":"jansen","year":"2005"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2017.04.016"},{"key":"ref61","first-page":"348","article-title":"Manifold regularized deep neural networks","author":"tomar","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref28","article-title":"Estimating articulatory parameters from the acoustic speech signal","author":"richmond","year":"2002"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2003.822636"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1121\/1.3514544"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2134090"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639081"},{"key":"ref22","first-page":"336","article-title":"The language-independent bottleneck features","author":"vesel`y","year":"0","journal-title":"Proc IEEE Spoken Lang Technol Workshop"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2011.6163958"},{"key":"ref24","author":"jakobson","year":"1951","journal-title":"Preliminaries to speech analysis The distinctive features and their correlates"},{"key":"ref23","first-page":"90","article-title":"Multilingual bottle-neck features and its application for under-resourced languages","author":"vu","year":"0","journal-title":"Proc Int Workshop Spoken Lang Technol Under-Resourced Lang"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1121\/1.403994"},{"key":"ref25","author":"chomsky","year":"1968","journal-title":"The Sound Pattern of English"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1214\/009053607000000640"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1162\/089976602317250942"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/89.759034"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2010.5495662"},{"key":"ref57","first-page":"1","article-title":"The KALDI speech recognition toolkit","author":"povey","year":"0","journal-title":"Proc IEEE Workshop on Automatic Speech Recognition and Understanding"},{"key":"ref56","article-title":"Parallel training of deep neural networks with natural gradient and parameter averaging","author":"povey","year":"2014"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2012.6288862"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639248"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177704472"},{"key":"ref52","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4419-1570-2","author":"principe","year":"2010","journal-title":"Information Theoretic Learning Renyi's Entropy and Kernel Perspectives"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2000.859138"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2009.4960588"},{"key":"ref40","first-page":"2399","article-title":"Manifold regularization: A geometric framework for learning from examples","volume":"7","author":"belkin","year":"2006","journal-title":"Mach Learn Res"},{"key":"ref12","first-page":"1433","article-title":"An evaluation of cross-language adaptation and native speech training for rapid HMM construction based on very limited training data","author":"zhao","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.17159\/sajs.2017\/20160038"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2010.5495646"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2013.2281575"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2012.6289010"},{"key":"ref17","first-page":"877","author":"thomas","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2013.2277932"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639084"},{"key":"ref4","first-page":"16","article-title":"Speech recognition and keyword spotting for low resource languages: Babel project research at CUED","author":"gales","year":"0","journal-title":"Proc Int Workshop Spoken Lang Technol Under-Resourced Lang"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2013.07.008"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.1997.659141"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICSLP.1996.607240"},{"key":"ref8","first-page":"371","article-title":"Fast bootstrapping of LVCSR systems with multilingual phoneme sets","author":"schultz","year":"0","journal-title":"Proc EUROSPEECH"},{"key":"ref7","article-title":"Language independent speech recognition","author":"d\u2019hoore","year":"2000"},{"key":"ref49","first-page":"1912","article-title":"Exploring how deep neural networks form phonemic categories","author":"nagamine","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6393(00)00094-7"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2013.2238931"},{"key":"ref45","first-page":"1255","article-title":"Under-resourced speech recognition based on the speech manifold","author":"sahraeian","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2012.6288863"},{"key":"ref47","article-title":"Feature learning in deep neural networks-studies on speech recognition tasks","author":"yu","year":"2013"},{"key":"ref42","first-page":"86","article-title":"Semi-supervised learning of speech sounds","author":"jansen","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref41","article-title":"Intrinsic spectral analysis for zero and high resource speech recognition","author":"jansen","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref44","first-page":"1722","article-title":"Intrinsic spectral analysis based on temporal context features for query-by-example spoken term detection","author":"yang","year":"0","journal-title":"Proc INTERSPEECH"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2013.6707739"}],"container-title":["IEEE\/ACM Transactions on Audio, Speech, and Language Processing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6570655\/8114348\/08114354.pdf?arnumber=8114354","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,12]],"date-time":"2022-01-12T16:24:07Z","timestamp":1642004647000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/8114354\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,12]]},"references-count":61,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/taslp.2017.2751747","relation":{},"ISSN":["2329-9290","2329-9304"],"issn-type":[{"value":"2329-9290","type":"print"},{"value":"2329-9304","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,12]]}}}