{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,16]],"date-time":"2025-02-16T18:40:03Z","timestamp":1739731203285,"version":"3.37.1"},"reference-count":23,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009,12]]},"DOI":"10.1109\/asru.2009.5373454","type":"proceedings-article","created":{"date-parts":[[2010,1,13]],"date-time":"2010-01-13T20:40:58Z","timestamp":1263415258000},"page":"228-231","source":"Crossref","is-referenced-by-count":2,"title":["Improved decision trees for multi-stream HMM-based audio-visual continuous speech recognition"],"prefix":"10.1109","author":[{"given":"Jing","family":"Huang","sequence":"first","affiliation":[]},{"given":"Karthik","family":"Visweswariah","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"article-title":"Fundamentals of speech recognition","year":"1993","author":"rabiner","key":"ref10"},{"key":"ref11","article-title":"Late integration in audio-visual continuous speech recognition","author":"verma","year":"1999","journal-title":"Proc IEEE Workshop of ASRU"},{"key":"ref12","article-title":"Confusability of phonemes grouped according to their viseme classes in noisy environments","author":"lucey","year":"2004","journal-title":"10th Australian International Conference on Speech Science & Technology"},{"key":"ref13","article-title":"Audio-visual speech recognition with a hybrid SVM-HMM system","author":"gurban","year":"2005","journal-title":"Proc 13th European Signal Processing Conference"},{"key":"ref14","article-title":"Efficient Likelihood Computation in Multi-Stream HMM Based Audio-Visual Speech Recognition","author":"marcheret","year":"2004","journal-title":"Int Conf Speech Language Processing 98"},{"key":"ref15","article-title":"Frame-Dependent Multi-Stream Reliability Indicators for Audio-Visual Speech Recognition","author":"garg","year":"2003","journal-title":"Int Conf Acoustic Speech and Signal Processing"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2005.1521429"},{"key":"ref17","article-title":"Discriminatively Trained Features Using fMPE for Multi-Stream Audio-Visual Speech Recognition","author":"huang","year":"2005","journal-title":"Proc INTERSPEECH"},{"key":"ref18","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2009-426","article-title":"Combined Discriminative Training for Multi-Stream HMM-based Audio-Visual Speech Recognition","author":"huang","year":"2009","journal-title":"Proc INTERSPEECH"},{"key":"ref19","article-title":"Decision trees for phonological rules in contiuous speech","author":"bahl","year":"1991","journal-title":"Proc ICASSP"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/6046.985551"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"591","DOI":"10.21437\/Eurospeech.1999-152","article-title":"Multi-stream speech recognition: Ready for prime time?","author":"janin","year":"1999","journal-title":"Proc Europ Conf Speech Technol"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"1260","DOI":"10.1155\/S1110865702206150","article-title":"Noise adaptive stream weighting in audio-visual speech recognition","volume":"11","author":"heckmann","year":"2002","journal-title":"EURASIP J Appl Signal Process"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/6046.865479"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/B0-08-044854-2\/00912-3"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2003.817150"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/5.664274"},{"key":"ref1","first-page":"265","article-title":"Automatic lipreading to enhance speech recognition","author":"petajan","year":"0","journal-title":"Proc Global Communication Conf"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2004.10.007"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2000.861810"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.1991.150402"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2009.5372904"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-662-13015-5"}],"event":{"name":"Understanding (ASRU)","start":{"date-parts":[[2009,11,13]]},"location":"Moreno, Italy","end":{"date-parts":[[2009,12,17]]}},"container-title":["2009 IEEE Workshop on Automatic Speech Recognition &amp; Understanding"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/5357590\/5372876\/05373454.pdf?arnumber=5373454","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,16]],"date-time":"2025-02-16T18:15:56Z","timestamp":1739729756000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/5373454\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,12]]},"references-count":23,"URL":"https:\/\/doi.org\/10.1109\/asru.2009.5373454","relation":{},"subject":[],"published":{"date-parts":[[2009,12]]}}}