{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T15:29:17Z","timestamp":1775230157887,"version":"3.50.1"},"reference-count":20,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,3]]},"DOI":"10.1109\/icassp.2016.7472029","type":"proceedings-article","created":{"date-parts":[[2016,6,24]],"date-time":"2016-06-24T01:58:30Z","timestamp":1466733510000},"page":"2009-2013","source":"Crossref","is-referenced-by-count":21,"title":["Decoding visemes: Improving machine lip-reading"],"prefix":"10.1109","author":[{"given":"Helen L.","family":"Bear","sequence":"first","affiliation":[]},{"given":"Richard","family":"Harvey","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"crossref","first-page":"1082","DOI":"10.1109\/TSA.2005.857572","article-title":"Visual model structures and synchrony constraints for audio-visual speech recognition","volume":"14","author":"timothy","year":"2006","journal-title":"Audio Speech and Language Processing IEEE Transactions on"},{"key":"ref11","first-page":"2109","article-title":"Viseme definitions comparison for visual-only speech recognition","author":"cappelletta","year":"2011","journal-title":"Proc 19th European Signal Processing Conference 2011"},{"key":"ref12","first-page":"1","article-title":"Comparison of phoneme and viseme based acoustic units for speech driven realistic lip animation","author":"bozkurt","year":"2007","journal-title":"Signal Processing and Communications Applications"},{"key":"ref13","first-page":"190","article-title":"Finding phonemes: improving machine lip-reading","author":"helen","year":"2015","journal-title":"1st Joint International Conference on Facial Analysis Animation and Audio-Visual Speech Processing (FAAVSP)"},{"key":"ref14","article-title":"The HTK book version 3.4","author":"steve","year":"2006"},{"key":"ref15","first-page":"93","article-title":"The DARPA speech recognition research database: specifications and status","author":"william","year":"1986","journal-title":"Proc DARPA Workshop on Speech Recognition"},{"key":"ref16","article-title":"Improving visual features for lip-reading","volume":"7","author":"lan","year":"2010","journal-title":"International Conference on Audio-Visual Speech Processing"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000029666.37597.d3"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/34.982900"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"36","DOI":"10.1080\/00031305.1983.10483087","article-title":"A leisurely look at the bootstrap, the jackknife, and cross-validation","volume":"37","author":"efron","year":"1983","journal-title":"The American Statistician"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2010.205"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/34.927467"},{"key":"ref6","first-page":"322","article-title":"Phoneme-to-viseme mapping for visual speech recognition","author":"cappelletta","year":"2012","journal-title":"ICPRAM"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2014.7025274"},{"key":"ref8","first-page":"92530g","article-title":"Some observations on computer lipreading: moving from the dream to the reality","author":"helen","year":"2014","journal-title":"SPIE Defence and Security"},{"key":"ref7","first-page":"230","article-title":"Which phoneme-to-viseme maps best improve visual-only computer lip-reading?","author":"helen","year":"2014","journal-title":"Advances in Visual Computing"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2012.192"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2007.366941"},{"key":"ref9","author":"liam howell","year":"2014","journal-title":"Confusion modelling for lip-reading"},{"key":"ref20","doi-asserted-by":"crossref","first-page":"796","DOI":"10.1044\/jshr.1104.796","article-title":"Confusions among visually perceived consonants","volume":"11","author":"cletus","year":"1968","journal-title":"Journal of Speech Language and Hearing Research"}],"event":{"name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Shanghai","start":{"date-parts":[[2016,3,20]]},"end":{"date-parts":[[2016,3,25]]}},"container-title":["2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7465907\/7471614\/07472029.pdf?arnumber=7472029","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,17]],"date-time":"2024-06-17T21:28:02Z","timestamp":1718659682000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7472029\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,3]]},"references-count":20,"URL":"https:\/\/doi.org\/10.1109\/icassp.2016.7472029","relation":{},"subject":[],"published":{"date-parts":[[2016,3]]}}}