{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T11:24:41Z","timestamp":1725794681233},"reference-count":11,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,6]]},"DOI":"10.1109\/tsp.2016.7760884","type":"proceedings-article","created":{"date-parts":[[2016,12,1]],"date-time":"2016-12-01T16:40:11Z","timestamp":1480610411000},"page":"303-306","source":"Crossref","is-referenced-by-count":1,"title":["Depth-based features in audio-visual speech recognition"],"prefix":"10.1109","author":[{"given":"Karel","family":"Palecek","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Josef","family":"Chaloupka","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref4","first-page":"142","article-title":"Improving visual features for lip-reading","author":"lan","year":"2010"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"535","DOI":"10.1109\/CVPR.2004.1315210","article-title":"Real-time combined 2d+3d active appearance models","author":"xiao","year":"2004","journal-title":"Proceedings of the 2004 IEEE Computer Society Conference on Computer Vision and Pattern Recognition Ser CVPR'04"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2009.2030637"},{"key":"ref6","article-title":"WAPUSK20-A database for robust audiovisual speech recognition","author":"vorwerk","year":"2010","journal-title":"Proceedings First InternationalConference on Language Resources and Evaluation"},{"key":"ref11","article-title":"Face alignment by explicit shape regression","author":"cao","year":"2012","journal-title":"CVPR"},{"key":"ref5","first-page":"2525","article-title":"The audio-video australian english speech data corpus avozes","author":"goecke","year":"2004"},{"key":"ref8","first-page":"2521","article-title":"3d lip-tracking for audio-visual speech recognition in real applications","author":"c\u00edsa?","year":"2004","journal-title":"The Journal of the Acoustical Society of Korea"},{"key":"ref7","first-page":"235","article-title":"A comparative study of 2d and 3d lip tracking methods for av asr","author":"goecke","year":"2008","journal-title":"AVSPN"},{"key":"ref2","first-page":"493","article-title":"Audio-visual speech recognition for slavonic languages (czech and russian)","author":"c\u00edsa?","year":"2006"},{"key":"ref9","first-page":"2714","article-title":"Audio-visual speech recognition incorporating facial depth information captured by the kinect","author":"galatas","year":"2012","journal-title":"Proceedings of the 20th European Signal Processing Conference (EUSIPCO)"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2014.06.004"}],"event":{"name":"2016 39th International Conference on Telecommunications and Signal Processing (TSP)","start":{"date-parts":[[2016,6,27]]},"location":"Vienna, Austria","end":{"date-parts":[[2016,6,29]]}},"container-title":["2016 39th International Conference on Telecommunications and Signal Processing (TSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7750937\/7760810\/07760884.pdf?arnumber=7760884","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,25]],"date-time":"2017-06-25T01:04:28Z","timestamp":1498352668000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7760884\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,6]]},"references-count":11,"URL":"https:\/\/doi.org\/10.1109\/tsp.2016.7760884","relation":{},"subject":[],"published":{"date-parts":[[2016,6]]}}}