{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,4]],"date-time":"2025-10-04T08:04:50Z","timestamp":1759565090721,"version":"3.37.3"},"reference-count":28,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,9,26]],"date-time":"2022-09-26T00:00:00Z","timestamp":1664150400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,9,26]],"date-time":"2022-09-26T00:00:00Z","timestamp":1664150400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100011222","name":"National Laboratory of Pattern Recognition (NLPR)","doi-asserted-by":"publisher","award":["202200042"],"award-info":[{"award-number":["202200042"]}],"id":[{"id":"10.13039\/501100011222","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002766","name":"Beijing University of Posts and Telecommunications","doi-asserted-by":"publisher","award":["2021RC37"],"award-info":[{"award-number":["2021RC37"]}],"id":[{"id":"10.13039\/501100002766","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,9,26]]},"DOI":"10.1109\/mmsp55362.2022.9949293","type":"proceedings-article","created":{"date-parts":[[2022,11,22]],"date-time":"2022-11-22T21:39:16Z","timestamp":1669153156000},"page":"1-6","source":"Crossref","is-referenced-by-count":4,"title":["A Keypoint Based Enhancement Method for Audio Driven Free View Talking Head Synthesis"],"prefix":"10.1109","author":[{"given":"Yichen","family":"Han","sequence":"first","affiliation":[{"name":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications,Beijing,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ya","family":"Li","sequence":"additional","affiliation":[{"name":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications,Beijing,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yingming","family":"Gao","sequence":"additional","affiliation":[{"name":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications,Beijing,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jinlong","family":"Xue","sequence":"additional","affiliation":[{"name":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications,Beijing,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Songpo","family":"Wang","sequence":"additional","affiliation":[{"name":"DeepScience Tech Ltd.,Beijing,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lei","family":"Yang","sequence":"additional","affiliation":[{"name":"DeepScience Tech Ltd.,Beijing,China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"crossref","first-page":"2616","DOI":"10.21437\/Interspeech.2017-950","article-title":"VoxCeleb: A Large-Scale Speaker Identification Dataset","author":"nagrani","year":"2017","journal-title":"in INTERSPEECH 2017"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2017.287"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413532"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00009"},{"key":"ref14","article-title":"First Order Motion Model for Image Animation","volume":"32","author":"siarohin","year":"2019","journal-title":"Advances in Neural Infor-Mation Processing Systems"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TIFS.2022.3146783"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3072959.3073640"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3072959.3073699"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58517-4_42"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00991"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"600","DOI":"10.1109\/TIP.2003.819861","article-title":"Image quality assess-ment: from error visibility to structural similarity","volume":"13","author":"wang","year":"2004","journal-title":"IEEE Transactions on Image Processing"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58577-8_25"},{"key":"ref27","article-title":"Others Deep face recognition","volume":"1","author":"omkar","year":"2015","journal-title":"BMVC"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58545-7_3"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00573"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/2897824.2925984"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01386"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-019-01150-y"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00802"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_24"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/2503385.2503473"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58610-2_31"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00416"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3414685.3417774"},{"key":"ref24","first-page":"2362","article-title":"Arbitrary Talking Face Generation via Attentional Audio-Visual Coherence Learning","author":"zhu","year":"2021","journal-title":"Proceedings of the Twenty-Ninth International Conference on International Joint Conferences on Artificial Intelligence"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3197517.3201292"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3478513.3480484"},{"key":"ref25","article-title":"Scene representation networks: Continuous 3d-structure-aware neural scene representations","volume":"32","author":"sitzmann","year":"2019","journal-title":"Advances in neural information processing systems"}],"event":{"name":"2022 IEEE 24th International Workshop on Multimedia Signal Processing (MMSP)","start":{"date-parts":[[2022,9,26]]},"location":"Shanghai, China","end":{"date-parts":[[2022,9,28]]}},"container-title":["2022 IEEE 24th International Workshop on Multimedia Signal Processing (MMSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9948698\/9948704\/09949293.pdf?arnumber=9949293","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,12]],"date-time":"2022-12-12T19:54:11Z","timestamp":1670874851000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9949293\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,9,26]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/mmsp55362.2022.9949293","relation":{},"subject":[],"published":{"date-parts":[[2022,9,26]]}}}