{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:14:27Z","timestamp":1750220067369,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":7,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,1,14]],"date-time":"2022-01-14T00:00:00Z","timestamp":1642118400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"?????????","award":["R21101H8"],"award-info":[{"award-number":["R21101H8"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,1,14]]},"DOI":"10.1145\/3517077.3517091","type":"proceedings-article","created":{"date-parts":[[2022,5,22]],"date-time":"2022-05-22T22:15:21Z","timestamp":1653257721000},"page":"86-92","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["A preliminary study of challenges in extracting purity videos from the AV Speech Benchmark"],"prefix":"10.1145","author":[{"given":"Haoran","family":"Yan","sequence":"first","affiliation":[{"name":"China Mobile (Suzhou) Software Technology Co. Ltd, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Huijun","family":"Lu","sequence":"additional","affiliation":[{"name":"China Mobile (Suzhou) Software Technology Co. Ltd, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dunbo","family":"Cai","sequence":"additional","affiliation":[{"name":"China Mobile (Suzhou) Software Technology Co. Ltd, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tao","family":"Hang","sequence":"additional","affiliation":[{"name":"China Mobile (Suzhou) Software Technology Co. Ltd, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ling","family":"Qian","sequence":"additional","affiliation":[{"name":"China Mobile (Suzhou) Software Technology Co. Ltd, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2022,5,22]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"crossref","unstructured":"Qian\u00a0Y \u00a0Weng\u00a0C \u00a0Chang\u00a0X \u00a0et\u00a0al.\u00a0Past\u00a0review \u00a0current\u00a0progress \u00a0and\u00a0challenges\u00a0ahead\u00a0on\u00a0the\u00a0cocktail\u00a0party\u00a0problem[J].\u00a0Frontiers\u00a0of\u00a0Information\u00a0Technology\u00a0&\u00a0Electronic\u00a0Engineering \u00a02018 \u00a019(1):\u00a040-63.  Qian\u00a0Y \u00a0Weng\u00a0C \u00a0Chang\u00a0X \u00a0et\u00a0al.\u00a0Past\u00a0review \u00a0current\u00a0progress \u00a0and\u00a0challenges\u00a0ahead\u00a0on\u00a0the\u00a0cocktail\u00a0party\u00a0problem[J].\u00a0Frontiers\u00a0of\u00a0Information\u00a0Technology\u00a0&\u00a0Electronic\u00a0Engineering \u00a02018 \u00a019(1):\u00a040-63.","DOI":"10.1631\/FITEE.1700814"},{"key":"e_1_3_2_1_2_1","volume-title":"Deep Audio-Visual Learning: A Survey[J]. arXiv preprint arXiv:2001.04758","author":"Zhu H","year":"2020","unstructured":"Zhu H , Luo M , Wang R , Deep Audio-Visual Learning: A Survey[J]. arXiv preprint arXiv:2001.04758 , 2020 . Zhu H, Luo M, Wang R, Deep Audio-Visual Learning: A Survey[J]. arXiv preprint arXiv:2001.04758, 2020."},{"key":"e_1_3_2_1_3_1","volume-title":"Looking to listen at the cocktail party: A speaker-independent audio-visual model for speech separation [J]. arXiv preprint arXiv:1804.03619","author":"Ephrat A","year":"2018","unstructured":"Ephrat A , Mosseri I , Lang O , Looking to listen at the cocktail party: A speaker-independent audio-visual model for speech separation [J]. arXiv preprint arXiv:1804.03619 , 2018 . Ephrat A, Mosseri I, Lang O, Looking to listen at the cocktail party: A speaker-independent audio-visual model for speech separation [J]. arXiv preprint arXiv:1804.03619, 2018."},{"volume-title":"Proc. Interspeech 2021","author":"Rigal R","key":"e_1_3_2_1_4_1","unstructured":"Rigal R , Chodorowski J , Zerr B. Deep Audio-Visual Speech Separation Based on Facial Motion}}[J] . Proc. Interspeech 2021 , 2021: 3540-3544. Rigal R, Chodorowski J, Zerr B. Deep Audio-Visual Speech Separation Based on Facial Motion}}[J]. Proc. Interspeech 2021, 2021: 3540-3544."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Owens A Efros A A. Audio-visual scene analysis with self-supervised multisensory features[C]\/\/Proceedings of the European Conference on Computer Vision (ECCV). 2018: 631-648.  Owens A Efros A A. Audio-visual scene analysis with self-supervised multisensory features[C]\/\/Proceedings of the European Conference on Computer Vision (ECCV). 2018: 631-648.","DOI":"10.1007\/978-3-030-01231-1_39"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"crossref","unstructured":"Zhao H Gan C Rouditchenko A The sound of pixels[C]\/\/Proceedings of the European conference on computer vision (ECCV). 2018: 570-586.  Zhao H Gan C Rouditchenko A The sound of pixels[C]\/\/Proceedings of the European conference on computer vision (ECCV). 2018: 570-586.","DOI":"10.1007\/978-3-030-01246-5_35"},{"key":"e_1_3_2_1_7_1","volume-title":"Joint face detection and facial expression recognition with MTCNN[C]\/\/2017 4th international conference on information science and control engineering (ICISCE)","author":"Xiang J","year":"2017","unstructured":"Xiang J , Zhu G. Joint face detection and facial expression recognition with MTCNN[C]\/\/2017 4th international conference on information science and control engineering (ICISCE) . IEEE , 2017 : 424-427. Xiang J, Zhu G. Joint face detection and facial expression recognition with MTCNN[C]\/\/2017 4th international conference on information science and control engineering (ICISCE). IEEE, 2017: 424-427."}],"event":{"name":"ICMIP 2022: 2022 7th International Conference on Multimedia and Image Processing","acronym":"ICMIP 2022","location":"Tianjin China"},"container-title":["2022 7th International Conference on Multimedia and Image Processing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3517077.3517091","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3517077.3517091","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T18:09:01Z","timestamp":1750183741000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3517077.3517091"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,1,14]]},"references-count":7,"alternative-id":["10.1145\/3517077.3517091","10.1145\/3517077"],"URL":"https:\/\/doi.org\/10.1145\/3517077.3517091","relation":{},"subject":[],"published":{"date-parts":[[2022,1,14]]},"assertion":[{"value":"2022-05-22","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}