{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,6]],"date-time":"2025-08-06T12:12:08Z","timestamp":1754482328009,"version":"3.28.0"},"reference-count":38,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,6,6]]},"DOI":"10.1109\/icassp39728.2021.9414856","type":"proceedings-article","created":{"date-parts":[[2021,5,13]],"date-time":"2021-05-13T19:53:45Z","timestamp":1620935625000},"page":"2280-2284","source":"Crossref","is-referenced-by-count":2,"title":["SeeHear: Signer Diarisation and a New Dataset"],"prefix":"10.1109","author":[{"given":"Samuel","family":"Albanie","sequence":"first","affiliation":[]},{"given":"Gul","family":"Varol","sequence":"additional","affiliation":[]},{"given":"Liliane","family":"Momeni","sequence":"additional","affiliation":[]},{"given":"Triantafyllos","family":"Afouras","sequence":"additional","affiliation":[]},{"given":"Andrew","family":"Brown","sequence":"additional","affiliation":[]},{"given":"Chuhan","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Ernesto","family":"Coto","sequence":"additional","affiliation":[]},{"given":"Necati Cihan","family":"Camgoz","sequence":"additional","affiliation":[]},{"given":"Ben","family":"Saunders","sequence":"additional","affiliation":[]},{"given":"Abhishek","family":"Dutta","sequence":"additional","affiliation":[]},{"given":"Neil","family":"Fox","sequence":"additional","affiliation":[]},{"given":"Richard","family":"Bowden","sequence":"additional","affiliation":[]},{"given":"Bencie","family":"Woll","sequence":"additional","affiliation":[]},{"given":"Andrew","family":"Zisserman","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58517-4_4"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781139167048"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01225-0_32"},{"key":"ref31","article-title":"Building the British sign language corpus","volume":"7","author":"schembri","year":"2013","journal-title":"Journal of Language Documentation and Conservation"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1268"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.596"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1044\/jslhr.4101.200"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1044\/jshr.3805.1014"},{"year":"0","key":"ref34","article-title":"Library archives"},{"key":"ref10","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v32i1.12269","article-title":"Pixellink: Detecting scene text via instance segmentation","author":"deng","year":"2018","journal-title":"AAAI"},{"key":"ref11","article-title":"Retinaface: Single-stage dense face localisation in the wild","author":"deng","year":"2019","journal-title":"ArXiv"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3343031.3350535"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W17-4414"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6853855"},{"key":"ref15","article-title":"Automatic signer diarization-the mover is the signer approach","author":"gebrekidan gebre","year":"2013","journal-title":"cvprw"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638947"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46487-9_6"},{"key":"ref18","article-title":"Mobilenets: Efficient convolutional neural networks for mobile vision applications","author":"howard","year":"2017","journal-title":"arXiv 1704 04861"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2913372"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW50498.2020.00525"},{"year":"2017","key":"ref4","article-title":"The Difference between BSL & SSE"},{"key":"ref27","article-title":"Facebook FAIR&#x2019;s WMT19 news translation task submission","author":"ng","year":"2019","journal-title":"Proceedings of the Fourth Conference on Machine Translation"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3308561.3353774"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/FG.2018.00020"},{"key":"ref29","article-title":"Yolov3: An incremental improvement","author":"redmon","year":"2018","journal-title":"arXiv 1804 02767"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00812"},{"key":"ref8","article-title":"Out of time: automated lip sync in the wild","author":"chung","year":"2016","journal-title":"ACCV Workshops"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683257"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1111\/1467-9481.00162"},{"key":"ref1","article-title":"BSL-1K: Scaling up co-articulated sign language recognition using mouthing cues","author":"albanie","year":"2020","journal-title":"ECCV"},{"key":"ref20","article-title":"Quantitative survey of the state of the art in sign language recognition","author":"koller","year":"2020","journal-title":"arXiv 2008 09918"},{"key":"ref22","article-title":"Microsoft COCO: Common objects in context","author":"lin","year":"2014","journal-title":"ECCV"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2015.09.013"},{"key":"ref24","article-title":"Seeing wake words: Audio-visual keyword spotting","author":"momeni","year":"2020","journal-title":"BMVC"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01228-1_27"},{"key":"ref26","article-title":"Real-Time Sign Language Detection using Human Pose Estimation","author":"moryossef","year":"2020","journal-title":"ECCVW Sign Language Recognition Translation and Production (SLRTP)"},{"key":"ref25","article-title":"Watch, read and lookup: learning to spot signs from multiple supervisors","author":"momeni","year":"2020","journal-title":"ACCV"}],"event":{"name":"ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2021,6,6]]},"location":"Toronto, ON, Canada","end":{"date-parts":[[2021,6,11]]}},"container-title":["ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9413349\/9413350\/09414856.pdf?arnumber=9414856","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,27]],"date-time":"2022-12-27T08:27:12Z","timestamp":1672129632000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9414856\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6,6]]},"references-count":38,"URL":"https:\/\/doi.org\/10.1109\/icassp39728.2021.9414856","relation":{},"subject":[],"published":{"date-parts":[[2021,6,6]]}}}