{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T06:59:45Z","timestamp":1762325985144},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,4,14]],"date-time":"2024-04-14T00:00:00Z","timestamp":1713052800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,4,14]],"date-time":"2024-04-14T00:00:00Z","timestamp":1713052800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,4,14]]},"DOI":"10.1109\/icasspw62465.2024.10627170","type":"proceedings-article","created":{"date-parts":[[2024,8,15]],"date-time":"2024-08-15T17:19:18Z","timestamp":1723742358000},"page":"444-448","source":"Crossref","is-referenced-by-count":1,"title":["A Cross-Talk Robust Multichannel VAD Model For Multiparty Agent Interactions Trained Using Synthetic Re-Recordings"],"prefix":"10.1109","author":[{"given":"Hyewon","family":"Han","sequence":"first","affiliation":[{"name":"Yonsei University,Dept. of Electrical and Electronic Engineering,Seoul,South Korea"}]},{"given":"Naveen","family":"Kumar","sequence":"additional","affiliation":[{"name":"Disney Research Imagineering,Los Angeles,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1017\/S0047404500001019"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746465"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-2800"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2003.1198793"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/11677482_3"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.21437\/chime.2020-1"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-1208"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2021.101317"},{"article-title":"End-to-end neural diarization: Reformulating speaker diarization as simple multi-label classification","year":"2020","author":"Fujita","key":"ref9"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9747343"},{"key":"ref11","first-page":"28492","article-title":"Robust speech recognition via large-scale weak supervision","volume-title":"International Conference on Machine Learning","author":"Radford"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/APSIPA.2017.8282048"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1238"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414470"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2010-771"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-200"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2020.3043115"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-11100"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053426"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178964"},{"key":"ref21","article-title":"Deep speech enhancement challenge at icassp 2023","author":"Dubey","year":"2023","journal-title":"ICASSP"},{"article-title":"Silero vad: pre-trained enterprise-grade voice activity detector (vad), number detector and language classifier","year":"2021","author":"Team","key":"ref22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2023-684"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.21437\/CHiME.2023-16"}],"event":{"name":"2024 IEEE International Conference on Acoustics, Speech, and Signal Processing Workshops (ICASSPW)","start":{"date-parts":[[2024,4,14]]},"location":"Seoul, Korea, Republic of","end":{"date-parts":[[2024,4,19]]}},"container-title":["2024 IEEE International Conference on Acoustics, Speech, and Signal Processing Workshops (ICASSPW)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10625769\/10625780\/10627170.pdf?arnumber=10627170","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,16]],"date-time":"2024-08-16T05:32:05Z","timestamp":1723786325000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10627170\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,14]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/icasspw62465.2024.10627170","relation":{},"subject":[],"published":{"date-parts":[[2024,4,14]]}}}