{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,23]],"date-time":"2026-01-23T07:26:08Z","timestamp":1769153168187,"version":"3.49.0"},"reference-count":31,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,1,19]]},"DOI":"10.1109\/slt48900.2021.9383492","type":"proceedings-article","created":{"date-parts":[[2021,3,25]],"date-time":"2021-03-25T20:46:54Z","timestamp":1616705214000},"page":"104-110","source":"Crossref","is-referenced-by-count":6,"title":["Multi-Channel Automatic Speech Recognition Using Deep Complex Unet"],"prefix":"10.1109","author":[{"given":"Yuxiang","family":"Kong","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jian","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Quandong","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Peng","family":"Gao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Weiji","family":"Zhuang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yujun","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lei","family":"Xie","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1423"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2015.2512042"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/HSCMA.2008.4538698"},{"key":"ref11","volume":"1","author":"benesty","year":"2008","journal-title":"Microphone Array Signal Processing"},{"key":"ref12","author":"benesty","year":"2007","journal-title":"Springer Handbook of Speech Processing"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472778"},{"key":"ref14","article-title":"Frequency domain multi-channel acoustic modeling for distant speech recognition","author":"wu","year":"2019","journal-title":"2019 IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP)"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7953173"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462372"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2018.8639547"},{"key":"ref18","article-title":"Multi-task learning for speech recognition: an overview","author":"pironkov","year":"2016","journal-title":"European Symposium on Artificial Neural Networks (ESANN)"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178925"},{"key":"ref28","article-title":"Phase-aware speech enhancement with deep complex u-net","author":"choi","year":"2018","journal-title":"International Conference on Learning Representations"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472621"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2537"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/1143844.1143891"},{"key":"ref6","author":"brandstein","year":"2013","journal-title":"Microphone Arrays Signal Processing Techniques and Applications"},{"key":"ref29","first-page":"234","article-title":"U-net: Convolutional networks for biomedical image segmentation","author":"ronneberger","year":"2015","journal-title":"International Conference on Medical Image Computing and Computer-Assisted Intervention (MICCAI)"},{"key":"ref5","first-page":"5998","article-title":"Attention is all you need","author":"vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2017.2672401"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2163395"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461809"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/HSCMA.2008.4538699"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-595"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-805"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2078"},{"key":"ref21","article-title":"Speech enhancement and recognition using multi-task learning of long short-term memory re-current neural networks","author":"chen","year":"2015","journal-title":"Sixteenth Annual Conference of the International Speech Communication Association (INTERSPEECH)"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003983"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2019.2913512"},{"key":"ref26","article-title":"PHASEN: A phase-and-harmonicsaware speech enhancement network","author":"yin","year":"2019"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2019.2955276"}],"event":{"name":"2021 IEEE Spoken Language Technology Workshop (SLT)","location":"Shenzhen, China","start":{"date-parts":[[2021,1,19]]},"end":{"date-parts":[[2021,1,22]]}},"container-title":["2021 IEEE Spoken Language Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9383468\/9383452\/09383492.pdf?arnumber=9383492","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,6,8]],"date-time":"2021-06-08T18:52:17Z","timestamp":1623178337000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9383492\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,19]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/slt48900.2021.9383492","relation":{},"subject":[],"published":{"date-parts":[[2021,1,19]]}}}