{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,7]],"date-time":"2024-09-07T19:30:30Z","timestamp":1725737430710},"reference-count":43,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,9,26]],"date-time":"2022-09-26T00:00:00Z","timestamp":1664150400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,9,26]],"date-time":"2022-09-26T00:00:00Z","timestamp":1664150400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,9,26]]},"DOI":"10.1109\/mmsp55362.2022.9949148","type":"proceedings-article","created":{"date-parts":[[2022,11,22]],"date-time":"2022-11-22T21:39:16Z","timestamp":1669153156000},"page":"1-6","source":"Crossref","is-referenced-by-count":1,"title":["Subjective Evaluation of Deep Neural Network Based Speech Enhancement Systems in Real-World Conditions"],"prefix":"10.1109","author":[{"given":"Gaurav","family":"Naithani","sequence":"first","affiliation":[{"name":"Tampere University,Audio Research Group,Tampere,Finland"}]},{"given":"Kirsi","family":"Pietila","sequence":"additional","affiliation":[{"name":"Huawei Tampere,Wireless Headset Audio Lab,Tampere,Finland"}]},{"given":"Riitta","family":"Niemisto","sequence":"additional","affiliation":[{"name":"Huawei Tampere,Wireless Headset Audio Lab,Tampere,Finland"}]},{"given":"Erkki","family":"Paajanen","sequence":"additional","affiliation":[{"name":"Huawei Tampere,Wireless Headset Audio Lab,Tampere,Finland"}]},{"given":"Tero","family":"Takala","sequence":"additional","affiliation":[{"name":"Huawei Tampere,Wireless Headset Audio Lab,Tampere,Finland"}]},{"given":"Tuomas","family":"Virtanen","sequence":"additional","affiliation":[{"name":"Tampere University,Audio Research Group,Tampere,Finland"}]}],"member":"263","reference":[{"key":"ref39","article-title":"Automatic differentiation in PyTorch","author":"paszke","year":"0","journal-title":"NIPS Autodiff Workshop"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.25080\/Majora-7b98e3ed-003"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.195"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2017.8169997"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-53547-0_25"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054563"},{"key":"ref37","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"2014","journal-title":"Proc International Conference on Learning Representations"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/89.928915"},{"key":"ref35","first-page":"1182","article-title":"Spectral subtraction based on minimum statistics","author":"martin","year":"1994","journal-title":"Proc Euro Signal Processing Conf (EUSIPCO)"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1984.1164453"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.851927"},{"journal-title":"ITU-R BS 2399 - Recommendation of the International Telecommunication Union Methods for selecting and describing attributes and terms in preparation of subjective tests","year":"2017","key":"ref40"},{"journal-title":"Handbook on Array Processing and Sensor Networks","year":"2015","author":"haykin","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1016\/S0165-1684(01)00128-1"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2409"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1121\/1.5119226"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2018.2882738"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1163\/000579511X605759"},{"key":"ref17","article-title":"The INTER-SPEECH 2020 deep noise suppression challenge: Datasets, subjective testing framework, and challenge results","author":"reddy","year":"2020","journal-title":"ISCA INTERSPEECH"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9415105"},{"key":"ref19","first-page":"679","article-title":"INTERSPEECH 2021 ConferencingSpeech challenge: Towards far-field multi-channel speech enhancement for video conferencing","author":"rao","year":"2021","journal-title":"Proc IEEE Workshop Automatic Speech Recognition and Understanding (ASRU)"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.23919\/EUSIPCO54536.2021.9616165"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-1428"},{"key":"ref27","first-page":"222","article-title":"A low delay, variable resolution, perfect reconstruction spectral analysis-synthesis system for speech enhancement","author":"mauler","year":"2007","journal-title":"15th European Signal Processing Conference (EUSIPCO)"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2013-130"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414177"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2013.2291240"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2537"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21236\/ADA073139"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1979.1163209"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2014.2364452"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1002\/9781119279860"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TASSP.1985.1164550"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA52581.2021.9632771"},{"key":"ref22","article-title":"Empirical evaluation of gated recurrent neural networks on sequence modeling","author":"chung","year":"2014","journal-title":"NIPS Workshop on Deep Learning"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2021.3082282"},{"key":"ref24","article-title":"Phase-aware speech enhancement with deep complex U-Net","author":"choi","year":"2018","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2010.5495701"},{"key":"ref23","first-page":"234","article-title":"U-Net: Convolutional networks for biomedical image segmentation","author":"ronneberger","year":"2015","journal-title":"International Conference on Medical Image Computing and Computer-Assisted Intervention (MIC-CAI)"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.858005"},{"journal-title":"ITU-T P 835 - Recommendation of the International Telecommunication Union Subjective test methodology for evaluating speech communication systems that include noise suppression algorithm","year":"2003","key":"ref26"},{"journal-title":"ITU-T P 800 - Recommendation of the International Telecommunication Union Methods for subjective determination of transmission quality","year":"1996","key":"ref25"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2001.941023"}],"event":{"name":"2022 IEEE 24th International Workshop on Multimedia Signal Processing (MMSP)","start":{"date-parts":[[2022,9,26]]},"location":"Shanghai, China","end":{"date-parts":[[2022,9,28]]}},"container-title":["2022 IEEE 24th International Workshop on Multimedia Signal Processing (MMSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9948698\/9948704\/09949148.pdf?arnumber=9949148","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,12]],"date-time":"2022-12-12T19:54:21Z","timestamp":1670874861000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9949148\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,9,26]]},"references-count":43,"URL":"https:\/\/doi.org\/10.1109\/mmsp55362.2022.9949148","relation":{},"subject":[],"published":{"date-parts":[[2022,9,26]]}}}