{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,11]],"date-time":"2026-07-11T22:06:47Z","timestamp":1783807607503,"version":"3.55.0"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,10,1]],"date-time":"2019-10-01T00:00:00Z","timestamp":1569888000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,10,1]],"date-time":"2019-10-01T00:00:00Z","timestamp":1569888000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,10,1]],"date-time":"2019-10-01T00:00:00Z","timestamp":1569888000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,10]]},"DOI":"10.1109\/waspaa.2019.8937253","type":"proceedings-article","created":{"date-parts":[[2019,12,24]],"date-time":"2019-12-24T06:50:13Z","timestamp":1577170213000},"page":"175-179","source":"Crossref","is-referenced-by-count":141,"title":["Universal Sound Separation"],"prefix":"10.1109","author":[{"given":"Ilya","family":"Kavalerov","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Scott","family":"Wisdom","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Hakan","family":"Erdogan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Brian","family":"Patton","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kevin","family":"Wilson","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jonathan","family":"Le Roux","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"John R.","family":"Hershey","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref32","article-title":"Explicit consistency constraints for STFT spectrograms and their application to phase reconstruction","author":"le roux","year":"2008","journal-title":"Proc SAPA"},{"key":"ref31","article-title":"Adam: A method for stochastic op-timization","author":"kingma","year":"2014","journal-title":"arXiv preprint arXiv 1412 6980"},{"key":"ref30","article-title":"TensorFlow: Large-scale machine learning on heterogeneous systems","year":"2015"},{"key":"ref10","article-title":"Supervised Speech Separation Based on Deep Learning: An Overview","author":"wang","year":"2017","journal-title":"arXiv preprint arXiv 1708 02562"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462507"},{"key":"ref12","article-title":"SDR &#x2013; half-baked or well done&#x0192;","author":"le roux","year":"2019","journal-title":"Proc ICASSP"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6853860"},{"key":"ref14","article-title":"Tasnet: Surpassing ideal time-frequency masking for speech separation","author":"luo","year":"2018","journal-title":"arXiv preprint arXiv 1809 07454"},{"key":"ref15","article-title":"Singing voice separation with deep U-Net convolutional networks","author":"jansson","year":"2017","journal-title":"Proc ISMIR"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461671"},{"key":"ref17","article-title":"Combining fully convolutional and recurrent neural networks for single channel audio source separation","author":"grais","year":"2018","journal-title":"Proc AES"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462448"},{"key":"ref19","article-title":"MMDenseL-STM: An efficient combination of convolutional and recurrent neural networks for audio source separation","author":"takahashi","year":"2018","journal-title":"n arXiv preprint arXiv 1805 02410"},{"key":"ref28","year":"0"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178061"},{"key":"ref27","article-title":"Fixup initialization: Residual learning without normalization","author":"zhang","year":"2019","journal-title":"arXiv preprint arXiv 1901 04217"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2013.2291240"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7471631"},{"key":"ref29","year":"0","journal-title":"Universal Sound Separation project webpage"},{"key":"ref5","article-title":"Speech enhancement with LSTM recurrent neural networks and its application to noise-robust ASR","author":"weninger","year":"2015","journal-title":"Proc LVA\/ICA"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7952154"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2016-1176"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/GlobalSIP.2014.7032183"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2017.2726762"},{"key":"ref1","article-title":"Speech enhancement based on deep denoising autoencoder","author":"lu","year":"2013","journal-title":"Proc Inter-speech"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/GlobalSIP.2017.8309164"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6637622"},{"key":"ref21","article-title":"Monoaural audio source separation using deep convolutional neural networks","author":"chandna","year":"2017","journal-title":"Proc LVA\/ICA"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7952118"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2018.2795749"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8682783"},{"key":"ref25","article-title":"Exploring trade-offs in models for low-latency speech enhancement","author":"wilson","year":"2018","journal-title":"Proc IWAENC"}],"event":{"name":"2019 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","location":"New Paltz, NY, USA","start":{"date-parts":[[2019,10,20]]},"end":{"date-parts":[[2019,10,23]]}},"container-title":["2019 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8932990\/8937073\/08937253.pdf?arnumber=8937253","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,15]],"date-time":"2022-07-15T03:10:20Z","timestamp":1657854620000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8937253\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,10]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/waspaa.2019.8937253","relation":{},"subject":[],"published":{"date-parts":[[2019,10]]}}}