{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T11:13:42Z","timestamp":1725880422514},"publisher-location":"Cham","reference-count":22,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319535463"},{"type":"electronic","value":"9783319535470"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-53547-0_23","type":"book-chapter","created":{"date-parts":[[2017,2,14]],"date-time":"2017-02-14T09:54:19Z","timestamp":1487066059000},"page":"236-246","source":"Crossref","is-referenced-by-count":7,"title":["Discriminative Enhancement for Single Channel Audio Source Separation Using Deep Neural Networks"],"prefix":"10.1007","author":[{"given":"Emad M.","family":"Grais","sequence":"first","affiliation":[]},{"given":"Gerard","family":"Roma","sequence":"additional","affiliation":[]},{"given":"Andrew J. R.","family":"Simpson","sequence":"additional","affiliation":[]},{"given":"Mark D.","family":"Plumbley","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,2,15]]},"reference":[{"key":"23_CR1","doi-asserted-by":"crossref","unstructured":"Bergstra, J., Breuleux, O., Bastien, F., Lamblin, P., Pascanu, R., Desjardins, G., Turian, J., Warde-Farley, D., Bengio, Y.: Theano: a CPU and GPU math expression compiler. In: Proceedings of the Python for Scientific Computing Conference (SciPy) (2010)","DOI":"10.25080\/Majora-92bf1922-003"},{"key":"23_CR2","doi-asserted-by":"crossref","unstructured":"Erdogan, H., Hershey, J., Watanabe, S., Roux, J.L.: Phase-sensitive and recognition-boosted speech separation using deep recurrent neural networks. In: Proceedings of the ICASSP, pp. 708\u2013712 (2015)","DOI":"10.1109\/ICASSP.2015.7178061"},{"key":"23_CR3","doi-asserted-by":"crossref","unstructured":"Grais, E.M., Erdogan, H.: Hidden Markov models as priors for regularized nonnegative matrix factorization in single-channel source separation. In: Proceedings of the InterSpeech (2012)","DOI":"10.21437\/Interspeech.2012-433"},{"key":"23_CR4","doi-asserted-by":"crossref","unstructured":"Grais, E.M., Erdogan, H.: Spectro-temporal post-enhancement using MMSE estimation in NMF based single-channel source separation. In: Proceedings of the InterSpeech (2013)","DOI":"10.21437\/Interspeech.2013-726"},{"key":"23_CR5","doi-asserted-by":"crossref","unstructured":"Grais, E.M., Sen, M.U., Erdogan, H.: Deep neural networks for single channel source separation. In: Proceedings of the ICASSP, pp. 3734\u20133738 (2014)","DOI":"10.1109\/ICASSP.2014.6854299"},{"key":"23_CR6","unstructured":"Huang, P.S., Kim, M., Hasegawa-Johnson, M., Smaragdis, P.: Singing-Voice separation from monaural recordings using deep recurrent neural networks. In: Proceedings of the ISMIR, pp. 477\u2013482 (2014)"},{"issue":"12","key":"23_CR7","doi-asserted-by":"crossref","first-page":"2136","DOI":"10.1109\/TASLP.2015.2468583","volume":"23","author":"PS Huang","year":"2015","unstructured":"Huang, P.S., Kim, M., Hasegawa-Johnson, M., Smaragdis, P.: Joint optimization of masks and deep recurrent neural networks for monaural source separation. IEEE\/ACM Trans. Audio Speech Lang. Process. 23(12), 2136\u20132147 (2015)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"23_CR8","first-page":"556","volume":"13","author":"DD Lee","year":"2001","unstructured":"Lee, D.D., Seung, H.S.: Algorithms for non-negative matrix factorization. Adv. Neural Inf. Process. Syst. (NIPS) 13, 556\u2013562 (2001)","journal-title":"Adv. Neural Inf. Process. Syst. (NIPS)"},{"key":"23_CR9","doi-asserted-by":"crossref","unstructured":"Narayanan, A., Wang, D.: Ideal ratio mask estimation using deep neural networks for robust speech recognition. In: Proceedings of the ICASSP, pp. 7092\u20137096 (2013)","DOI":"10.1109\/ICASSP.2013.6639038"},{"issue":"9","key":"23_CR10","doi-asserted-by":"crossref","first-page":"1652","DOI":"10.1109\/TASLP.2016.2580946","volume":"24","author":"AA Nugraha","year":"2016","unstructured":"Nugraha, A.A., Liutkus, A., Vincent, E.: Multichannel audio source separation with deep neural networks. IEEE\/ACM Trans. Audio Speech Lang. Process. 24(9), 1652\u20131664 (2016)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"23_CR11","doi-asserted-by":"crossref","unstructured":"Ono, N., Rafii, Z., Kitamura, D., Ito, N., Liutkus, A.: The 2015 signal separation evaluation campaign. In: Proceedings of the LVA\/ICA, pp. 387\u2013395 (2015)","DOI":"10.1007\/978-3-319-22482-4_45"},{"key":"23_CR12","doi-asserted-by":"crossref","unstructured":"Ozerov, A., Fevotte, C., Charbit, M.: Factorial scaled hidden Markov model for polyphonic audio representation and source separation. In: Proceedings of the WASPAA, pp. 121\u2013124 (2009)","DOI":"10.1109\/ASPAA.2009.5346527"},{"key":"23_CR13","doi-asserted-by":"crossref","unstructured":"Simpson, A.J.R., Roma, G., Grais, E.M., Mason, R., Hummersone, C., Liutkus, A., Plumbley, M.D.: Evaluation of audio source separation models using hypothesis-driven non-parametric statistical methods. In: Proceedings of the EUSIPCO (2016)","DOI":"10.1109\/EUSIPCO.2016.7760551"},{"key":"23_CR14","doi-asserted-by":"crossref","unstructured":"Simpson, A.J.R., Roma, G., Plumbley, M.D.: Deep Karaoke: extracting vocals from musical mixtures using a convolutional deep neural network. In: Proceedings of the LVA\/ICA, pp. 429\u2013436 (2015)","DOI":"10.1007\/978-3-319-22482-4_50"},{"issue":"4","key":"23_CR15","doi-asserted-by":"crossref","first-page":"1462","DOI":"10.1109\/TSA.2005.858005","volume":"14","author":"E Vincent","year":"2006","unstructured":"Vincent, E., Gribonval, R., Fevotte, C.: Performance measurement in blind audio source separation. IEEE Trans. Audio Speech Lang. Process. 14(4), 1462\u20131469 (2006)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"23_CR16","first-page":"3371","volume":"11","author":"P Vincent","year":"2010","unstructured":"Vincent, P., Larochelle, H., Lajoie, I., Bengio, Y., Manzagol, P.A.: Stacked denoising autoencoders: learning useful representations in a deep network with a local denoising criterion. J. Mach. Learn. Res. 11, 3371\u20133408 (2010)","journal-title":"J. Mach. Learn. Res."},{"key":"23_CR17","doi-asserted-by":"crossref","first-page":"1066","DOI":"10.1109\/TASL.2006.885253","volume":"15","author":"T Virtanen","year":"2007","unstructured":"Virtanen, T.: Monaural sound source separation by non-negative matrix factorization with temporal continuity and sparseness criteria. IEEE Trans. Audio Speech Lang. Process. 15, 1066\u20131074 (2007)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"23_CR18","doi-asserted-by":"crossref","unstructured":"Weninger, F., Hershey, J.R., Roux, J.L., Schuller, B.: Discriminatively trained recurrent neural networks for single-channel speech separation. In: Proceedings of the GlobalSIP, pp. 577\u2013581 (2014)","DOI":"10.1109\/GlobalSIP.2014.7032183"},{"issue":"6","key":"23_CR19","doi-asserted-by":"crossref","first-page":"80","DOI":"10.2307\/3001968","volume":"1","author":"F Wilcoxon","year":"1945","unstructured":"Wilcoxon, F.: Individual comparisons by ranking methods. Biometrics Bull. 1(6), 80\u201383 (1945)","journal-title":"Biometrics Bull."},{"key":"23_CR20","doi-asserted-by":"crossref","unstructured":"Williamson, D., Wang, Y., Wang, D.: A two-stage approach for improving the perceptual quality of separated speech. In: Proceedings of the ICASSP, pp. 7034\u20137038 (2014)","DOI":"10.1109\/ICASSP.2014.6854964"},{"key":"23_CR21","unstructured":"Xie, J., Xu, L., Chen, E.: Image denoising and inpainting with deep neural networks. In: Advances in Neural Information Processing Systems (NIPS) (2012)"},{"key":"23_CR22","doi-asserted-by":"crossref","DOI":"10.1002\/9780470316672","volume-title":"Multiple Comparison Procedures","author":"Y Hochberg","year":"1987","unstructured":"Hochberg, Y., Tamhane, A.C.: Multiple Comparison Procedures. Wiley, New York (1987)"}],"container-title":["Lecture Notes in Computer Science","Latent Variable Analysis and Signal Separation"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-53547-0_23","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,24]],"date-time":"2022-07-24T03:21:55Z","timestamp":1658632915000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-53547-0_23"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9783319535463","9783319535470"],"references-count":22,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-53547-0_23","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2017]]}}}