{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T19:00:52Z","timestamp":1776884452896,"version":"3.51.2"},"reference-count":49,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2016,1,18]],"date-time":"2016-01-18T00:00:00Z","timestamp":1453075200000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["EURASIP J. Adv. Signal Process."],"published-print":{"date-parts":[[2016,12]]},"DOI":"10.1186\/s13634-016-0306-6","type":"journal-article","created":{"date-parts":[[2016,1,18]],"date-time":"2016-01-18T00:45:51Z","timestamp":1453077951000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":259,"title":["A summary of the REVERB challenge: state-of-the-art and remaining challenges in reverberant speech processing research"],"prefix":"10.1186","volume":"2016","author":[{"given":"Keisuke","family":"Kinoshita","sequence":"first","affiliation":[]},{"given":"Marc","family":"Delcroix","sequence":"additional","affiliation":[]},{"given":"Sharon","family":"Gannot","sequence":"additional","affiliation":[]},{"given":"Emanu\u00ebl A.","family":"P. Habets","sequence":"additional","affiliation":[]},{"given":"Reinhold","family":"Haeb-Umbach","sequence":"additional","affiliation":[]},{"given":"Walter","family":"Kellermann","sequence":"additional","affiliation":[]},{"given":"Volker","family":"Leutnant","sequence":"additional","affiliation":[]},{"given":"Roland","family":"Maas","sequence":"additional","affiliation":[]},{"given":"Tomohiro","family":"Nakatani","sequence":"additional","affiliation":[]},{"given":"Bhiksha","family":"Raj","sequence":"additional","affiliation":[]},{"given":"Armin","family":"Sehr","sequence":"additional","affiliation":[]},{"given":"Takuya","family":"Yoshioka","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,1,18]]},"reference":[{"key":"306_CR1","doi-asserted-by":"publisher","DOI":"10.1002\/9780470994443","volume-title":"Sound capture and processing","author":"I Tashev","year":"2009","unstructured":"I Tashev, Sound capture and processing (Wiley, New Jersey, 2009)."},{"key":"306_CR2","volume-title":"Spoken language processing: a guide to theory, algorithm and system development","author":"X Huang","year":"2001","unstructured":"X Huang, A Acero, H-W Hong, Spoken language processing: a guide to theory, algorithm and system development (Prentice Hall, New Jersey, 2001)."},{"key":"306_CR3","doi-asserted-by":"publisher","DOI":"10.1002\/9780470714089","volume-title":"Distant speech recognition","author":"M W\u00f6lfel","year":"2009","unstructured":"M W\u00f6lfel, J McDonough, Distant speech recognition (Wiley, New Jersey, 2009)."},{"key":"306_CR4","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-84996-056-4","volume-title":"Speech dereverberation","author":"PA Naylor","year":"2010","unstructured":"PA Naylor, ND Gaubitch, Speech dereverberation (Springer, Berlin, 2010)."},{"issue":"6","key":"306_CR5","doi-asserted-by":"publisher","first-page":"114","DOI":"10.1109\/MSP.2012.2205029","volume":"29","author":"T Yoshioka","year":"2012","unstructured":"T Yoshioka, A Sehr, M Delcroix, K Kinoshita, R Maas, T Nakatani, W Kellermann, Making machines understand us in reverberant rooms: robustness against reverberation for automatic speech recognition. IEEE Signal Process. Mag.29(6), 114\u2013126 (2012).","journal-title":"IEEE Signal Process. Mag."},{"key":"306_CR6","volume-title":"Proceedings of Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","author":"K Kinoshita","year":"2013","unstructured":"K Kinoshita, M Delcroix, T Yoshioka, T Nakatani, E Habets, R Haeb-Umbach, V Leutnant, A Sehr, W Kellermann, R Maas, BR S. Gannot, in Proceedings of Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA). The REVERB challenge: a common evaluation framework for dereverberation and recognition of reverberant speech, (2013)."},{"key":"306_CR7","unstructured":"REVERB Challenge Webpage. \n                    http:\/\/reverb2014.dereverberation.com\/\n                    \n                  . Accessed 13 Jan 2016."},{"key":"306_CR8","first-page":"29","volume-title":"Proceedings of International Conference on Spoken Language Processing (ICSLP)","author":"D Pearce","year":"2000","unstructured":"D Pearce, H-G Hirsch, in Proceedings of International Conference on Spoken Language Processing (ICSLP). The Aurora experimental framework for the performance evaluation of speech recognition systems under noisy conditions, (2000), pp. 29\u201332."},{"key":"306_CR9","doi-asserted-by":"publisher","first-page":"1928","DOI":"10.1016\/j.sigpro.2011.10.007","volume":"92","author":"E Vincent","year":"2012","unstructured":"E Vincent, S Araki, FJ Theis, G Nolte, P Bofill, H Sawada, A Ozerov, BV Gowreesunker, D Lutter, The signal separation evaluation campaign (2007\u20132010): achievements and remaining challenges. Signal Process.92:, 1928\u20131936 (2012).","journal-title":"Signal Process."},{"issue":"3","key":"306_CR10","doi-asserted-by":"publisher","first-page":"621","DOI":"10.1016\/j.csl.2012.10.004","volume":"27","author":"J Barker","year":"2013","unstructured":"J Barker, E Vincent, N Ma, C Christensen, P Green, The PASCAL CHiME speech separation and recognition challenge. Comput. Speech and Lang.27(3), 621\u2013633 (2013).","journal-title":"Comput. Speech and Lang."},{"key":"306_CR11","first-page":"81","volume-title":"Proceedings of International Conference on Acoustics, Speech and Signal Processing (ICASSP)","author":"T Robinson","year":"1995","unstructured":"T Robinson, J Fransen, D Pye, J Foote, S Renals, in Proceedings of International Conference on Acoustics, Speech and Signal Processing (ICASSP). WSJCAM0: A British English speech corpus for large vocabulary continuous speech recognition, (1995), pp. 81\u201384."},{"key":"306_CR12","first-page":"357","volume-title":"Proceedings of IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)","author":"M Lincoln","year":"2005","unstructured":"M Lincoln, I McCowan, J Vepa, HK Maganti, in Proceedings of IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU). The multi-channel Wall Street Journal audio visual corpus (MC-WSJ-AV): specification and initial experiments, (2005), pp. 357\u2013362."},{"issue":"1","key":"306_CR13","doi-asserted-by":"publisher","first-page":"229","DOI":"10.1109\/TASL.2007.911054","volume":"16","author":"Y Hu","year":"2008","unstructured":"Y Hu, PC Loizou, Evaluation of objective quality measures for speech enhancement. IEEE Trans. Audio, Speech, Lang. Process.16(1), 229\u2013238 (2008).","journal-title":"IEEE Trans. Audio, Speech, Lang. Process."},{"issue":"7","key":"306_CR14","doi-asserted-by":"publisher","first-page":"1766","DOI":"10.1109\/TASL.2010.2052247","volume":"18","author":"TH Falk","year":"2010","unstructured":"TH Falk, C Zheng, W-Y Chan, A non-intrusive quality and intelligibility measure of reverberant and dereverberated speech. IEEE Trans. Audio, Speech, Lang. Process.18(7), 1766\u20131774 (2010).","journal-title":"IEEE Trans. Audio, Speech, Lang. Process."},{"key":"306_CR15","unstructured":"ITU-T Recommendation P.862: Perceptual evaluation of speech quality (PESQ): an objective method for end-to-end speech quality assessment of narrow-band telephone networks and speech codecs."},{"key":"306_CR16","unstructured":"ITU-R Recommendation BS.1534: method for the subjective assessment of intermediate quality levels of coding systems."},{"key":"306_CR17","volume-title":"Proceedings of REVERB Challenge Workshop, p2.10","author":"MJ Alam","year":"2014","unstructured":"MJ Alam, V Gupta, P Kenny, P Dumouchel, in Proceedings of REVERB Challenge Workshop, p2.10. Use of multiple front-ends and I-vector-based speaker adaptation for robust speech recognition, (2014)."},{"key":"306_CR18","volume-title":"Proceedings of REVERB Challenge Workshop, o1.3","author":"RF Astudillo","year":"2014","unstructured":"RF Astudillo, S Braun, E Habets, in Proceedings of REVERB Challenge Workshop, o1.3. A multichannel feature compensation approach for robust ASR in noisy and reverberant environments, (2014)."},{"key":"306_CR19","volume-title":"Proceedings of REVERB Challenge Workshop, o1.2","author":"B Cauchi","year":"2014","unstructured":"B Cauchi, I Kodrasi, R Rehr, S Gerlach, A Juki\u0107, T Gerkmann, S Doclo, S Goetze, in Proceedings of REVERB Challenge Workshop, o1.2. Joint dereverberation and noise reduction using beamforming and a single-channel speech enhancement scheme, (2014)."},{"key":"306_CR20","volume-title":"Proceedings of REVERB Challenge Workshop, o2.3","author":"M Delcroix","year":"2014","unstructured":"M Delcroix, T Yoshioka, A Ogawa, Y Kubo, M Fujimoto, I Nobutaka, K Kinoshita, M Espi, T Hori, T Nakatani, A Nakamura, in Proceedings of REVERB Challenge Workshop, o2.3. Linear prediction-based dereverberation with advanced speech enhancement and recognition technologies for the REVERB challenge, (2014)."},{"key":"306_CR21","volume-title":"Proceedings of REVERB Challenge Workshop, p2.7","author":"N Epain","year":"2014","unstructured":"N Epain, T Noohi, C Jin, in Proceedings of REVERB Challenge Workshop, p2.7. Sparse recovery method for dereverberation, (2014)."},{"key":"306_CR22","volume-title":"Proceedings of REVERB Challenge Workshop, p1.9","author":"X Feng","year":"2014","unstructured":"X Feng, K Kumatani, J McDonough, in Proceedings of REVERB Challenge Workshop, p1.9. The CMU-MIT REVERB challenge 2014 system: description and results, (2014)."},{"key":"306_CR23","volume-title":"Proceedings of REVERB Challenge Workshop, p1.6","author":"JT Geiger","year":"2014","unstructured":"JT Geiger, E Marchi, BW Schuller, G Rigoll, in Proceedings of REVERB Challenge Workshop, p1.6. The TUM system for the REVERB challenge: recognition of reverberated speech using multi-channel correlation shaping dereverberation and blstm recurrent neural networks, (2014)."},{"key":"306_CR24","volume-title":"Proceedings of REVERB Challenge Workshop, p2.2","author":"DR Gonzalez","year":"2014","unstructured":"DR Gonzalez, SC Arias, JRC de Lara, in Proceedings of REVERB Challenge Workshop, p2.2. Single channel speech enhancement based on zero phase transformation in reverberated environments, (2014)."},{"key":"306_CR25","volume-title":"Proceedings of REVERB Challenge Workshop, p2.9","author":"H-G Hirsch","year":"2014","unstructured":"H-G Hirsch, in Proceedings of REVERB Challenge Workshop, p2.9. Extraction of robust features by combining noise reduction and FDLP for the recognition of noisy speech signals in hands-free mode, (2014)."},{"key":"306_CR26","volume-title":"Proceedings of REVERB Challenge Workshop, o2.1","author":"H Kallasjoki","year":"2014","unstructured":"H Kallasjoki, J Gemmeke, K Palom\u00e4ki, A Beeston, G Brown, in Proceedings of REVERB Challenge Workshop, o2.1. Recognition of reverberant speech by missing data imputation and NMF feature enhancement, (2014)."},{"key":"306_CR27","volume-title":"Proceedings of REVERB Challenge Workshop, p2.4","author":"K Kondo","year":"2014","unstructured":"K Kondo, in Proceedings of REVERB Challenge Workshop, p2.4. A computationally restrained and single-channel blind dereverberation method utilizing iterative spectral modifications, (2014)."},{"key":"306_CR28","volume-title":"Proceedings of REVERB Challenge Workshop, p2.11","author":"YR Leng","year":"2014","unstructured":"YR Leng, J Dennis, WZT Ng, TH Dat, in Proceedings of REVERB Challenge Workshop, p2.11. PBF-GSC beamforming for ASR and speech enhancement in reverberant environments, (2014)."},{"key":"306_CR29","volume-title":"Proceedings of REVERB Challenge Workshop, p2.3","author":"N L\u00f3pez","year":"2014","unstructured":"N L\u00f3pez, G Richard, Y Grenier, I Bourmeyster, in Proceedings of REVERB Challenge Workshop, p2.3. Reverberation suppression based on sparse linear prediction in noisy environments, (2014)."},{"key":"306_CR30","volume-title":"Proceedings of REVERB Challenge Workshop, p1.8","author":"M Mimura","year":"2014","unstructured":"M Mimura, S Sakai, T Kawahara, in Proceedings of REVERB Challenge Workshop, p1.8. Reverberant speech recognition combining deep neural networks and deep autoencoders, (2014)."},{"key":"306_CR31","volume-title":"Proceedings of REVERB Challenge Workshop, p2.5","author":"V Mitra","year":"2014","unstructured":"V Mitra, W Wang, Y Lei, A Kathol, G Sivaraman, C Espy-Wilson, in Proceedings of REVERB Challenge Workshop, p2.5. Robust features and system fusion for reverberation-robust speech recognition, (2014)."},{"key":"306_CR32","volume-title":"Proceedings of REVERB Challenge Workshop, p1.2","author":"M Moshirynia","year":"2014","unstructured":"M Moshirynia, F Razzazi, A Haghbin, in Proceedings of REVERB Challenge Workshop, p1.2. A speech dereverberation method using adaptive sparse dictionary learning, (2014)."},{"key":"306_CR33","volume-title":"Proceedings of REVERB Challenge Workshop, p1.5","author":"K Ohtani","year":"2014","unstructured":"K Ohtani, T Komatsu, T Nishino, K Takeda, in Proceedings of REVERB Challenge Workshop, p1.5. Adaptive dereverberation method based on complementary Wiener filter and modulation transfer function, (2014)."},{"key":"306_CR34","volume-title":"Proceedings of REVERB Challenge Workshop, p1.10","author":"K Palom\u00e4ki","year":"2014","unstructured":"K Palom\u00e4ki, in Proceedings of REVERB Challenge Workshop, p1.10. Reverberation robust speech recognition by matching distributions of spectrally and temporally decorrelated features, (2014)."},{"key":"306_CR35","volume-title":"Proceedings of REVERB Challenge Workshop, p1.4","author":"PP Parada","year":"2014","unstructured":"PP Parada, D Sharma, PA Naylor, T van Waterschoot, in Proceedings of REVERB Challenge Workshop, p1.4. Single-channel reverberant speech recognition using C50 estimation, (2014)."},{"key":"306_CR36","volume-title":"Proceedings of REVERB Challenge Workshop, p1.3","author":"Y Tachioka","year":"2014","unstructured":"Y Tachioka, T Narita, FJ Weninger, S Watanabe, in Proceedings of REVERB Challenge Workshop, p1.3. Dual system combination approach for various reverberant environments with dereverberation techniques, (2014)."},{"key":"306_CR37","volume-title":"Proceedings of REVERB Challenge Workshop, p1.7","author":"J Veras","year":"2014","unstructured":"J Veras, T Prego, A Lima, T Ferreira, S Netto, in Proceedings of REVERB Challenge Workshop, p1.7. Speech quality enhancement based on spectral subtraction, (2014)."},{"key":"306_CR38","volume-title":"Proceedings of REVERB Challenge Workshop, p2.1","author":"X Wang","year":"2014","unstructured":"X Wang, Y Guo, X Yang, Q Fu, Y Yan, in Proceedings of REVERB Challenge Workshop, p2.1. Acoustic scene aware dereverberation using 2-channel spectral enhancement for REVERB challenge, (2014)."},{"key":"306_CR39","volume-title":"Proceedings of REVERB Challenge Workshop, o1.1","author":"FJ Weninger","year":"2014","unstructured":"FJ Weninger, S Watanabe, J Le Roux, J Hershey, Y Tachioka, JT Geiger, BW Schuller, G Rigoll, in Proceedings of REVERB Challenge Workshop, o1.1. The MERL\/MELCO\/TUM system for the REVERB challenge using deep recurrent neural network feature enhancement, (2014)."},{"key":"306_CR40","volume-title":"Proceedings of REVERB Challenge Workshop, p1.11","author":"S Wisdom","year":"2014","unstructured":"S Wisdom, T Powers, L Atlas, J Pitton, in Proceedings of REVERB Challenge Workshop, p1.11. Enhancement of reverberant and noisy speech by extending its coherence, (2014)."},{"key":"306_CR41","volume-title":"Proceedings of REVERB Challenge Workshop, o2.2","author":"X Xiao","year":"2014","unstructured":"X Xiao, Z Shengkui, DHH Nguyen, Z Xionghu, D Jones, E-S Chng, H Li, in Proceedings of REVERB Challenge Workshop, o2.2. The NTU-ADSC systems for reverberation challenge 2014, (2014)."},{"key":"306_CR42","volume-title":"Proceedings of REVERB Challenge Workshop, p2.8","author":"F Xiong","year":"2014","unstructured":"F Xiong, N Moritz, R Rehr, J Anemueller, B Meyer, T Gerkmann, S Doclo, S Goetze, in Proceedings of REVERB Challenge Workshop, p2.8. Robust ASR in reverberant environments using temporal cepstrum smoothing for speech enhancement and an amplitude modulation filterbank for feature extraction, (2014)."},{"key":"306_CR43","volume-title":"Proceedings of REVERB Challenge Workshop, p2.6","author":"M Yu","year":"2014","unstructured":"M Yu, F Soong, in Proceedings of REVERB Challenge Workshop, p2.6. Speech dereverberation by constrained and regularized multi-channel spectral decomposition: evaluated on REVERB challenge, (2014)."},{"key":"306_CR44","first-page":"359","volume":"87","author":"K Lebart","year":"2001","unstructured":"K Lebart, JM Boucher, PN Denbigh, A new method based on spectral subtraction for speech de-reverberation. Acta Acoustica. 87:, 359\u2013366 (2001).","journal-title":"Acta Acoustica"},{"key":"306_CR45","first-page":"285","volume-title":"Proceedings of IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)","author":"P Swietojanski","year":"2013","unstructured":"P Swietojanski, A Ghoshal, S Renals, in Proceedings of IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU). Hybrid acoustic models for distant and multichannel large vocabulary speech recognition, (2013), pp. 285\u2013290."},{"key":"306_CR46","first-page":"7398","volume-title":"Proceedings of International Conference on Acoustics, Speech and Signal Processing (ICASSP)","author":"M Seltzer","year":"2013","unstructured":"M Seltzer, D Yu, Y Wang, in Proceedings of International Conference on Acoustics, Speech and Signal Processing (ICASSP). An investigation of deep neural networks for noise robust speech recognition, (2013), pp. 7398\u20137402."},{"key":"306_CR47","first-page":"501","volume-title":"Proceedings of International Conference on Acoustics, Speech and Signal Processing (ICASSP)","author":"T Zernicki","year":"2011","unstructured":"T Zernicki, M Bartkowiak, M Doma, in Proceedings of International Conference on Acoustics, Speech and Signal Processing (ICASSP). Enhanced coding of high-frequency tonal components in MPEG-D USAC through joint application of ESBR and sinusoidal modeling, (2011), pp. 501\u2013504."},{"key":"306_CR48","unstructured":"LDC Site for The Multi-channel Wall Street Journal Audio Visual Corpus (MC-WSJ-AV). \n                    https:\/\/catalog.ldc.upenn.edu\/LDC2014S03\n                    \n                  . Accessed 13 Jan 2016."},{"key":"306_CR49","unstructured":"LDC Site for WSJCAM0. \n                    https:\/\/catalog.ldc.upenn.edu\/LDC95S24\n                    \n                  . Accessed 13 Jan 2016."}],"container-title":["EURASIP Journal on Advances in Signal Processing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13634-016-0306-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13634-016-0306-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13634-016-0306-6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13634-016-0306-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,3,26]],"date-time":"2019-03-26T12:07:53Z","timestamp":1553602073000},"score":1,"resource":{"primary":{"URL":"https:\/\/asp-eurasipjournals.springeropen.com\/articles\/10.1186\/s13634-016-0306-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,1,18]]},"references-count":49,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2016,12]]}},"alternative-id":["306"],"URL":"https:\/\/doi.org\/10.1186\/s13634-016-0306-6","relation":{},"ISSN":["1687-6180"],"issn-type":[{"value":"1687-6180","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016,1,18]]},"article-number":"7"}}