{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T19:58:43Z","timestamp":1766087923396,"version":"3.37.3"},"reference-count":33,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2022,8,30]],"date-time":"2022-08-30T00:00:00Z","timestamp":1661817600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,8,30]],"date-time":"2022-08-30T00:00:00Z","timestamp":1661817600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["6216104"],"award-info":[{"award-number":["6216104"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004763","name":"Natural Science Foundation of Inner Mongolia","doi-asserted-by":"publisher","award":["2021MS06030"],"award-info":[{"award-number":["2021MS06030"]}],"id":[{"id":"10.13039\/501100004763","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100013147","name":"Research Program of Science and Technology at Universities of Inner Mongolia Autonomous Region","doi-asserted-by":"publisher","award":["2021GG0023"],"award-info":[{"award-number":["2021GG0023"]}],"id":[{"id":"10.13039\/501100013147","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Supported By Program for Young Talents of Science and Technology in Universities of Inner Mongolia Autonomous Region","award":["NYJT22056"],"award-info":[{"award-number":["NYJT22056"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Circuits Syst Signal Process"],"published-print":{"date-parts":[[2023,3]]},"DOI":"10.1007\/s00034-022-02155-8","type":"journal-article","created":{"date-parts":[[2022,8,30]],"date-time":"2022-08-30T06:03:39Z","timestamp":1661839419000},"page":"1834-1847","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Speech Enhancement of Complex Convolutional Recurrent Network with Attention"],"prefix":"10.1007","volume":"42","author":[{"given":"Jiangjiao","family":"Zeng","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5587-3744","authenticated-orcid":false,"given":"Lidong","family":"Yang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,8,30]]},"reference":[{"key":"2155_CR1","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1109\/72.279181","volume":"5","author":"Y Bengio","year":"1994","unstructured":"Y. Bengio, P. Simard, P. Frasconi, Learning long-term dependencies with gradient descent is difficult. IEEE Trans. Neural Netw. 5, 157\u2013166 (1994)","journal-title":"IEEE Trans. Neural Netw."},{"key":"2155_CR2","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1109\/TASSP.1979.1163209","volume":"27","author":"S Boll","year":"1979","unstructured":"S. Boll, Suppression of acoustic noise in speech using spectral subtraction. IEEE Trans. Acoust. Speech Signal Process. 27, 113\u2013120 (1979)","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"2155_CR3","unstructured":"J. Cao, et al. Do-conv: depthwise over-parameterized convolutional layer. arXiv preprint arXiv:2006.12030 (2020)"},{"key":"2155_CR4","doi-asserted-by":"crossref","unstructured":"K. Cho, B. Van Merri\u00ebnboer, D. Bahdanau, Y. Bengio, On the properties of neural machine translation: encoder-decoder approaches. arXiv preprint arXiv:1409.1259 (2014)","DOI":"10.3115\/v1\/W14-4012"},{"key":"2155_CR5","doi-asserted-by":"publisher","first-page":"2403","DOI":"10.1016\/S0165-1684(01)00128-1","volume":"81","author":"I Cohen","year":"2001","unstructured":"I. Cohen, B. Berdugo, Speech enhancement for non-stationary noise environments. Signal Process. 81, 2403\u20132418 (2001)","journal-title":"Signal Process."},{"key":"2155_CR6","doi-asserted-by":"publisher","first-page":"1109","DOI":"10.1109\/TASSP.1984.1164453","volume":"32","author":"Y Ephraim","year":"1984","unstructured":"Y. Ephraim, D. Malah, Speech enhancement using a minimum-mean square error short-time spectral amplitude estimator. IEEE Trans. Acoust. Speech Signal Process. 32, 1109\u20131121 (1984)","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"issue":"8","key":"2155_CR7","doi-asserted-by":"publisher","first-page":"799","DOI":"10.1109\/89.966083","volume":"9","author":"H Gustafsson","year":"2001","unstructured":"H. Gustafsson, S.E. Nordholm, I. Claesson, Spectral subtraction using reduced delay convolution and adaptive averaging. IEEE Trans. Speech Audio Process. 9(8), 799\u2013807 (2001)","journal-title":"IEEE Trans. Speech Audio Process."},{"key":"2155_CR8","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"S. Hochreiter, S. Schmidhuber, Long short-term memory. Neural Comput. 9, 1735\u20131780 (1997)","journal-title":"Neural Comput."},{"key":"2155_CR9","doi-asserted-by":"crossref","unstructured":"Y. Hu, et al. DCCRN: Deep complex convolution recurrent network for phase-aware speech enhancement. arXiv preprint arXiv:2008.00264 (2020)","DOI":"10.21437\/Interspeech.2020-2537"},{"key":"2155_CR10","doi-asserted-by":"publisher","first-page":"229","DOI":"10.1109\/TASL.2007.911054","volume":"16","author":"Y Hu","year":"2007","unstructured":"Y. Hu, P.C. Loizou, Evaluation of objective quality measures for speech enhancement. IEEE Trans. Audio Speech Lang. Process. 16, 229\u2013238 (2007)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"2155_CR11","unstructured":"ITU, R. I.-T. P. 862.2: wideband extension to recommendation P. 862 for the assessment of wideband telephone networks and speech codecs. ITU-Telecommunication Standardization Sector (2007)"},{"key":"2155_CR12","unstructured":"D.P. Kingma, J. Ba, Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"issue":"02","key":"2155_CR13","doi-asserted-by":"publisher","first-page":"2150017","DOI":"10.1142\/S0219477521500176","volume":"20","author":"B Kumar","year":"2021","unstructured":"B. Kumar, Comparative performance evaluation of greedy algorithms for speech enhancement system. Fluct. Noise Lett. 20(02), 2150017 (2021)","journal-title":"Fluct. Noise Lett."},{"key":"2155_CR14","doi-asserted-by":"publisher","first-page":"1586","DOI":"10.1109\/PROC.1979.11540","volume":"67","author":"JS Lim","year":"1979","unstructured":"J.S. Lim, A.V. Oppenheim, Enhancement and bandwidth compression of noisy speech. Proc. IEEE 67, 1586\u20131604 (1979)","journal-title":"Proc. IEEE"},{"key":"2155_CR15","doi-asserted-by":"crossref","unstructured":"S.R. Park, J. Lee, A fully convolutional neural network for speech enhancement. arXiv preprint arXiv:1609.07132 (2016)","DOI":"10.21437\/Interspeech.2017-1465"},{"key":"2155_CR16","doi-asserted-by":"crossref","unstructured":"O. Ronneberger, P. Fischer, T. Brox, in U-net: convolutional networks for biomedical image segmentation. International Conference on Medical image computing and computer-assisted intervention, pp. 234\u2013241 (2015)","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"2155_CR17","doi-asserted-by":"publisher","first-page":"533","DOI":"10.1038\/323533a0","volume":"323","author":"DE Rumelhart","year":"1986","unstructured":"D.E. Rumelhart, G.E. Hinton, R.J. Williams, Learning representations by back-propagating errors. Nature 323, 533\u2013536 (1986)","journal-title":"Nature"},{"key":"2155_CR18","doi-asserted-by":"crossref","unstructured":"A. Stergiou, R. Poppe, G. Kalliatakis, Refining activation downsampling with Softpool. arXiv preprint arXiv:2101.00440 (2021)","DOI":"10.1109\/ICCV48922.2021.01019"},{"key":"2155_CR19","unstructured":"D. Stoller, S. Ewert, S. Dixon, Wave-u-net: A multi-scale neural network for end-to-end audio source separation. arXiv preprint arXiv:1806.03185 (2018)"},{"key":"2155_CR20","doi-asserted-by":"crossref","unstructured":"L. Sun, J. Du, L.-R. Dai, C.-H. Lee, in Multiple-target deep learning for LSTM-RNN based speech enhancement. 2017 Hands-free Speech Communications and Microphone Arrays (HSCMA), pp. 136\u2013140 (IEEE, 2017)","DOI":"10.1109\/HSCMA.2017.7895577"},{"key":"2155_CR21","doi-asserted-by":"crossref","unstructured":"K. Tan, D. Wang, in A convolutional recurrent neural network for real-time speech enhancement. Interspeech, pp. 3229\u20133233 (2018)","DOI":"10.21437\/Interspeech.2018-1405"},{"key":"2155_CR22","doi-asserted-by":"crossref","unstructured":"K. Tan, D. Wang, in Complex spectral mapping with a convolutional recurrent network for monaural speech enhancement. ICASSP 2019-2019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 6865\u20136869 (IEEE, 2019)","DOI":"10.1109\/ICASSP.2019.8682834"},{"key":"2155_CR23","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1109\/TASLP.2019.2955276","volume":"28","author":"K Tan","year":"2019","unstructured":"K. Tan, D. Wang, Learning complex spectral mapping with gated convolutional recurrent networks for monaural speech enhancement. IEEE\/ACM Trans. Audio, Speech, Language Process. 28, 380\u2013390 (2019)","journal-title":"IEEE\/ACM Trans. Audio, Speech, Language Process."},{"key":"2155_CR24","doi-asserted-by":"crossref","unstructured":"J. Thiemann, N. Ito, E. Vincent, in The diverse environments multi-channel acoustic noise database (DEMAND): a database of multichannel environmental noise recordings. Proceedings of Meetings on Acoustics ICA2013, vol. 19 035081 (Acoustical Society of America, 2013)","DOI":"10.1121\/1.4799597"},{"key":"2155_CR25","doi-asserted-by":"crossref","unstructured":"C. Tian, Y. Xu, W. Zuo, C.-W. Lin, D. Zhang, Asymmetric CNN for image superresolution. IEEE Trans. Syst. Man Cybernet. Syst. (2021)","DOI":"10.1109\/TSMC.2021.3069265"},{"key":"2155_CR26","unstructured":"C. Valentini-Botinhao, others. Noisy speech database for training speech enhancement algorithms and tts models. (2017)"},{"key":"2155_CR27","doi-asserted-by":"crossref","unstructured":"C. Veaux, J. Yamagishi, S. King, in The voice bank corpus: design, collection and data analysis of a large regional accent speech database. 2013 International Conference Oriental COCOSDA Held Jointly with 2013 Conference on Asian Spoken Language Research and Evaluation (O-COCOSDA\/CASLRE), pp. 1\u20134 (IEEE, 2013)","DOI":"10.1109\/ICSDA.2013.6709856"},{"key":"2155_CR28","unstructured":"T.H. Vu, J.-C. Wang, Acoustic scene and event recognition using recurrent neural networks. Detect. Classif. Acoust. Scenes Events (2016)"},{"key":"2155_CR29","doi-asserted-by":"crossref","unstructured":"Y. Wang, D. Wang, in Boosting classification based speech separation using temporal dynamics. Thirteenth Annual Conference of the International Speech Communication Association (2012)","DOI":"10.21437\/Interspeech.2012-431"},{"key":"2155_CR30","doi-asserted-by":"publisher","first-page":"11666","DOI":"10.1523\/JNEUROSCI.3414-05.2005","volume":"25","author":"BS Webb","year":"2005","unstructured":"B.S. Webb, N.T. Dhruv, S.G. Solomon, C. Tailby, P. Lennie, Early and late mechanisms of surround suppression in striate cortex of macaque. J. Neurosci. 25, 11666\u201311675 (2005)","journal-title":"J. Neurosci."},{"key":"2155_CR31","unstructured":"L. Yang, R.-Y. Zhang, L. Li, X. Xie, X. Simam in A simple, parameter-free attention module for convolutional neural networks. International Conference on Machine Learning, pp. 11863\u201311874 (PMLR, 2021)"},{"key":"2155_CR32","doi-asserted-by":"crossref","unstructured":"H. Zhang, X. Zhang, G. Gao, in Training supervised speech separation system to improve STOI and PESQ directly. 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 5374\u20135378 (IEEE, 2018)","DOI":"10.1109\/ICASSP.2018.8461965"},{"key":"2155_CR33","doi-asserted-by":"publisher","first-page":"4681","DOI":"10.1109\/TII.2019.2943898","volume":"16","author":"M Zhao","year":"2019","unstructured":"M. Zhao, S. Zhong, X. Fu, B. Tang, M. Pecht, Deep residual shrinkage networks for fault diagnosis. IEEE Trans. Industr. Inf. 16, 4681\u20134690 (2019)","journal-title":"IEEE Trans. Industr. Inf."}],"container-title":["Circuits, Systems, and Signal Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-022-02155-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00034-022-02155-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-022-02155-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,3,16]],"date-time":"2023-03-16T02:04:15Z","timestamp":1678932255000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00034-022-02155-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,8,30]]},"references-count":33,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2023,3]]}},"alternative-id":["2155"],"URL":"https:\/\/doi.org\/10.1007\/s00034-022-02155-8","relation":{},"ISSN":["0278-081X","1531-5878"],"issn-type":[{"type":"print","value":"0278-081X"},{"type":"electronic","value":"1531-5878"}],"subject":[],"published":{"date-parts":[[2022,8,30]]},"assertion":[{"value":"27 January 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 August 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 August 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 August 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"None","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}