{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,2]],"date-time":"2025-12-02T15:04:01Z","timestamp":1764687841897},"publisher-location":"Cham","reference-count":88,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030317638"},{"type":"electronic","value":"9783030317645"}],"license":[{"start":{"date-parts":[[2019,11,2]],"date-time":"2019-11-02T00:00:00Z","timestamp":1572652800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-31764-5_7","type":"book-chapter","created":{"date-parts":[[2019,11,1]],"date-time":"2019-11-01T11:46:34Z","timestamp":1572608794000},"page":"171-196","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":25,"title":["Baby Cry Detection: Deep Learning and\u00a0Classical Approaches"],"prefix":"10.1007","author":[{"given":"Rami","family":"Cohen","sequence":"first","affiliation":[]},{"given":"Dima","family":"Ruinskiy","sequence":"additional","affiliation":[]},{"given":"Janis","family":"Zickfeld","sequence":"additional","affiliation":[]},{"given":"Hans","family":"IJzerman","sequence":"additional","affiliation":[]},{"given":"Yizhar","family":"Lavner","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,11,2]]},"reference":[{"key":"7_CR1","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. In: Pereira, F., Burges, C.J.C., Bottou, L., Weinberger, K.Q. (eds.) Advances in Neural Information Processing Systems, vol. 25, pp. 1097\u20131105. Curran Associates, Inc. (2012). http:\/\/papers.nips.cc\/paper\/4824-imagenet-classification-with-deep-convolutional-neural-networks.pdf"},{"key":"7_CR2","doi-asserted-by":"crossref","unstructured":"Hershey, S., Chaudhuri, S., Ellis, D.P., Gemmeke, J.F., Jansen, A., Moore, R.C., Plakal, M., Platt, D., Saurous, R.A., Seybold, B.: CNN architectures for large-scale audio classification. In: IEEE International Conference on Acoustics, Speech and Signal Processing (icassp), pp. 131\u2013135. IEEE (2017)","DOI":"10.1109\/ICASSP.2017.7952132"},{"key":"7_CR3","doi-asserted-by":"crossref","unstructured":"Cakir, E., Heittola, T., Huttunen, H., Virtanen, T.: Polyphonic sound event detection using multi label deep neural networks. In: International Joint Conference on Neural Networks (IJCNN), pp. 1\u20137. IEEE (2015)","DOI":"10.1109\/IJCNN.2015.7280624"},{"key":"7_CR4","doi-asserted-by":"crossref","unstructured":"Ram\u00edrez, J., G\u00f3rriz, J.M., Segura, J.C.: Voice Activity Detection. Fundamentals And Speech Recognition System Robustness (2007)","DOI":"10.5772\/4740"},{"key":"7_CR5","doi-asserted-by":"publisher","first-page":"838","DOI":"10.1109\/TASL.2006.889750","volume":"15","author":"D Ruinskiy","year":"2007","unstructured":"Ruinskiy, D., Lavner, Y.: An effective algorithm for automatic detection and exact demarcation of breath sounds in speech and song signals. IEEE Trans. Audio Speech Lang. Process. 15, 838\u2013850 (2007)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"7_CR6","doi-asserted-by":"crossref","unstructured":"Kong, Y.-Y., Mullangi, A., Kokkinakis, K.: Classification of fricative consonants for speech enhancement in hearing devices. PloS one (2014)","DOI":"10.1371\/journal.pone.0095001"},{"key":"7_CR7","doi-asserted-by":"crossref","unstructured":"Frid, A., Lavner, Y.: Spectral and textural features for automatic classification of fricatives. In: XXII Annual Pacific Voice Conference (PVC), pp. 1\u20134 (2014)","DOI":"10.1109\/PVC.2014.6845422"},{"key":"7_CR8","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1109\/TMM.2004.840604","volume":"7","author":"C Panagiotakis","year":"2005","unstructured":"Panagiotakis, C., Tziritas, G.: A speech\/music discriminator based on rms and zero-crossings. IEEE Trans. Multimed. 7, 155\u2013166 (2005)","journal-title":"IEEE Trans. Multimed."},{"key":"7_CR9","doi-asserted-by":"crossref","unstructured":"Lavner, Y., Ruinskiy, D.: A decision-tree-based algorithm for speech\/music classification and segmentation. EURASIP J. Audio Speech Music Process. (2009)","DOI":"10.1155\/2009\/239892"},{"issue":"5","key":"7_CR10","doi-asserted-by":"publisher","first-page":"293","DOI":"10.1109\/TSA.2002.800560","volume":"10","author":"G Tzanetakis","year":"2002","unstructured":"Tzanetakis, G., Cook, P.: Musical genre classification of audio signals. IEEE Trans. Speech Audio Process. 10(5), 293\u2013302 (2002)","journal-title":"IEEE Trans. Speech Audio Process."},{"issue":"3","key":"7_CR11","doi-asserted-by":"publisher","first-page":"16","DOI":"10.1109\/MSP.2014.2326181","volume":"32","author":"D Barchiesi","year":"2015","unstructured":"Barchiesi, D., Giannoulis, D., Stowell, D., Plumbley, M.D.: Acoustic scene classification: classifying environments from the sounds they produce. IEEE Signal Process. Mag. 32(3), 16\u201334 (2015)","journal-title":"IEEE Signal Process. Mag."},{"issue":"3","key":"7_CR12","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1109\/79.382443","volume":"12","author":"N Morgan","year":"1995","unstructured":"Morgan, N., Bourlard, H.: Continuous speech recognition. IEEE Signal Process. Mag. 12(3), 24\u201342 (1995)","journal-title":"IEEE Signal Process. Mag."},{"key":"7_CR13","doi-asserted-by":"crossref","unstructured":"Aruna, C., Parameswari, A.D., Malini, M., Gopu, G.: Voice recognition and touch screen control based wheel chair for paraplegic persons. In: 2014 International Conference on Green Computing Communication and Electrical Engineering (ICGCCEE), pp. 1\u20135 (2014)","DOI":"10.1109\/ICGCCEE.2014.6922215"},{"key":"7_CR14","doi-asserted-by":"crossref","unstructured":"Carletti, V., Foggia, P., Percannella, G., Saggese, A., Strisciuglio, N., Vento, M.: Audio surveillance using a bag of aural words classifier. In: 2013 10th IEEE International Conference on Advanced Video and Signal Based Surveillance, pp. 81\u201386 (2013)","DOI":"10.1109\/AVSS.2013.6636620"},{"key":"7_CR15","doi-asserted-by":"crossref","unstructured":"Ye, J., Kobayashi, T., Higuchi, T.: Audio-based indoor health monitoring system using flac features. In: 2010 International Conference on Emerging Security Technologies, pp. 90\u201395 (2010)","DOI":"10.1109\/EST.2010.13"},{"key":"7_CR16","doi-asserted-by":"crossref","unstructured":"Kawano, D., Ogawa, T., Matsumoto, H.: A proposal of the method to suppress a click noise only from an observed audio signal. In: 2017 International Symposium on Intelligent Signal Processing and Communication Systems (ISPACS), pp. 93\u201396 (2017)","DOI":"10.1109\/ISPACS.2017.8266452"},{"key":"7_CR17","doi-asserted-by":"crossref","unstructured":"Zhang, H., McLoughlin, I., Song, Y.: Robust sound event recognition using convolutional neural networks. In: 2015 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 559\u2013563 (2015)","DOI":"10.1109\/ICASSP.2015.7178031"},{"key":"7_CR18","doi-asserted-by":"crossref","unstructured":"Piczak, K.J.: Environmental sound classification with convolutional neural networks. In: IEEE 25th International Workshop on Machine Learning for Signal Processing (MLSP), pp. 1\u20136 (2015)","DOI":"10.1109\/MLSP.2015.7324337"},{"key":"7_CR19","unstructured":"Valenti, M., Diment, A., Parascandolo, G., Squartini, S., Virtanen, T.: DCASE 2016 acoustic scene classification using convolutional neural networks. In: Proceedings of the Detection and Classification of Acoustic Scenes and Events 2016 Workshop (DCASE2016). Tampere University of Technology. Department of Signal Processing (2016)"},{"issue":"6","key":"7_CR20","doi-asserted-by":"publisher","first-page":"1291","DOI":"10.1109\/TASLP.2017.2690575","volume":"25","author":"E \u00c7ak\u0131r","year":"2017","unstructured":"\u00c7ak\u0131r, E., Parascandolo, G., Heittola, T., Huttunen, H., Virtanen, T.: Convolutional recurrent neural networks for polyphonic sound event detection. IEEE\/ACM Trans. Audio Speech Lang. Process. 25(6), 1291\u20131303 (2017)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"7_CR21","doi-asserted-by":"crossref","unstructured":"Naithani, G., Barker, T., Parascandolo, G., Bramslw, L., Pontoppidan, N.H., Virtanen, T.: Low latency sound source separation using convolutional recurrent neural networks. In: 2017 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), pp. 71\u201375 (2017)","DOI":"10.1109\/WASPAA.2017.8169997"},{"key":"7_CR22","doi-asserted-by":"crossref","unstructured":"Dieleman, S., Schrauwen, B.: End-to-end learning for music audio. In: 2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 6964\u20136968 (2014)","DOI":"10.1109\/ICASSP.2014.6854950"},{"key":"7_CR23","unstructured":"Pons, J., Nieto, O., Prockup, M., Schmidt, E.M., Ehmann, A.F., Serra, X.: End-to-end learning for music audio tagging at scale. In: ISMIR (2018)"},{"key":"7_CR24","doi-asserted-by":"crossref","unstructured":"Ferretti, D., Severini, M., Principi, E., Cenci, A., Squartini,S.: Infant cry detection in adverse acoustic environments by using deep neural networks. In: EUSIPCO (2018)","DOI":"10.23919\/EUSIPCO.2018.8553135"},{"key":"7_CR25","doi-asserted-by":"crossref","unstructured":"Turan, M.A.T., Erzin, E.: Monitoring infant\u2019s emotional cry in domestic environments using the capsule network architecture. In: Interspeech (2018)","DOI":"10.21437\/Interspeech.2018-2187"},{"key":"7_CR26","unstructured":"Sabour, S., Frosst, N., Hinton, G.E.: Dynamic routing between capsules. In: NIPS (2017)"},{"key":"7_CR27","doi-asserted-by":"crossref","unstructured":"Torres, R., Battaglino, D., Lepauloux, L.: Baby cry sound detection: a comparison of hand crafted features and deep learning approach. In: EANN (2017)","DOI":"10.1007\/978-3-319-65172-9_15"},{"key":"7_CR28","doi-asserted-by":"crossref","unstructured":"Saraswathy, J., Hariharan, M., Yaacob, S., Khairunizam, W.: Automatic classification of infant cry: a review. In: 2012 International Conference on Biomedical Engineering (ICoBE), pp. 543\u2013548 (2012)","DOI":"10.1109\/ICoBE.2012.6179077"},{"key":"7_CR29","doi-asserted-by":"crossref","unstructured":"Lavner, Y., Cohen, R., Ruinskiy, D., IJzerman, H.:Baby cry detection in domestic environment using deep learning. In: 2016 International Conference on the Sceience of Electrical Engineering (ICSEE 2016) (2016)","DOI":"10.1109\/ICSEE.2016.7806117"},{"key":"7_CR30","doi-asserted-by":"crossref","unstructured":"Zhang, X., Zou, Y., Liu, Y.: AICDS: An Infant Crying Detection System Based on Lightweight Convolutional Neural Network, pp. 185\u2013196. Springer (2018)","DOI":"10.1007\/978-3-319-94361-9_14"},{"key":"7_CR31","doi-asserted-by":"crossref","unstructured":"Xu, Y., Hasegawa-Johnson, M., McElwain, N.: Infant emotional outbursts detection in infant-parent spoken interactions. In: Interspeech (2018)","DOI":"10.21437\/Interspeech.2018-2429"},{"key":"7_CR32","unstructured":"Silva, G., Wickramasinghe, D.: Infant cry detection system with automatic soothing and video monitoring functions. J. Eng. Technol. Open Univ. Sri Lanka (JET-OUSL) 5(1). http:\/\/digital.lib.ou.ac.lk\/docs\/handle\/701300122\/1476 (2017)"},{"key":"7_CR33","unstructured":"Gao, J., Pabon, L.: Hot car baby detector. Illinois College of Engineering, Technical Report, December 2014"},{"key":"7_CR34","unstructured":"Lollipop smart baby monitor. https:\/\/www.lollipop.camera\/ (2018)"},{"key":"7_CR35","unstructured":"Cocoon cam baby monitor. https:\/\/cocooncam.com\/ (2019)"},{"key":"7_CR36","unstructured":"Evoz wifi baby vision monitor. https:\/\/myevoz.com\/ (2019)"},{"issue":"11","key":"7_CR37","doi-asserted-by":"publisher","first-page":"1699","DOI":"10.1016\/j.ijporl.2007.07.005","volume":"71","author":"G Varallyay","year":"2007","unstructured":"Varallyay, G.: The melody of crying. Int. J. Pediatr. Otorhinolaryngol. 71(11), 1699\u20131708 (2007)","journal-title":"Int. J. Pediatr. Otorhinolaryngol."},{"key":"7_CR38","doi-asserted-by":"crossref","unstructured":"Zabidi, A., Khuan, L.Y., Mansor, W., Yassin, I.M., Sahak, R.: Classification of infant cries with asphyxia using multilayer perceptron neural network. In: Proceedings of the 2010 Second International Conference on Computer Engineering and Applications\u2014Series. ICCEA 2010, vol. 01, pp. 204\u2013208. IEEE Computer Society, Washington, DC, USA (2010)","DOI":"10.1109\/ICCEA.2010.47"},{"key":"7_CR39","first-page":"10","volume":"30","author":"S Orlandi","year":"2015","unstructured":"Orlandi, S., Reyes-Garcia, C.A., Bandini, A., Donzelli, G., Manfredi, C.: Application of pattern recognition techniques to the classification of full-term and preterm infant cry. J. Voice Off. J. Voice Found. 30, 10 (2015)","journal-title":"J. Voice Off. J. Voice Found."},{"key":"7_CR40","doi-asserted-by":"publisher","first-page":"S297","DOI":"10.1016\/S0165-5876(99)00180-9","volume":"49","author":"K Michelsson","year":"1999","unstructured":"Michelsson, K., Michelsson, O.: Phonation in the newborn, infant cry. Int. J. Pediatr. Otorhinolaryngol. 49, S297\u2013S301 (1999)","journal-title":"Int. J. Pediatr. Otorhinolaryngol."},{"key":"7_CR41","unstructured":"Bowlby, J.: Attachment and Loss. Basic Books, vol. 1 (1969)"},{"issue":"3","key":"7_CR42","doi-asserted-by":"publisher","first-page":"350","DOI":"10.1111\/j.1469-8749.1972.tb02601.x","volume":"14","author":"P Ostwald","year":"1972","unstructured":"Ostwald, P.: The sounds of infancy. Dev. Med. Child Neurol. 14(3), 350\u2013361 (1972)","journal-title":"Dev. Med. Child Neurol."},{"key":"7_CR43","doi-asserted-by":"crossref","unstructured":"Owings, D., Zeifman, D.: Human infant crying as an animal communication system: insights from an assessment\/management approach. In: Evolution of Communication Systems: A Comparative Approach, pp. 151\u2013170 (2004)","DOI":"10.7551\/mitpress\/2879.003.0015"},{"key":"7_CR44","unstructured":"Nelson, J.: Seeing Through Tears: Crying and Attachment. Routledge (2005)"},{"key":"7_CR45","doi-asserted-by":"crossref","unstructured":"IJzerman, H., et\u00a0al.: A theory of social thermoregulation in human primates. Front. Psychol. 6, 464 (2015)","DOI":"10.3389\/fpsyg.2015.00464"},{"issue":"2","key":"7_CR46","doi-asserted-by":"publisher","first-page":"202","DOI":"10.1177\/1754073912451630","volume":"5","author":"EA Butler","year":"2013","unstructured":"Butler, E.A., Randall, A.K.: Emotional coregulation in close relationships. Emot. Rev. 5(2), 202\u2013210 (2013)","journal-title":"Emot. Rev."},{"issue":"1","key":"7_CR47","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1002\/mrdd.20050","volume":"11","author":"LL LaGasse","year":"2005","unstructured":"LaGasse, L.L., Neal, A.R., Lester, B.M.: Assessment of infant cry: a coustic cry analysis and parental perception. Ment. Retard. Dev. Disabil. Res. Rev. 11(1), 83\u201393 (2005)","journal-title":"Ment. Retard. Dev. Disabil. Res. Rev."},{"key":"7_CR48","doi-asserted-by":"crossref","unstructured":"Hendriks, M., Nelson, J.K., Cornelius, R., Vingerhoets, A.: Why crying improves our well-being: an attachment-theory perspective on the functions of adult crying. In: Emotion Regulation: Conceptual and Clinical Issues, pp. 87\u201396 (2008)","DOI":"10.1007\/978-0-387-29986-0_6"},{"key":"7_CR49","unstructured":"Pal, P.A., Iyer, N., Yantorno, R.E.: Emotion detection from infant facial expressions and cries. In: 2006 IEEE International Conference on Acoustics Speech and Signal Processing Proceedings, vol. 2, pp. II\u2013II (2006)"},{"key":"7_CR50","unstructured":"Barajas-Montiel, S., Reyes-Garcia, C.A.: Identifying pain and hunger in infant cry with classifiers ensembles, pp. 770 \u2013 775 (2005)"},{"key":"7_CR51","unstructured":"Wasz-H\u00f6ckert, O.: The infant cry: a spectrographic and auditory analysis. Spastics International Medical Publications in association with W. Heinemann Medical Books. Series Clinics in Developmental Medicine (1968)"},{"key":"7_CR52","doi-asserted-by":"crossref","unstructured":"Vingerhoets, A.: Why Only Humans Weep: Unravelling the Mysteries of Tears. Oxford University Press (2013)","DOI":"10.1093\/acprof:oso\/9780198570240.001.0001"},{"issue":"4","key":"7_CR53","doi-asserted-by":"publisher","first-page":"1171","DOI":"10.2307\/1127506","volume":"43","author":"SILVIA M. BELL","year":"1972","unstructured":"Bell, S.M., Salter\u00a0Ainsworth, M.D.: Infant crying and maternal responsiveness. In: Child development, vol. 43, pp. 1171\u201390 (1973)","journal-title":"Child Development"},{"issue":"3","key":"7_CR54","doi-asserted-by":"publisher","first-page":"677","DOI":"10.2307\/1129380","volume":"53","author":"ML Lounsbury","year":"1982","unstructured":"Lounsbury, M.L., Bates, J.E.: The cries of infants of differing levels of perceived temperamental difficultness: acoustic properties and effects on listeners. Child Dev. 53(3), 677\u2013686 (1982)","journal-title":"Child Dev."},{"issue":"3","key":"7_CR55","doi-asserted-by":"publisher","first-page":"394","DOI":"10.2307\/1131667","volume":"68","author":"Philip Sanford Zeskind","year":"1997","unstructured":"Zeskind, P., Barr, R.: Acoustic characteristics of naturally occurring cries of infants with colic. Child Dev. 68, 394\u2013403 (1997)","journal-title":"Child Development"},{"key":"7_CR56","doi-asserted-by":"crossref","unstructured":"Laan, A., Assen, M.V., Vingerhoets, A.: Individual differences in adult crying: the role of attachment styles. Soc. Behav. Person. Int. J. (2012)","DOI":"10.2224\/sbp.2012.40.3.453"},{"issue":"3","key":"7_CR57","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1016\/S1090-5138(97)00006-8","volume":"18","author":"F.Bryant Furlow","year":"1997","unstructured":"Bryant\u00a0Furlow, F.: Human neonatal cry quality as an honest signal of fitness. Evol. Hum. Behav. 18, 175\u2013193 (1997)","journal-title":"Evolution and Human Behavior"},{"issue":"08","key":"7_CR58","doi-asserted-by":"publisher","first-page":"796","DOI":"10.4236\/jbise.2013.68097","volume":"06","author":"Y Kheddache","year":"2013","unstructured":"Kheddache, Y., Tadj, C.: Acoustic measures of the cry characteristics of healthy newborns and newborns with pathologies. J. Biomed. Sci. Eng. 06(08), 796\u2013804 (2013)","journal-title":"J. Biomed. Sci. Eng."},{"key":"7_CR59","doi-asserted-by":"crossref","unstructured":"Orlandi, S., Manfredi, C., Bocchi, L., Scattoni, M.L.: Automatic newborn cry analysis: a non-invasive tool to help autism early diagnosis. In: 2012 Annual International Conference of the IEEE Engineering in Medicine and Biology Society, pp. 2953\u20132956 (2012)","DOI":"10.1109\/EMBC.2012.6346583"},{"issue":"5","key":"7_CR60","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1002\/aur.1244","volume":"5","author":"SJ Sheinkopf","year":"2012","unstructured":"Sheinkopf, S.J., Iverson, J.M., Rinaldi, M.L., Lester, B.M.: Atypical cry acoustics in 6-month-old infants at risk for autism spectrum disorder. Autism Res. 5(5), 331\u2013339 (2012)","journal-title":"Autism Res."},{"issue":"5","key":"7_CR61","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1007\/s12553-018-0243-5","volume":"8","author":"Saraswathy Jeyaraman","year":"2018","unstructured":"Jeyaraman, S., Muthusamy, H., Wan, K., Jeyaraman, S., Nadarajaw, T., Yaacob, S., Nisha, S.: A review: survey on automatic infant cry analysis and classification. Health Technol. 8 (2018)","journal-title":"Health and Technology"},{"key":"7_CR62","doi-asserted-by":"crossref","unstructured":"IJzerman, H., \u010coli\u0107, M., Hennecke, M., Hong, Y., Hu, C.-P., Joy-Gaba, J., Lazarevic, D., Lazarevic, L., Parzuchowski, M., Ratner, K.G., Schubert, T., Schuetz, A., Stojilovi, D., Weissgerber, S., Zickfeld, J., Lindenberg, S.: Does distance from the equator predict self-control? Lessons from the human penguin project. Behav. Brain Sci. 40 (2017)","DOI":"10.1017\/S0140525X16001035"},{"key":"7_CR63","doi-asserted-by":"crossref","unstructured":"IJzerman, H., Lindenberg, S., Dalgar, I., Weissgerber, S., Clemente\u00a0Vergara, R., Cairo, A., oli, M., Dursun, P., Frankowska, N., Hadi, R., Hall, C., Hong, Y., Hu, C.-P., Joy-Gaba, J., Lazarevic, D., Lazarevic, L., Parzuchowski, M., Ratner, K.G., Rothman, D., Zickfeld J.: The human penguin project: climate, social integration, and core body temperature. Collabra: Psychol. 4 (2018)","DOI":"10.1525\/collabra.165"},{"key":"7_CR64","unstructured":"Bishop, C.M.: Pattern Recognition and Machine Learning. Springer Science+Business Media (2006)"},{"key":"7_CR65","unstructured":"Goodfellow, I., Bengio, Y., Courville, A.: Deep Learning. MIT Press, http:\/\/www.deeplearningbook.org (2016)"},{"issue":"6088","key":"7_CR66","doi-asserted-by":"publisher","first-page":"533","DOI":"10.1038\/323533a0","volume":"323","author":"David E. Rumelhart","year":"1986","unstructured":"Rumelhart, D.E., Hinton, G.E., Williams, R.J.: Learning representations by back propagating errors. Nature 323, 533\u2013536 (1986)","journal-title":"Nature"},{"key":"7_CR67","unstructured":"Huang, X., Acero, A., Hon, H.-W.: Spoken Language Processing: A Guide to Theory, Algorithm, and System Development. Prentice Hall PTR (2001)"},{"key":"7_CR68","unstructured":"Szegedy, C., Ioffe, S., Vanhoucke, V.: Inception-v4, inception-resnet and the impact of residual connections on learning. CoRR (2016) arXiv:1602.07261"},{"key":"7_CR69","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"7_CR70","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: Accelerating deep network training by reducing internal covariate shift. CoRR, arXiv:1502.03167"},{"key":"7_CR71","doi-asserted-by":"crossref","unstructured":"Phan, H., Koch, P., Katzberg, F., Maa\u00df, M., Mazur, R., Mertins, A.: Audio scene classification with deep recurrent neural networks. In: INTERSPEECH (2017)","DOI":"10.21437\/Interspeech.2017-101"},{"key":"7_CR72","unstructured":"Graves, A., Mohamed, A., Hinton, G.E.: Speech recognition with deep recurrent neural networks. CoRR (2013) arXiv:1303.5778"},{"issue":"11","key":"7_CR73","doi-asserted-by":"publisher","first-page":"2673","DOI":"10.1109\/78.650093","volume":"45","author":"M Schuster","year":"1997","unstructured":"Schuster, M., Paliwal, K.K.: Bidirectional recurrent neural networks. IEEE Trans. Signal Process. 45(11), 2673\u20132681 (1997)","journal-title":"IEEE Trans. Signal Process."},{"key":"7_CR74","doi-asserted-by":"crossref","unstructured":"Graves, A., Jaitly, N., Mohamed, A.: Hybrid speech recognition with deep bidirectional LSTM. In 2013 IEEE Workshop on Automatic Speech Recognition and Understanding, pp. 273\u2013278 (2013)","DOI":"10.1109\/ASRU.2013.6707742"},{"key":"7_CR75","doi-asserted-by":"crossref","unstructured":"Ben-Yehuda, T., Abramovich, I., Cohen, R.: Low-complexity video classification using recurrent neural networks. In: 2018 International Conference on the Science of Electrical Engineering (ICSEE 2018) (2018)","DOI":"10.1109\/ICSEE.2018.8646076"},{"issue":"8","key":"7_CR76","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9(8), 1735\u20131780 (1997)","journal-title":"Neural Comput."},{"key":"7_CR77","doi-asserted-by":"crossref","unstructured":"Graves, A.: Supervised Sequence Labelling with Recurrent Neural Networks, Series Studies in Computational Intelligence, vol. 385. Springer (2012)","DOI":"10.1007\/978-3-642-24797-2"},{"issue":"11","key":"7_CR78","doi-asserted-by":"publisher","first-page":"172","DOI":"10.3390\/a11110172","volume":"11","author":"Hongxiao Fei","year":"2018","unstructured":"Fei, H., Tan, F.: Bidirectional grid long short-term memory (bigridlstm): a method to address context-sensitivity and vanishing gradient. Algorithms 11 (2018)","journal-title":"Algorithms"},{"key":"7_CR79","unstructured":"Glorot, X., Bengio, Y.: Understanding the difficulty of training deep feedforward neural networks. In: Teh, Y.W., Titterington, M. (eds.) Proceedings of the Thirteenth International Conference on Artificial Intelligence and Statistics, Series Proceedings of Machine Learning Research, vol. 9, pp. 249\u2013256 PMLR (2010)"},{"key":"7_CR80","doi-asserted-by":"crossref","unstructured":"Cohen, R., Lavner, Y.: Infant cry analysis and detection. In: 2012 IEEE 27th Convention of Electrical and Electronics Engineers in Israel (IEEEI 2012), pp. 2\u20136 (2012)","DOI":"10.1109\/EEEI.2012.6376996"},{"issue":"2","key":"7_CR81","doi-asserted-by":"publisher","first-page":"293","DOI":"10.1121\/1.1910339","volume":"41","author":"AM Noll","year":"1967","unstructured":"Noll, A.M.: Cepstrum pitch determination. J. Acoust. Soc. Am. 41(2), 293\u2013309 (1967)","journal-title":"J. Acoust. Soc. Am."},{"issue":"2","key":"7_CR82","doi-asserted-by":"publisher","first-page":"288","DOI":"10.1109\/JPROC.2010.2090998","volume":"99","author":"T Waterschoot van","year":"2011","unstructured":"van Waterschoot, T., Moonen, M.: Fifty years of acoustic feedback control: state of the art and future challenges. Proc. IEEE 99(2), 288\u2013327 (2011)","journal-title":"Proc. IEEE"},{"key":"7_CR83","unstructured":"van Waterschoot, T., Moonen, M.: Comparative evaluation of howling detection criteria in notch-filter-based howling suppression. J. Audio Eng. Soc. 58(11), 923\u2013940 (2010)"},{"key":"7_CR84","unstructured":"Rabiner, L.R., Schafer, R.W.: Theory and Applications of Digital Speech Processing, vol.\u00a064. Pearson, Upper Saddle River (2011)"},{"key":"7_CR85","volume-title":"Discrete-Time Speech Signal Processing: Principles and Practice","author":"T Quatieri","year":"2002","unstructured":"Quatieri, T.: Discrete-Time Speech Signal Processing: Principles and Practice. Prentice Hall, London (2002)"},{"key":"7_CR86","unstructured":"Platt, J.: Sequential minimal optimization: a fast algorithm for training support vector machines (1998)"},{"key":"7_CR87","doi-asserted-by":"crossref","unstructured":"Frederiks, K., Sterkenburg, P., Lavner, Y., Cohen, R., Ruinskiy, D., Verbeke, W., IJzerman, H.: Mobile social physiology as the future of relationship research and therapy: presentation of the bio-app for bonding (BAB), PsyArXiv (2018)","DOI":"10.31234\/osf.io\/xr8ma"},{"key":"7_CR88","unstructured":"Kingma, D., Ba, J.: Adam: a method for stochastic optimization. In: International Conference on Learning Representations, December 2014"}],"container-title":["Studies in Computational Intelligence","Development and Analysis of Deep Learning Architectures"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-31764-5_7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,7,26]],"date-time":"2024-07-26T03:14:31Z","timestamp":1721963671000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-31764-5_7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,11,2]]},"ISBN":["9783030317638","9783030317645"],"references-count":88,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-31764-5_7","relation":{},"ISSN":["1860-949X","1860-9503"],"issn-type":[{"type":"print","value":"1860-949X"},{"type":"electronic","value":"1860-9503"}],"subject":[],"published":{"date-parts":[[2019,11,2]]},"assertion":[{"value":"2 November 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}