{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,3]],"date-time":"2026-03-03T16:06:05Z","timestamp":1772553965638,"version":"3.50.1"},"publisher-location":"Cham","reference-count":22,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319651712","type":"print"},{"value":"9783319651729","type":"electronic"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-65172-9_15","type":"book-chapter","created":{"date-parts":[[2017,8,1]],"date-time":"2017-08-01T04:38:54Z","timestamp":1501562334000},"page":"168-179","source":"Crossref","is-referenced-by-count":28,"title":["Baby Cry Sound Detection: A Comparison of Hand Crafted Features and Deep Learning Approach"],"prefix":"10.1007","author":[{"given":"Rafael","family":"Torres","sequence":"first","affiliation":[]},{"given":"Daniele","family":"Battaglino","sequence":"additional","affiliation":[]},{"given":"Ludovick","family":"Lepauloux","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,8,2]]},"reference":[{"key":"15_CR1","doi-asserted-by":"crossref","unstructured":"Mesaros, A., Heittola, T., Virtanen, T.: TUT database for acoustic scene classification and sound event detection. In: 24th European Signal Processing Conference (EUSIPCO), pp. 1128\u20131132 (2016)","DOI":"10.1109\/EUSIPCO.2016.7760424"},{"issue":"3","key":"15_CR2","doi-asserted-by":"crossref","first-page":"16","DOI":"10.1109\/MSP.2014.2326181","volume":"32","author":"D Barchiesi","year":"2015","unstructured":"Barchiesi, D., Giannoulis, D., Stowell, D., Plumbley, M.: Acoustic scene classification: classifying environments from the sounds they produce. IEEE Sig. Process. Mag. 32(3), 16\u201334 (2015)","journal-title":"IEEE Sig. Process. Mag."},{"issue":"5","key":"15_CR3","doi-asserted-by":"crossref","first-page":"358","DOI":"10.17743\/jaes.2015.0025","volume":"63","author":"S Ntalampiras","year":"2015","unstructured":"Ntalampiras, S.: Audio pattern recognition of baby crying sound events. J. Audio Eng. Soc. 63(5), 358\u2013369 (2015)","journal-title":"J. Audio Eng. Soc."},{"key":"15_CR4","doi-asserted-by":"crossref","unstructured":"Saraswathy, J., Hariharan, M., Yaacob, S., Khairunizam, W.: Automatic classification of infant cry: a review. In: International Conference on Biomedical Engineering (ICoBE), pp. 543\u2013548, February 2012","DOI":"10.1109\/ICoBE.2012.6179077"},{"key":"15_CR5","doi-asserted-by":"crossref","unstructured":"Lavner, Y., Cohen, R., Ruinskiy, D., Ijzerman, H.: Baby cry detection in domestic environment using deep learning. In: IEEE International Conference on the Science of Electrical Engineering (ICSEE), pp. 1\u20135, November 2016","DOI":"10.1109\/ICSEE.2016.7806117"},{"key":"15_CR6","doi-asserted-by":"crossref","unstructured":"Saha, B., Purkait, P.K., Mukherjee, J., Majumdar, A.K., Majumdar, B., Singh, A.K.: An embedded system for automatic classification of neonatal cry. In: IEEE Point-of-Care Healthcare Technologies (PHT), pp. 248\u2013251, January 2013","DOI":"10.1109\/PHT.2013.6461331"},{"key":"15_CR7","doi-asserted-by":"crossref","unstructured":"B\u011fnic\u011f, I.A., Cucu, H., Buzo, A., Burileanu, D., Burileanu, C.: Baby cry recognition in real-world conditions. In: 39th International Conference on Telecommunications and Signal Processing (TSP), pp. 315\u2013318, June 2016","DOI":"10.1109\/TSP.2016.7760887"},{"key":"15_CR8","doi-asserted-by":"crossref","unstructured":"Battaglino, D., Lepauloux, L., Evans, N.: The open-set problem in acoustic scene classification. In: IEEE International Workshop on Acoustic Signal Enhancement (IWAENC), pp. 1\u20135, September 2016","DOI":"10.1109\/IWAENC.2016.7602939"},{"key":"15_CR9","doi-asserted-by":"crossref","unstructured":"Rabaoui, A., Davy, M., Rossignol, S., Lachiri, Z., Ellouze, N.: Improved one-class svm classifier for sounds classification. In: IEEE Conference on Advanced Video and Signal Based Surveillance (AVSS), pp. 117\u2013122 (2007)","DOI":"10.1109\/AVSS.2007.4425296"},{"key":"15_CR10","unstructured":"Tax, D.M.J., Duin, R.P.W.: Data domain description using support vectors. In: European Symposium on Artificial Neural Networks, pp. 251\u2013256 (1999)"},{"key":"15_CR11","doi-asserted-by":"crossref","unstructured":"Cohen, R., Lavner, Y.: Infant cry analysis and detection. In: IEEE 27th Convention of Electrical and Electronics Engineers, pp. 1\u20135, November 2012","DOI":"10.1109\/EEEI.2012.6376996"},{"issue":"3\u20134","key":"15_CR12","doi-asserted-by":"crossref","first-page":"197","DOI":"10.1561\/2000000039","volume":"7","author":"L Deng","year":"2014","unstructured":"Deng, L., Yu, D.: Deep learning: methods and applications. Found. Trends Sig. Process. 7(3\u20134), 197\u2013387 (2014)","journal-title":"Found. Trends Sig. Process."},{"key":"15_CR13","doi-asserted-by":"crossref","unstructured":"Piczak, K.J.: Environmental sound classification with convolutional neural networks. In: IEEE 25th International Workshop on Machine Learning for Signal Processing (MLSP), pp. 1\u20136, September 2015","DOI":"10.1109\/MLSP.2015.7324337"},{"key":"15_CR14","unstructured":"Hinton, G.E., Srivastava, N., Krizhevsky, A., Sutskever, I., Salakhutdinov, R.R.: Improving neural networks by preventing co-adaptation of feature detectors. arXiv:1207.0580 (2012)"},{"key":"15_CR15","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: accelerating deep network training by reducing internal covariate shift. In: 32nd International Conference on Machine Learning, ICML, pp. 448\u2013456 (2015)"},{"key":"15_CR16","unstructured":"Boersma, P.: Accurate short-term analysis of the fundamental frequency and the harmonics-to-noise ratio of a sampled sound. In: IFA Proceedings 17, pp. 97\u2013110 (1993)"},{"key":"15_CR17","doi-asserted-by":"crossref","unstructured":"Foster, P., Sigtia, S., Krstulovic, S., Barker, J., Plumbley, M.D.: Chime-home: a dataset for sound source recognition in a domestic environment. In: IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA), pp. 1\u20135 (2015)","DOI":"10.1109\/WASPAA.2015.7336899"},{"issue":"3","key":"15_CR18","doi-asserted-by":"crossref","first-page":"e0118432","DOI":"10.1371\/journal.pone.0118432","volume":"10","author":"T Saito","year":"2015","unstructured":"Saito, T., Rehmsmeier, M.: The precision-recall plot is more informative than the ROC plot when evaluating binary classifiers on imbalanced datasets. PloS One 10(3), e0118432 (2015)","journal-title":"PloS One"},{"key":"15_CR19","doi-asserted-by":"crossref","first-page":"27:1","DOI":"10.1145\/1961189.1961199","volume":"2","author":"CC Chang","year":"2011","unstructured":"Chang, C.C., Lin, C.J.: LIBSVM: a library for support vector machines. ACM Trans. Intell. Syst. Technol. 2, 27:1\u201327:27 (2011). http:\/\/www.csie.ntu.edu.tw\/~cjlin\/libsvm","journal-title":"ACM Trans. Intell. Syst. Technol."},{"issue":"1\u20133","key":"15_CR20","doi-asserted-by":"crossref","first-page":"111","DOI":"10.1016\/S0167-9260(02)00045-7","volume":"32","author":"JC Wang","year":"2002","unstructured":"Wang, J.C., Wang, J.F., Weng, Y.S.: Chip design of MFCC extraction for speech recognition. Integr. VLSI J. 32(1\u20133), 111\u2013131 (2002)","journal-title":"Integr. VLSI J."},{"key":"15_CR21","doi-asserted-by":"crossref","unstructured":"Wu, J., Leng, C., Wang, Y., Hu, Q., Cheng, J.: Quantized convolutional neural networks for mobile devices. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4820\u20134828, June 2016","DOI":"10.1109\/CVPR.2016.521"},{"issue":"11","key":"15_CR22","doi-asserted-by":"crossref","first-page":"2096","DOI":"10.1109\/TASLP.2016.2592698","volume":"24","author":"S Sigtia","year":"2016","unstructured":"Sigtia, S., Stark, A.M., Krstulovi, S., Plumbley, M.D.: Automatic environmental sound recognition: performance versus computational cost. IEEE\/ACM Trans. Audio Speech Lang. Process. 24(11), 2096\u20132107 (2016)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."}],"container-title":["Communications in Computer and Information Science","Engineering Applications of Neural Networks"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-65172-9_15","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,24]],"date-time":"2025-06-24T19:21:49Z","timestamp":1750792909000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-65172-9_15"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9783319651712","9783319651729"],"references-count":22,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-65172-9_15","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"value":"1865-0929","type":"print"},{"value":"1865-0937","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017]]}}}