{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,1]],"date-time":"2025-07-01T21:53:34Z","timestamp":1751406814854,"version":"3.40.3"},"publisher-location":"Cham","reference-count":19,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031474507"},{"type":"electronic","value":"9783031474514"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-47451-4_17","type":"book-chapter","created":{"date-parts":[[2023,10,31]],"date-time":"2023-10-31T20:02:04Z","timestamp":1698782524000},"page":"232-243","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Voice Activity Detection Using Convolutional Recurrent Neural Networks"],"prefix":"10.1007","author":[{"given":"Josafa","family":"Aguiar-Pontes","sequence":"first","affiliation":[]},{"given":"Monserrate","family":"Intriago-Pazmino","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,11,1]]},"reference":[{"key":"17_CR1","doi-asserted-by":"crossref","unstructured":"Afroz, F., Koolagudi, S.G.: Recognition and classification of pauses in stuttered speech using acoustic features. In: 2019 6th International Conference on Signal Processing and Integrated Networks, SPIN 2019, pp. 921\u2013926 (2019)","DOI":"10.1109\/SPIN.2019.8711569"},{"key":"17_CR2","doi-asserted-by":"crossref","unstructured":"Agarwal, A.R., Tiwari, S., Patage, V.V., Sankar Ganesh, S., Sudhakar, M.S.: A method for voice activity detection using K-means clustering. In: 2022 13th International Conference on Computing Communication and Networking Technologies, ICCCNT 2022 (2022)","DOI":"10.1109\/ICCCNT54827.2022.9984425"},{"key":"17_CR3","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"138","DOI":"10.1007\/978-3-642-23126-1_10","volume-title":"Exploring Music Contents","author":"M Barthet","year":"2011","unstructured":"Barthet, M., Hargreaves, S., Sandler, M.: Speech\/music discrimination in audio podcast using structural segmentation and timbre recognition. In: Ystad, S., Aramaki, M., Kronland-Martinet, R., Jensen, K. (eds.) CMMR 2010. LNCS, vol. 6684, pp. 138\u2013162. Springer, Heidelberg (2011). https:\/\/doi.org\/10.1007\/978-3-642-23126-1_10"},{"key":"17_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TASLP.2022.3164199","volume":"31","author":"M Bhattacharjee","year":"2023","unstructured":"Bhattacharjee, M., Prasanna, S.R.M., Guha, P.: Clean vs. overlapped speech-music detection using harmonic-percussive features and multi-task learning. IEEE\/ACM Trans. Audio Speech Lang. Process. 31, 1\u201310 (2023)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"17_CR5","doi-asserted-by":"crossref","unstructured":"Chung, J.S., Huh, J., Nagrani, A., Afouras, T., Zisserman, A.: Spot the conversation: speaker diarisation in the wild. In: Proceedings of the Annual Conference of the International Speech Communication Association, INTERSPEECH, October 2020, pp. 299\u2013303 (2020)","DOI":"10.21437\/Interspeech.2020-2337"},{"issue":"8","key":"17_CR6","doi-asserted-by":"publisher","first-page":"861","DOI":"10.1016\/j.patrec.2005.10.010","volume":"27","author":"T Fawcett","year":"2006","unstructured":"Fawcett, T.: An introduction to ROC analysis. Pattern Recogn. Lett. 27(8), 861\u2013874 (2006)","journal-title":"Pattern Recogn. Lett."},{"issue":"12","key":"17_CR7","doi-asserted-by":"publisher","first-page":"930","DOI":"10.1049\/el:19940625","volume":"30","author":"RLB Jeann\u00e8s","year":"1994","unstructured":"Jeann\u00e8s, R.L.B., Faucon, G.: Proposal of a voice activity detector for noise reduction. Electron. Lett. 30(12), 930\u2013932 (1994)","journal-title":"Electron. Lett."},{"issue":"18","key":"17_CR8","doi-asserted-by":"publisher","first-page":"6818","DOI":"10.3390\/s22186818","volume":"22","author":"Y Jin","year":"2022","unstructured":"Jin, Y., Wang, M., Luo, L., Zhao, D., Liu, Z.: Polyphonic sound event detection using temporal-frequency attention and feature space attention. Sensors 22(18), 6818 (2022)","journal-title":"Sensors"},{"issue":"1","key":"17_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2009\/239892","volume":"2009","author":"Y Lavner","year":"2009","unstructured":"Lavner, Y., Ruinskiy, D.: A decision-tree-based algorithm for speech\/music classification and segmentation. EURASIP J. Audio Speech Music Process. 2009(1), 1\u201314 (2009)","journal-title":"EURASIP J. Audio Speech Music Process."},{"key":"17_CR10","doi-asserted-by":"crossref","unstructured":"Leglaive, S., Hennequin, R., Badeau, R.: Singing voice detection with deep recurrent neural networks. In: ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings, August 2015, pp. 121\u2013125 (2015)","DOI":"10.1109\/ICASSP.2015.7177944"},{"key":"17_CR11","doi-asserted-by":"crossref","unstructured":"Levitan, R., Hirschberg, J.B.: Measuring acoustic-prosodic entrainment with respect to multiple levels and dimensions (2011)","DOI":"10.21437\/Interspeech.2011-771"},{"issue":"5","key":"17_CR12","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1109\/MSP.2021.3090678","volume":"38","author":"A Mesaros","year":"2021","unstructured":"Mesaros, A., Heittola, T., Virtanen, T., Plumbley, M.D.: Sound event detection: a tutorial. IEEE Signal Process. Maga. 38(5), 67\u201383 (2021)","journal-title":"IEEE Signal Process. Maga."},{"key":"17_CR13","unstructured":"Boersma, P., Weenink, D.: Praat: doing phonetics by computer (2011)"},{"issue":"10","key":"17_CR14","doi-asserted-by":"publisher","first-page":"1733","DOI":"10.1109\/TMM.2015.2428998","volume":"17","author":"D Stowell","year":"2015","unstructured":"Stowell, D., Giannoulis, D., Benetos, E., Lagrange, M., Plumbley, M.D.: Detection and classification of acoustic scenes and events. IEEE Trans. Multimedia 17(10), 1733\u20131746 (2015)","journal-title":"IEEE Trans. Multimedia"},{"key":"17_CR15","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.csl.2019.06.005","volume":"59","author":"ZH Tan","year":"2020","unstructured":"Tan, Z.H., Sarkar, A.K., Dehak, N.: rVAD: an unsupervised segment-based robust voice activity detection method. Comput. Speech Lang. 59, 1\u201321 (2020)","journal-title":"Comput. Speech Lang."},{"key":"17_CR16","unstructured":"The Apache Software Foundation. MXNet"},{"issue":"2","key":"17_CR17","doi-asserted-by":"publisher","first-page":"130","DOI":"10.2174\/1567205014666171121114930","volume":"15","author":"L Toth","year":"2017","unstructured":"Toth, L., et al.: A speech recognition-based solution for the automatic detection of mild cognitive impairment from spontaneous speech. Curr. Alzheimer Res. 15(2), 130\u2013138 (2017)","journal-title":"Curr. Alzheimer Res."},{"key":"17_CR18","doi-asserted-by":"crossref","unstructured":"Yang, Y.Y., et al.: Torchaudio: building blocks for audio and speech processing. In: ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings, May 2022, pp. 6982\u20136986 (2022)","DOI":"10.1109\/ICASSP43922.2022.9747236"},{"key":"17_CR19","doi-asserted-by":"crossref","unstructured":"Yu, D., Deng, L.: Automatic speech recognition (2015)","DOI":"10.1007\/978-1-4471-5779-3"}],"container-title":["Lecture Notes in Networks and Systems","Proceedings of the Future Technologies Conference (FTC) 2023, Volume 2"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-47451-4_17","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,13]],"date-time":"2024-04-13T18:05:45Z","timestamp":1713031545000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-47451-4_17"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031474507","9783031474514"],"references-count":19,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-47451-4_17","relation":{},"ISSN":["2367-3370","2367-3389"],"issn-type":[{"type":"print","value":"2367-3370"},{"type":"electronic","value":"2367-3389"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"1 November 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"FTC","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Proceedings of the Future Technologies Conference","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Vancouver, BC","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Canada","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19 October 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 October 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ftc2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/saiconference.com\/FTC","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}