{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:27:04Z","timestamp":1740122824771,"version":"3.37.3"},"reference-count":26,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2020,11,18]],"date-time":"2020-11-18T00:00:00Z","timestamp":1605657600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,11,18]],"date-time":"2020-11-18T00:00:00Z","timestamp":1605657600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2021,3]]},"DOI":"10.1007\/s10772-020-09777-w","type":"journal-article","created":{"date-parts":[[2020,11,18]],"date-time":"2020-11-18T14:04:15Z","timestamp":1605708255000},"page":"127-142","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A novel voice activity detection algorithm using modified global thresholding"],"prefix":"10.1007","volume":"24","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6864-453X","authenticated-orcid":false,"given":"R. Johny","family":"Elton","sequence":"first","affiliation":[]},{"given":"J.","family":"Mohanalin","sequence":"additional","affiliation":[]},{"given":"P.","family":"Vasuki","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,11,18]]},"reference":[{"key":"9777_CR1","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1109\/97.995824","volume":"9","author":"F Beritelli","year":"2002","unstructured":"Beritelli, F., Casale, S., Ruggeri, G., & Serano, S. (2002). Performance evaluation and comparison of G.729\/AMR\/fuzzy voice activity detectors. IEEE Signal Processing Letters, 9, 85\u201388.","journal-title":"IEEE Signal Processing Letters"},{"key":"9777_CR2","doi-asserted-by":"publisher","first-page":"266","DOI":"10.1109\/TNSRE.2007.897025","volume":"15","author":"W Chen","year":"2007","unstructured":"Chen, W., Wang, Z., & Yu, W. (2007). Characterization of surface EMG signal based on fuzzy entropy. IEEE Transactions on Neural Systems and Rehabilitation Engineering, 15, 266\u2013272.","journal-title":"IEEE Transactions on Neural Systems and Rehabilitation Engineering"},{"key":"9777_CR3","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1016\/j.medengphy.2008.04.005","volume":"31","author":"W Chen","year":"2009","unstructured":"Chen, W., Zhuang, J., Wang, Z., & Yu, W. (2009). Measuring complexity using FuzzyEn, ApEn and SampEn. Medical Engineering & Physics, 31, 61\u201368.","journal-title":"Medical Engineering & Physics"},{"doi-asserted-by":"crossref","unstructured":"Craciun, A., & Gabrea, M. (2004). Correlation coefficient-based voice activity detector algorithm. In Proceedings of Canadian conference on electrical and computer engineering (Vol. 3, pp. 1789\u20131792).","key":"9777_CR4","DOI":"10.1109\/CCECE.2004.1349763"},{"issue":"12","key":"9777_CR5","doi-asserted-by":"publisher","first-page":"2313","DOI":"10.1109\/TASLP.2016.2566919","volume":"24","author":"D Dov","year":"2016","unstructured":"Dov, D., Talmon, R., & Cohen, I. (2016). Kernel method for voice activity detection in presence of transients. IEEE Transactions on Audio, Speech and Language Processing, 24(12), 2313\u20132326.","journal-title":"IEEE Transactions on Audio, Speech and Language Processing"},{"key":"9777_CR6","doi-asserted-by":"publisher","first-page":"298","DOI":"10.3390\/e18080298","volume":"18","author":"J Elton","year":"2016","unstructured":"Elton, J., Vasuki, P., & Mohanalin, J. (2016). Voice activity detection using fuzzy entropy and support vector machine. Entropy, 18, 298. https:\/\/doi.org\/10.3390\/e18080298.","journal-title":"Entropy"},{"unstructured":"Garofolo, J., Lamel, L., Fisher, W., Fiscus, J., Pallett, D., Dahlgren, N., & Zue, V. (1993). TIMIT: Acoustic-phonetic continuous speech corpus. Philadelphia: Linguistic Data Consortium (1993).","key":"9777_CR7"},{"issue":"3","key":"9777_CR8","doi-asserted-by":"publisher","first-page":"646","DOI":"10.1109\/TASLP.2017.2769220","volume":"26","author":"G Gelly","year":"2017","unstructured":"Gelly, G., & Gauvain, J.-L. (2017). Optimization of RNN-based speech activity detection. IEEE\/ACM Transactions on Audio, Speech, and Language Processing, 26(3), 646\u2013656.","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"unstructured":"Haigh, J., & Mason, J. S. (1993). A voice activity detector based on cepstral analysis. In Proceedings of 3rd Eurospeech (pp. 1103\u20131106). Berlin, Germany.","key":"9777_CR9"},{"unstructured":"Hirsch, H. G., & Pierce, D. (2000). The AURORA experimental framework for the performance evaluation of speech recognition systems under noise conditions. In Proc. ISCA ITRW ASR automatic speech recognition: Challenges for the next millennium.","key":"9777_CR10"},{"key":"9777_CR11","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1016\/j.specom.2009.08.003","volume":"52","author":"K Ishizuka","year":"2010","unstructured":"Ishizuka, K., Nakatani, T., Fujimoto, M., & Miyazaki, N. (2010). Noise robust voice activity detection based on periodic to aperiodic component ratio. Speech Communication, 52, 41\u201360. https:\/\/doi.org\/10.1016\/j.specom.2009.08.003.","journal-title":"Speech Communication"},{"unstructured":"ITU. (1996). A silence compression scheme for G.729 optimized for terminals conforming to recommendation, v.70. In ITU-T Recommendation G.729-Annex B.","key":"9777_CR12"},{"key":"9777_CR13","doi-asserted-by":"publisher","first-page":"537","DOI":"10.1007\/s10772-014-9240-x","volume":"19","author":"SM Joseph","year":"2016","unstructured":"Joseph, S. M., & Babu, A. P. (2016). Wavelet energy-based voice activity detection and adaptive thresholding for efficient speech coding. International Journal of Speech Technology, 19, 537\u2013550.","journal-title":"International Journal of Speech Technology"},{"key":"9777_CR14","doi-asserted-by":"publisher","first-page":"827","DOI":"10.1007\/s10772-019-09625-6","volume":"22","author":"O Kenai","year":"2019","unstructured":"Kenai, O., Ouamour, S., Guerti, M., et al. (2019). A new architecture based VAD for speaker diarization\/detection systems. International Journal of Speech Technology, 22, 827\u2013840.","journal-title":"International Journal of Speech Technology"},{"unstructured":"Krishnan, P. S. H., Padmanabhan, R., & Murthy, H. A. (2007). Voice activity detection using group delay processing on buffered short-term energy. In Proceedings of 13th international conference on communications.","key":"9777_CR15"},{"issue":"6","key":"9777_CR16","doi-asserted-by":"publisher","first-page":"1594","DOI":"10.1093\/ietfec\/e89-a.6.1594","volume":"E-89-A","author":"YC Lee","year":"2006","unstructured":"Lee, Y. C., & Ahn, S. S. (2006). Statistical model-based VAD algorithm with wavelet transform. IEICE Transactions on Fundamentals, E-89-A(6), 1594\u20131600.","journal-title":"IEICE Transactions on Fundamentals"},{"issue":"3","key":"9777_CR17","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1109\/89.905996","volume":"9","author":"E Nemer","year":"2001","unstructured":"Nemer, E., Goubran, R., & Mahmoud, S. (2001). Robust voice activity detection using higher-order statistics in the LPC residual domain. IEEE Transactions on Audio, Speech and Language Processing, 9(3), 217\u2013231.","journal-title":"IEEE Transactions on Audio, Speech and Language Processing"},{"issue":"2","key":"9777_CR18","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1002\/j.1538-7305.1975.tb02840.x","volume":"54","author":"LR Rabiner","year":"1975","unstructured":"Rabiner, L. R., & Sambur, M. R. (1975). An algorithm for determining the endpoints of isolated utterances. Bell System Technical Journal, 54(2), 297\u2013315.","journal-title":"Bell System Technical Journal"},{"issue":"3\u20134","key":"9777_CR19","doi-asserted-by":"publisher","first-page":"271","DOI":"10.1016\/j.specom.2003.10.002","volume":"42","author":"J Ramirez","year":"2004","unstructured":"Ramirez, J., Segura, J. C., Benitez, C., Torre, A., & Rubio, A. (2004). Efficient voice activity detection algorithms using long-term speech information. Speech Communications, 42(3\u20134), 271\u2013287.","journal-title":"Speech Communications"},{"key":"9777_CR20","doi-asserted-by":"publisher","first-page":"9017","DOI":"10.1109\/ACCESS.2018.2800728","volume":"6","author":"A Sehgal","year":"2018","unstructured":"Sehgal, A., & Kehtarnavaz, N. (2018). A convolutional neural network smartphone app for real-time voice activity detection. IEEE Access, 6, 9017\u20139026.","journal-title":"IEEE Access"},{"doi-asserted-by":"crossref","unstructured":"Silva, D. A., Stuchi, J. A., Violato, R. P. V., & Cuozzo, L. G. D. (2017). Exploring convolutional neural networks for voice activity detection. In Cognitive technologies. Cham: Springer.","key":"9777_CR21","DOI":"10.1007\/978-3-319-53753-5_4"},{"issue":"1","key":"9777_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/97.736233","volume":"6","author":"J Sohn","year":"1999","unstructured":"Sohn, J., Kim, N. S., & Sung, W. (1999). A statistical model-based voice activity detection. IEEE Signal Processing Letters, 6(1), 1\u20133.","journal-title":"IEEE Signal Processing Letters"},{"doi-asserted-by":"crossref","unstructured":"Tan, L. N., Borgstrom, B. J., & Alwan, A. (2010). Voice activity detection using harmonic frequency components in likelihood ratio test. In IEEE International conference on acoustics, speech, and signal processing (ICASSP).","key":"9777_CR23","DOI":"10.1109\/ICASSP.2010.5495611"},{"key":"9777_CR24","doi-asserted-by":"publisher","first-page":"3139","DOI":"10.1016\/j.compeleceng.2014.09.002","volume":"40","author":"Z Tan","year":"2014","unstructured":"Tan, Z., & Kraljevski, I. (2014). Joint variable frame rate and length analysis for speech recognition under adverse conditions. Computers & Electrical Engineering, 40, 3139\u20133149.","journal-title":"Computers & Electrical Engineering"},{"issue":"4","key":"9777_CR25","doi-asserted-by":"publisher","first-page":"697","DOI":"10.1109\/TASL.2012.2229986","volume":"21","author":"X-L Zhang","year":"2012","unstructured":"Zhang, X.-L., & Wu, J. (2012). Deep belief networks based voice activity detection. IEEE Transactions on Audio, Speech and Language Processing, 21(4), 697\u2013710.","journal-title":"IEEE Transactions on Audio, Speech and Language Processing"},{"key":"9777_CR26","doi-asserted-by":"publisher","first-page":"1007","DOI":"10.1007\/s10772-018-9555-0","volume":"21","author":"M Zoulikha","year":"2018","unstructured":"Zoulikha, M., & Djendi, M. (2018). A new robust forward BSS adaptive algorithm based on automatic voice activity detector for speech quality enhancement. International Journal of Speech Technology, 21, 1007\u20131020.","journal-title":"International Journal of Speech Technology"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-020-09777-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10772-020-09777-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-020-09777-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,4,14]],"date-time":"2021-04-14T18:45:26Z","timestamp":1618425926000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10772-020-09777-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,11,18]]},"references-count":26,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2021,3]]}},"alternative-id":["9777"],"URL":"https:\/\/doi.org\/10.1007\/s10772-020-09777-w","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"type":"print","value":"1381-2416"},{"type":"electronic","value":"1572-8110"}],"subject":[],"published":{"date-parts":[[2020,11,18]]},"assertion":[{"value":"31 December 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 November 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 November 2020","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}