{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,5]],"date-time":"2025-05-05T20:10:01Z","timestamp":1746475801641,"version":"3.40.4"},"publisher-location":"Cham","reference-count":24,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319120683"},{"type":"electronic","value":"9783319120690"}],"license":[{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-12069-0_23","type":"book-chapter","created":{"date-parts":[[2014,10,29]],"date-time":"2014-10-29T12:19:33Z","timestamp":1414585173000},"page":"317-329","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A Review of Voice Activity Detection Techniques for On-Device Isolated Digit Recognition on Mobile Devices"],"prefix":"10.1007","author":[{"given":"M. K.","family":"Mustafa","sequence":"first","affiliation":[]},{"given":"Tony","family":"Allen","sequence":"additional","affiliation":[]},{"given":"Lindsay","family":"Evett","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2014,10,30]]},"reference":[{"key":"23_CR1","doi-asserted-by":"crossref","unstructured":"Huggins-Daines, D., Kumar, M., Chan, A., Black, A.W., Ravishankar, M., Rudnicky, A.I.: Pocketsphinx: A free, real-time continuous speech recognition system for hand-held devices. In: Proceedings of IEEE International Conference on Acoustics, Speech and Signal Processing 2006, ICASSP 2006, vol. 1, pp. I\u2013I. IEEE (2006)","DOI":"10.1109\/ICASSP.2006.1659988"},{"key":"23_CR2","unstructured":"Ali, S.A., Haider, N.G., Pathan, M.K.: A LPC-PEV based VAD for word boundary detection. Int. J. Electr. Comput. Sci. 12(02) (2012)"},{"key":"23_CR3","doi-asserted-by":"crossref","unstructured":"Cournapeau, D., Kawahara, T., Mase, K., Toriyama, T.: Voice activity detector based on enhanced cumulant of IPC residual and on-line EM algorithm. In: Proceedings of INTERSPEECH06 (2006)","DOI":"10.21437\/Interspeech.2006-363"},{"key":"23_CR4","unstructured":"Wu, B., Wang, K.: Voice activity detection based on auto-correlation function using wavelet transform and teager energy operator. Comput. Linguist. Chin. Lang. Process. 11, 87\u2013100 (2006)"},{"key":"23_CR5","unstructured":"Enqing, D., Guizhong, L., Yatong, Z., Yu, C.: Voice activity detection based on short-time energy and noise spectrum adaptation. In: 6th International Conference on Signal Processing, vol. 1, pp. 464\u2013467. IEEE (2002)"},{"key":"23_CR6","doi-asserted-by":"crossref","unstructured":"Rabiner, L.R., Sambur, M.R.: An algorithm for determining the endpoints of isolated utterances. Bell Syst. Techn. J. 54, 297\u2013315 (1975)","DOI":"10.1002\/j.1538-7305.1975.tb02840.x"},{"key":"23_CR7","doi-asserted-by":"publisher","unstructured":"Tashan, T., Allen, T., Nolle, L.: Speaker verification using heterogeneous neural network architecture with linear correlation speech activity detection. Expert Syst. (2013). doi:10.1111\/exsy.12030","DOI":"10.1111\/exsy.12030"},{"key":"23_CR8","doi-asserted-by":"crossref","unstructured":"Huang, H., Lin, F.: A speech feature extraction method using complexity measure for voice activity detection in WGN. Speech Commun. 51, 714\u2013723 (2009)","DOI":"10.1016\/j.specom.2009.02.004"},{"key":"23_CR9","doi-asserted-by":"crossref","unstructured":"Ghaemmaghami, H., Baker, B.J., Vogt, R.J., Sridharan, S.: Noise robust voice activity detection using features extracted from the time-domain autocorrelation function. In: Proceedings of Interspeech 2010","DOI":"10.21437\/Interspeech.2010-776"},{"key":"23_CR10","unstructured":"Plannerer, B.: An introduction to speech recognition. Munich (2005)"},{"key":"23_CR11","unstructured":"Rabiner, L.R., Schafer, R.W.: Digital processing of speech signals. In: IET (1979)"},{"key":"23_CR12","unstructured":"Kesarkar, M.: Feature extraction for speech recognition. Electronic Systems, Department of Electrical Engineering, IIT Bombay (2003)"},{"key":"23_CR13","unstructured":"Rabiner, L., Juang, B.: Fundamentals of speech recognition (1993)"},{"key":"23_CR14","doi-asserted-by":"crossref","unstructured":"Zheng, F., Zhang, G., Song, Z.: Comparison of different implementations of MFCC. J. Comput. Sci. Technol. 16, 582\u2013589 (2001)","DOI":"10.1007\/BF02943243"},{"key":"23_CR15","doi-asserted-by":"crossref","unstructured":"Waheed, K., Weaver, K., Salam, F.M.: A robust algorithm for detecting speech segments using an entropic contrast. In: 45th Midwest Symposium on Circuits and Systems, 2002, MWSCAS-2002, vol. 3, pp. III-328\u2013III-331. IEEE (2002)","DOI":"10.1109\/MWSCAS.2002.1187039"},{"key":"23_CR16","doi-asserted-by":"crossref","unstructured":"Vaidyanathan, P.: The theory of linear prediction. Synth. Lect. Signal Process. 2, 1\u2013184 (2007)","DOI":"10.2200\/S00086ED1V01Y200712SPR03"},{"key":"23_CR17","unstructured":"Jones, D.L., Appadwedula, S., Berry, M., Haun, M., Janovetz, J., Kramer, M., Moussa, D., Sachs, D., Wade, B.: Speech processing: theory of LPC analysis and synthesis (2009)"},{"key":"23_CR18","unstructured":"Hachkar, Z., Mounir, B., Farchi, A., El Abbadi, J.: Comparison of MFCC and PLP parameterization in pattern recognition of Arabic alphabet speech. Can. J. Artif. Intell. Mach. Learn. Pattern Recognit. 2, 56\u201360 (2011)"},{"key":"23_CR19","unstructured":"Tashan, T.: Biologically inspired speaker verification. Submitted to Nottingham Trent University (2012)"},{"key":"23_CR20","doi-asserted-by":"crossref","unstructured":"Cooley, J.W., Tukey, J.W.: An algorithm for the machine calculation of complex Fourier series. Math. Comput. 19, 297\u2013301 (1965)","DOI":"10.1090\/S0025-5718-1965-0178586-1"},{"key":"23_CR21","unstructured":"CSLU Database: Available at http:\/\/www.cslu.ogi.edu\/corpora\/isolet\/"},{"key":"23_CR22","doi-asserted-by":"crossref","unstructured":"Wilpon, J., Rabiner, L.: A modified K-means clustering algorithm for use in isolated work recognition. Acoust. Speech Signal Process. IEEE Trans. 33, 587\u2013594 (1985)","DOI":"10.1109\/TASSP.1985.1164581"},{"key":"23_CR23","unstructured":"Looney, C.G.: A fuzzy clustering and fuzzy merging algorithm. CS791q Class notes (1999)"},{"key":"23_CR24","unstructured":"A Tutorial on Clustering Algorithms: Available Online at http:\/\/home.deib.polimi.it\/matteucc\/Clustering\/tutorial_html\/kmeans.html"}],"container-title":["Research and Development in Intelligent Systems XXXI"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-12069-0_23","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,5]],"date-time":"2025-05-05T19:38:48Z","timestamp":1746473928000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-12069-0_23"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319120683","9783319120690"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-12069-0_23","relation":{},"subject":[],"published":{"date-parts":[[2014]]},"assertion":[{"value":"30 October 2014","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}