{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,20]],"date-time":"2025-10-20T10:20:37Z","timestamp":1760955637368,"version":"3.37.3"},"reference-count":22,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2016,7,7]],"date-time":"2016-07-07T00:00:00Z","timestamp":1467849600000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"DOI":"10.13039\/501100001809","name":"the National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["61370034","61403224"],"award-info":[{"award-number":["61370034","61403224"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J AUDIO SPEECH MUSIC PROC."],"published-print":{"date-parts":[[2016,12]]},"DOI":"10.1186\/s13636-016-0092-y","type":"journal-article","created":{"date-parts":[[2016,7,7]],"date-time":"2016-07-07T07:18:54Z","timestamp":1467875934000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Voice activity detection algorithm based on long-term pitch information"],"prefix":"10.1186","volume":"2016","author":[{"given":"Xu-Kui","family":"Yang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Liang","family":"He","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dan","family":"Qu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wei-Qiang","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2016,7,7]]},"reference":[{"issue":"2","key":"92_CR1","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1002\/j.1538-7305.1975.tb02840.x","volume":"54","author":"LR Rabiner","year":"1975","unstructured":"LR Rabiner, MR Sambur, An algorithm for determining the endpoints of isolated utterances. The Bell System Technical Journal 54(2), 297\u2013315 (1975)","journal-title":"The Bell System Technical Journal"},{"issue":"3","key":"92_CR2","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TASL.2010.2052803","volume":"19","author":"PK Ghosh","year":"2011","unstructured":"PK Ghosh, A Tsiartas, S Narayanan, Robust voice activity detection using long-term signal variability. IEEE Transactions on Audio, Speech and Language Processing 19(3), 600\u2013613 (2011)","journal-title":"IEEE Transactions on Audio, Speech and Language Processing"},{"key":"92_CR3","volume-title":"Sparse power spectrum based robust voice activity detector","author":"Y Datao","year":"2012","unstructured":"Y Datao, H Jiqing, Z Guibin, Z Tieran, Sparse power spectrum based robust voice activity detector (IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), Kyoto, 2012)"},{"key":"92_CR4","unstructured":"W Hongzhi, X Yuchao, L Meijing, Study on the MFCC similarity-based voice activity detection algorithm (International Conference on Artificial Intelligence, Management Science and Electronic Commerce (AIMSEC), 2011)"},{"key":"92_CR5","first-page":"709","volume-title":"All for one: feature combination for highly channel-degraded speech activity detection","author":"G Martin","year":"2013","unstructured":"G Martin, A Abeer, E Dan et al., All for one: feature combination for highly channel-degraded speech activity detection (INTERSPEECH, Lyon, 2013), pp. 709\u2013713"},{"key":"92_CR6","doi-asserted-by":"crossref","unstructured":"T Kristjansson, S Deligne, P Olsen, Voicing features for robust speech detection (INTERSPEECH, 2005), pp. 369\u2013372","DOI":"10.21437\/Interspeech.2005-186"},{"key":"92_CR7","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1109\/89.759042","volume":"7","author":"S Ahmadi","year":"1999","unstructured":"S Ahmadi, AS Spanias, Cepstrum-based pitch detection using a new statistical V\/UV classification algorithm. IEEE Transactions on Speech Audio Processing 7, 333\u2013338 (1999)","journal-title":"IEEE Transactions on Speech Audio Processing"},{"key":"92_CR8","doi-asserted-by":"publisher","first-page":"762","DOI":"10.1109\/TSA.2005.851909","volume":"13","author":"BF Wu","year":"2005","unstructured":"BF Wu, KC Wang, Robust endpoint detection algorithm based on the adaptive band partitioning spectral entropy in adverse environments. IEEE Transactions Speech Audio Processing 13, 762\u2013775 (2005)","journal-title":"IEEE Transactions Speech Audio Processing"},{"key":"92_CR9","doi-asserted-by":"crossref","unstructured":"Z Tuske, P Mihajlik, Z Tobler, T Fegyo, Robust voice activity detection based on the entropy of noise-suppressed spectrum (INTERSPEECH, 2005)","DOI":"10.21437\/Interspeech.2005-119"},{"key":"92_CR10","doi-asserted-by":"crossref","unstructured":"L. N. Tan, B. J. Borgstrom, and A. Alwan, Voice activity detection using harmonic frequency components in likelihood ratio test (IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), 2010)","DOI":"10.1109\/ICASSP.2010.5495611"},{"issue":"3\u20134","key":"92_CR11","doi-asserted-by":"publisher","first-page":"271","DOI":"10.1016\/j.specom.2003.10.002","volume":"42","author":"J Ramirez","year":"2004","unstructured":"J Ramirez, JC Segura, C Benitez, A de la Torre, A Rubio, Efficient voice activity detection algorithms using long-term speech information. Speech Communication 42(3\u20134), 271\u2013287 (2004)","journal-title":"Speech Communication"},{"issue":"1","key":"92_CR12","doi-asserted-by":"publisher","first-page":"96","DOI":"10.1016\/j.specom.2005.08.002","volume":"48","author":"K Manohar","year":"2006","unstructured":"K Manohar, P Rao, Speech enhancement in nonstationary noise environments using noise properties. Speech Communication 48(1), 96\u2013109 (2006)","journal-title":"Speech Communication"},{"key":"92_CR13","doi-asserted-by":"publisher","unstructured":"M Muller, Information retrieval for music and motion (Springer Verlag, 2007)","DOI":"10.1007\/978-3-540-74048-3"},{"key":"92_CR14","unstructured":"M Meinard, E Sebastian, Chroma Toolbox: MATLAB implementations for extracting variants of chroma-based audio features, in Proceedings of the 12th International Conference on Music Information Retrieval (ISMIR) (2011)"},{"issue":"1","key":"92_CR15","doi-asserted-by":"publisher","first-page":"96","DOI":"10.1109\/TMM.2004.840597","volume":"7","author":"MA Bartsch","year":"2005","unstructured":"MA Bartsch, GH Wakefield, Audio thumbnailing of popular music using chroma-based representations. IEEE Transactions on Multimedia 7(1), 96\u2013104 (2005)","journal-title":"IEEE Transactions on Multimedia"},{"key":"92_CR16","unstructured":"EH Berger, LH Royster, DP Driscoll, JD Royster, M Layne, The Noise Manual, 5th edn. (American Industrial Hygiene Association, 2003)"},{"key":"92_CR17","volume-title":"\u201cThe effect of bandwidth on speech intelligibility\u201d, White paper","author":"J Rodman","year":"2003","unstructured":"J Rodman, \u201cThe effect of bandwidth on speech intelligibility\u201d, White paper (POLYCOM Inc., USA, 2003)"},{"issue":"4","key":"92_CR18","doi-asserted-by":"publisher","first-page":"1383","DOI":"10.1109\/TASL.2011.2180896","volume":"20","author":"T Gerkmann","year":"2012","unstructured":"T Gerkmann, RC Hendriks, Unbiased MMSE-based noise power estimation with low complexity and low tracking delay. IEEE Transactions on Audio, Speech and Language Processing 20(4), 1383\u20131393 (2012)","journal-title":"IEEE Transactions on Audio, Speech and Language Processing"},{"key":"92_CR19","doi-asserted-by":"crossref","unstructured":"JS Garofolo, LF Lamel, WM Fisher et al., DARPA TIMIT acoustic phonetic continuous speech corpus CDROM (NIST, 1993)","DOI":"10.6028\/NIST.IR.4930"},{"issue":"3","key":"92_CR20","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1016\/0167-6393(93)90095-3","volume":"12","author":"A Varga","year":"1993","unstructured":"A Varga, HJM Steeneken, Assessment for automatic speech recognition: Ii. NOISEX-92: a database and an experiment to study the effect of additive noise on speech recognition systems. Speech Communication 12(3), 247\u2013251 (1993)","journal-title":"Speech Communication"},{"issue":"1","key":"92_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/97.736233","volume":"6","author":"J Sohn","year":"1999","unstructured":"J Sohn, NS Kim, W Sung, A statistical model-based voice activity detection. IEEE Signal Processing Letter 6(1), 1\u20133 (1999)","journal-title":"IEEE Signal Processing Letter"},{"key":"92_CR22","doi-asserted-by":"crossref","unstructured":"M Yanna, A Nishihara, Efficient voice activity detection algorithm using long-term spectral flatness measure. EURASIP Journal on Audio, Speech and Music Processing, 21 (2013)","DOI":"10.1186\/1687-4722-2013-21"}],"container-title":["EURASIP Journal on Audio, Speech, and Music Processing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13636-016-0092-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13636-016-0092-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13636-016-0092-y","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13636-016-0092-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,2]],"date-time":"2022-07-02T20:26:56Z","timestamp":1656793616000},"score":1,"resource":{"primary":{"URL":"https:\/\/asmp-eurasipjournals.springeropen.com\/articles\/10.1186\/s13636-016-0092-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,7,7]]},"references-count":22,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2016,12]]}},"alternative-id":["92"],"URL":"https:\/\/doi.org\/10.1186\/s13636-016-0092-y","relation":{},"ISSN":["1687-4722"],"issn-type":[{"type":"electronic","value":"1687-4722"}],"subject":[],"published":{"date-parts":[[2016,7,7]]},"article-number":"14"}}