{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,26]],"date-time":"2025-06-26T04:09:33Z","timestamp":1750910973923,"version":"3.41.0"},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2017,9,19]],"date-time":"2017-09-19T00:00:00Z","timestamp":1505779200000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1007\/s10772-017-9459-4","type":"journal-article","created":{"date-parts":[[2017,9,19]],"date-time":"2017-09-19T06:34:02Z","timestamp":1505802842000},"page":"907-917","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Pitch segmentation of speech signals based on short-time energy waveform"],"prefix":"10.1007","volume":"20","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-1138-5888","authenticated-orcid":false,"given":"Sopon","family":"Wiriyarattanakul","sequence":"first","affiliation":[]},{"given":"Nawapak","family":"Eua-anant","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,9,19]]},"reference":[{"key":"9459_CR1","unstructured":"Bereksi-Reguig, F., & Taouli, S. A. (2013). ECG signal denoising by morphological top-hat transform. Global Journal of Computer Science and Technology, 13(5)."},{"issue":"1","key":"9459_CR2","doi-asserted-by":"crossref","first-page":"93","DOI":"10.3844\/ajassp.2012.93.102","volume":"9","author":"Antonios","year":"2012","unstructured":"Antonios (2012). An improved time domain pitch detection algorithm for pathological voice. American Journal of Applied Sciences, 9(1), 93\u2013102.","journal-title":"American Journal of Applied Sciences"},{"issue":"1","key":"9459_CR3","first-page":"50","volume":"1","author":"K Chamnongthai","year":"2005","unstructured":"Chamnongthai, K., Pichitwong, W., & Ayudhya,N. P. (2005). Final consonant segmentation for Thai syllable by using vowel characteristics and wavelet packet transform. ECTI-CIT Transactions on Communications and Information Technology, 1(1), 50\u201362.","journal-title":"ECTI-CIT Transactions on Communications and Information Technology"},{"key":"9459_CR4","doi-asserted-by":"crossref","first-page":"1917","DOI":"10.1121\/1.1458024","volume":"111","author":"A Cheveigneb de","year":"2002","unstructured":"de Cheveigneb, A., & Kawahara, H. (2002). Yin, a fundamental frequency estimator for speech and music. The Journal of the Acoustical Society of America, 111, 1917\u20131930.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"6","key":"9459_CR5","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1016\/j.jvoice.2015.11.016","volume":"30","author":"DA Eddins","year":"2016","unstructured":"Eddins, D. A., Anand, S., Camacho, A., & Shrivastav, R. (2016). Modeling of breathy voice quality using pitch-strength estimates. Journal of Voice, 30(6), 43\u201352.","journal-title":"Journal of Voice"},{"key":"9459_CR6","unstructured":"Gerhard, D. (2002). Pitch extraction and fundamental frequency: History and current techniques. Technical Report TR-CS."},{"key":"9459_CR7","doi-asserted-by":"crossref","unstructured":"Ghahremani, P., BabaAli, B., Povey, D., Riedhammer, K., Trmal, J., & Khudanpur, S. (2014). A pitch extraction algorithm tuned for automatic speech recognition. In IEEE international conference on acoustics, speech and signal processing (ICASSP) (pp.\u00a02494\u20132498).","DOI":"10.1109\/ICASSP.2014.6854049"},{"key":"9459_CR8","doi-asserted-by":"crossref","unstructured":"Huang, Q., Wang, D., & Lu, Y. (2009) Single channel speech enhancement based on prominent pitch estimation. In IET international communication conference on wireless mobile and computing (CCWMC) (pp.\u00a0205\u2013208).","DOI":"10.1049\/cp.2009.1926"},{"key":"9459_CR9","unstructured":"Hui, L., Dai, B.-Q., & Wei, L. (2006). A pitch detection algorithm based on AMDF and ACF. In IEEE international conference on acoustics speech and signal processing proceedings (Vol. 1)."},{"key":"9459_CR10","doi-asserted-by":"crossref","unstructured":"Hunt, M., & Lefebvre, C. (1987). Speech recognition using an auditory model with pitch-synchronous analysis. In IEEE international conference on acoustics, speech, and signal processing (ICASSP) (Vol. 12, pp. 813\u2013816).","DOI":"10.1109\/ICASSP.1987.1169585"},{"key":"9459_CR11","unstructured":"Hyun, K. H., Kim, E. H., & Kwak, Y. K. (2005). Improvement of emotion recognition by Bayesian classifier using non-zero-pitch concept. In IEEE international workshop on robot and human interactive communication (pp.\u00a0312\u2013316)."},{"key":"9459_CR12","doi-asserted-by":"crossref","unstructured":"Jdira, M. B., Jem\u00e2a, I., & Ouni, K. (2014). Speaker recognition system based on pitch estimation. In International conference on electrical sciences and technologies (CISTEM) (pp.\u00a01\u20135).","DOI":"10.1109\/CISTEM.2014.7076752"},{"key":"9459_CR13","doi-asserted-by":"crossref","unstructured":"Kammoun, M., & Ellouze, N. (2006) Pitch and energy contribution in emotion and speaking styles recognition enhancement. In IMACS multiconference on computational engineering in systems applications (Vol. 1, pp.\u00a097\u2013100).","DOI":"10.1109\/CESA.2006.4281631"},{"key":"9459_CR14","doi-asserted-by":"crossref","unstructured":"Khulage, A. A. (2012). Extraction of pitch, duration and formant frequencies for emotion recognition system. In Communication and computing (ARTCom2012) (pp.\u00a07\u20139).","DOI":"10.1049\/cp.2012.2482"},{"key":"9459_CR15","doi-asserted-by":"crossref","unstructured":"Kim, S., Eriksson, T., Kang, H.-G., & Youn, D. H. (2004). A pitch synchronous feature extraction method for speaker recognition. In IEEE international conference on acoustics, speech, and signal processing, 2004. Proceedings (ICASSP\u201904) (Vol. 1, p.\u00a0I-405-8).","DOI":"10.1109\/ICASSP.2004.1326008"},{"key":"9459_CR16","doi-asserted-by":"crossref","unstructured":"Krishnakumar, S., Kumar, K. R. P., & Balakrishnan, N. (2003). Pitch maxima for robust speaker recognition. In IEEE international conference on acoustics, speech, and signal processing (ICASSP) (Vol. 2, p.\u00a0II-201-4).","DOI":"10.1109\/ICASSP.2003.1202329"},{"key":"9459_CR17","doi-asserted-by":"crossref","unstructured":"Li, D., Yang, Y., & Huang, T. (2009). Pitch envelope based frame level score reweighed algorithm for emotion robust speaker recognition. In 2009 3rd international conference on affective computing and intelligent interaction and workshops (pp.\u00a01\u20134).","DOI":"10.1109\/ACII.2009.5349589"},{"key":"9459_CR18","unstructured":"McLaughlin, S., Leith, D., & Mann, I. (2002). Using Gaussian processes to synthesize voiced speech with natural pitch variations. In International conference on digital signal processing."},{"key":"9459_CR19","doi-asserted-by":"crossref","first-page":"13","DOI":"10.1016\/S1319-1578(10)80002-3","volume":"22","author":"G Muhammad","year":"2010","unstructured":"Muhammad, G. (2010). Noise-robust pitch detection using auto-correlation function with enhancements. Journal of King Saud University Computer and Information Sciences, 22, 13\u201328.","journal-title":"Journal of King Saud University Computer and Information Sciences"},{"issue":"6","key":"9459_CR20","doi-asserted-by":"crossref","first-page":"595","DOI":"10.1366\/000370210791414281","volume":"64","author":"R Perez-Pueyo","year":"2010","unstructured":"Perez-Pueyo, R., Soneira, M. J., & Ruiz-Moreno, S. (2010). Morphology-based automated baseline removal for Raman spectra of artistic pigments. Applied Spectroscopy, 64(6), 595\u2013600.","journal-title":"Applied Spectroscopy"},{"key":"9459_CR21","doi-asserted-by":"crossref","unstructured":"Qiang, H., & Youwei, Z. (1998). On prefiltering and endpoint detection of speech signal. In International conference on signal processing proceedings (Vol. 1, pp. 749\u2013752).","DOI":"10.1109\/ICOSP.1998.770320"},{"issue":"1","key":"9459_CR22","doi-asserted-by":"crossref","first-page":"24","DOI":"10.1109\/TASSP.1977.1162905","volume":"25","author":"L Rabiner","year":"1977","unstructured":"Rabiner, L. (1977). On the use of autocorrelation analysis for pitch detection. IEEE Transactions on Acoustics, Speech and Signal Processing, 25(1), 24\u201333.","journal-title":"IEEE Transactions on Acoustics, Speech and Signal Processing"},{"issue":"2","key":"9459_CR23","doi-asserted-by":"crossref","first-page":"297","DOI":"10.1002\/j.1538-7305.1975.tb02840.x","volume":"54","author":"LR Rabiner","year":"1975","unstructured":"Rabiner, L. R., & Sambur, M. R. (1975). An algorithm for determining the endpoints of isolated utterances. Bell System Technical Journal, 54(2), 297\u2013315.","journal-title":"Bell System Technical Journal"},{"key":"9459_CR24","doi-asserted-by":"crossref","unstructured":"Ramalho, M. A., & Mammone, R. J. (1993). New speech enhancement techniques using the pitch mode modulation model. In Proceedings of the 36th midwest symposium on circuits and systems (Vol. 2, pp.\u00a01531\u20131534).","DOI":"10.1109\/MWSCAS.1993.343407"},{"key":"9459_CR25","doi-asserted-by":"crossref","unstructured":"Ru-Wei, L., Long-Tao, C., & Yang, L. (2013). Pitch detection method for noisy speech signals based on wavelet transform and autocorrelation function. In Ninth international conference on intelligent information hiding and multimedia signal processing (pp.\u00a0153\u2013156).","DOI":"10.1109\/IIH-MSP.2013.47"},{"issue":"3","key":"9459_CR26","first-page":"197","volume":"6","author":"T Shimamura","year":"2010","unstructured":"Shimamura, T. (2010). An efficient pitch estimation method using windowless and normalized autocorrelation functions in noisy environments. ResearchGate, 6(3), 197\u2013204.","journal-title":"ResearchGate"},{"issue":"7","key":"9459_CR27","doi-asserted-by":"crossref","first-page":"727","DOI":"10.1109\/89.952490","volume":"9","author":"T Shimamura","year":"2001","unstructured":"Shimamura, T., & Kobayashi, H. (2001). Weighted autocorrelation for pitch extraction of noisy speech. IEEE Transactions Speech and Audio Processing, 9(7), 727\u2013730.","journal-title":"IEEE Transactions Speech and Audio Processing"},{"key":"9459_CR28","doi-asserted-by":"crossref","unstructured":"Stephenson, T. A., Escofet, J., Magimai-Doss, M., & Bourlard, H. (2002). Dynamic Bayesian network based speech recognition with pitch and energy as auxiliary variables. In Proceedings 12th IEEE workshop on neural networks for signal processing (pp.\u00a0637\u2013646).","DOI":"10.1109\/NNSP.2002.1030075"},{"issue":"6","key":"9459_CR29","doi-asserted-by":"crossref","first-page":"465","DOI":"10.1016\/S0010-4825(02)00034-3","volume":"32","author":"Y Sun","year":"2002","unstructured":"Sun, Y., Chan, K. L., & Krishnan, S. M. (2002). ECG signal conditioning by morphological filtering. Computers in Biology and Medicine, 32(6), 465\u2013479.","journal-title":"Computers in Biology and Medicine"},{"key":"9459_CR30","doi-asserted-by":"crossref","unstructured":"Swee, T. T., Salleh, S. H. S., & Jamaludin, M. R. (2010). Speech pitch detection using short-time energy. In International conference on computer and communication engineering (ICCCE) (pp.\u00a01\u20136).","DOI":"10.1109\/ICCCE.2010.5556836"},{"key":"9459_CR31","doi-asserted-by":"crossref","unstructured":"Tabrikian, J., Dubnov, S., & Dickalov, Y. (2002). Speech enhancement by harmonic modeling via map pitch tracking. In IEEE international conference on acoustics, speech, and signal processing (ICASSP) (Vol. 1, pp. I-549\u2013I-552).","DOI":"10.1109\/ICASSP.2002.1005798"},{"issue":"10","key":"9459_CR32","doi-asserted-by":"crossref","first-page":"2006","DOI":"10.1109\/TASL.2013.2263803","volume":"21","author":"YB Wang","year":"2006","unstructured":"Wang, Y. B., Li, S. W., & s Lee, L. (2006). An experimental analysis on integrating multi-stream spectro-temporal, cepstral and pitch information for mandarin speech recognition. IEEE Transactions on Audio, Speech, and Language Processing, 21(10), 2006\u20132014.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"9459_CR33","doi-asserted-by":"crossref","unstructured":"Xu, X., Zhang, T. Q, Shi, S., & Zhang, Y. (2014). An improved pitch detection of speech combined with speech enhancement. In 7th international congress on image and signal processing (CISP) (pp.\u00a0778\u2013782).","DOI":"10.1109\/CISP.2014.7003882"},{"key":"9459_CR34","doi-asserted-by":"crossref","unstructured":"Zhu, J., Sun, S., Liu, X., & Lei, B. (2009). Pitch in speaker recognition. In Ninth international conference on hybrid intelligent systems (Vol. 1, pp.\u00a033\u201336).","DOI":"10.1109\/HIS.2009.14"},{"issue":"2","key":"9459_CR35","doi-asserted-by":"crossref","first-page":"467","DOI":"10.1109\/TSA.2005.857809","volume":"14","author":"RD Zilca","year":"2006","unstructured":"Zilca, R. D., Kingsbury, B., Navratil, J., & Ramaswamy, G. N. (2006). Pseudo pitch synchronous analysis of speech with applications to speaker recognition. IEEE Transactions on Audio, Speech, and Language Processing, 14(2), 467\u2013478.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10772-017-9459-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-017-9459-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-017-9459-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,25]],"date-time":"2025-06-25T20:12:37Z","timestamp":1750882357000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10772-017-9459-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,9,19]]},"references-count":35,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["9459"],"URL":"https:\/\/doi.org\/10.1007\/s10772-017-9459-4","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"type":"print","value":"1381-2416"},{"type":"electronic","value":"1572-8110"}],"subject":[],"published":{"date-parts":[[2017,9,19]]}}}