{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T13:39:41Z","timestamp":1774532381507,"version":"3.50.1"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2022,6,25]],"date-time":"2022-06-25T00:00:00Z","timestamp":1656115200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,6,25]],"date-time":"2022-06-25T00:00:00Z","timestamp":1656115200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Circuits Syst Signal Process"],"published-print":{"date-parts":[[2022,11]]},"DOI":"10.1007\/s00034-022-02082-8","type":"journal-article","created":{"date-parts":[[2022,6,25]],"date-time":"2022-06-25T17:03:53Z","timestamp":1656176633000},"page":"6266-6294","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["A Novel Pitch Detection Algorithm Based on Instantaneous Frequency for Clean and Noisy Speech"],"prefix":"10.1007","volume":"41","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8929-3609","authenticated-orcid":false,"given":"Zied","family":"Mnasri","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3865-2613","authenticated-orcid":false,"given":"Stefano","family":"Rovetta","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6612-0932","authenticated-orcid":false,"given":"Francesco","family":"Masulli","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,6,25]]},"reference":[{"key":"2082_CR1","doi-asserted-by":"crossref","unstructured":"T. Abe, T. Kobayashi, S. Imai, Harmonics tracking and pitch extraction based on instantaneous frequency, in 1995 International Conference on Acoustics, Speech, and Signal Processing, IEEE, vol.\u00a01, pp. 756\u2013759 (1995)","DOI":"10.1109\/ICASSP.1995.479804"},{"key":"2082_CR2","doi-asserted-by":"crossref","unstructured":"T. Abe, T. Kobayashi, S . Imai, Robust pitch estimation with harmonics enhancement in noisy environments based on instantaneous frequency, in Proceeding of Fourth International Conference on Spoken Language Processing. ICSLP\u201996. IEEE, vol.\u00a02, pp. 1277\u20131280 (1996)","DOI":"10.21437\/ICSLP.1996-329"},{"key":"2082_CR3","unstructured":"Y. Agiomyrgiannaki, Yang: Yet-another-generalized vocoder. https:\/\/github.com\/google\/yang_vocoder\/, last accessed: 31-05-2022 (2017)"},{"key":"2082_CR4","unstructured":"E. Azarov, M. Vashkevich, A. Petrovsky, Instantaneous pitch estimation based on rapt framework, in 2012 Proceedings of the 20th European Signal Processing Conference (EUSIPCO). IEEE, pp. 2787\u20132791 (2012)"},{"key":"2082_CR5","doi-asserted-by":"crossref","unstructured":"H. Ba, N. Yang, I. Demirkol, W. Heinzelman, Bana: a hybrid approach for noise resilient pitch detection, in 2012 IEEE Statistical Signal Processing Workshop (SSP). IEEE, pp. 369\u2013372 (2012)","DOI":"10.1109\/SSP.2012.6319706"},{"issue":"4","key":"2082_CR6","doi-asserted-by":"publisher","first-page":"540","DOI":"10.1109\/5.135378","volume":"80","author":"B Boashash","year":"1992","unstructured":"B. Boashash, Estimating and interpreting the instantaneous frequency of a signal. II. Algorithms and applications. Proc. IEEE 80(4), 540\u2013568 (1992)","journal-title":"Proc. IEEE"},{"key":"2082_CR7","unstructured":"P. Boersma, D. Weenink, Praat: doing phonetics by computer. https:\/\/www.fon.hum.uva.nl\/praat\/, last accessed: 31-05-2022 (2006)"},{"issue":"3","key":"2082_CR8","doi-asserted-by":"publisher","first-page":"1638","DOI":"10.1121\/1.2951592","volume":"124","author":"A Camacho","year":"2008","unstructured":"A. Camacho, J.G. Harris, A sawtooth waveform inspired pitch estimator for speech and music. J. Acoust. Soc. Am. 124(3), 1638\u20131652 (2008)","journal-title":"J. Acoust. Soc. Am."},{"key":"2082_CR9","doi-asserted-by":"crossref","unstructured":"W. Chu, A. Alwan, Reducing f0 frame error of f0 tracking algorithms under noisy conditions with an unvoiced\/voiced classification frontend, in 2009 IEEE International Conference on Acoustics, Speech and Signal Processing. IEEE, pp. 3969\u20133972 (2009)","DOI":"10.1109\/ICASSP.2009.4960497"},{"issue":"4","key":"2082_CR10","doi-asserted-by":"publisher","first-page":"1917","DOI":"10.1121\/1.1458024","volume":"111","author":"A De Cheveign\u00e9","year":"2002","unstructured":"A. De Cheveign\u00e9, H. Kawahara, Yin, a fundamental frequency estimator for speech and music. J. Acoust. Soc. Am. 111(4), 1917\u20131930 (2002)","journal-title":"J. Acoust. Soc. Am."},{"key":"2082_CR11","unstructured":"A. De\u00a0Cheveign\u00e9, H. Kawahara, Yin algorithm. https:\/\/labrosa.ee.columbia.edu\/doc\/yin.html, last accessed: 31-05-2022 (2002)"},{"key":"2082_CR12","doi-asserted-by":"crossref","unstructured":"T. Drugman, A . Alwan, Joint robust voicing detection and pitch estimation based on residual harmonics, in Proceedings of the Interspeech 2011, Florence, Italy. IEEE, pp. 1973\u20131976 (2011)","DOI":"10.21437\/Interspeech.2011-519"},{"issue":"26","key":"2082_CR13","first-page":"429","volume":"93","author":"D Gabor","year":"1946","unstructured":"D. Gabor, Theory of communication. Part 1. The analysis of information. J. Inst. Electr. Eng. Part III Radio Commun. Eng. 93(26), 429\u2013441 (1946)","journal-title":"J. Inst. Electr. Eng. Part III Radio Commun. Eng."},{"issue":"2","key":"2082_CR14","doi-asserted-by":"publisher","first-page":"518","DOI":"10.1109\/TASLP.2013.2295918","volume":"22","author":"S Gonzalez","year":"2014","unstructured":"S. Gonzalez, M. Brookes, Pefac: a pitch estimation algorithm robust to high levels of noise. IEEE\/ACM Trans. Audio Speech Lang. Process. 22(2), 518\u2013530 (2014)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"2082_CR15","unstructured":"S.W. Group et\u00a0al., Speech signal processing toolkit (sptk) version 3.3, https:\/\/sourceforge.net\/projects\/sp-tk\/\/, last accessed: 31-05-2022 (2009)"},{"issue":"1","key":"2082_CR16","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1121\/1.396427","volume":"83","author":"DJ Hermes","year":"1988","unstructured":"D.J. Hermes, Measurement of pitch by subharmonic summation. J. Acoust. Soc. Am. 83(1), 257\u2013264 (1988)","journal-title":"J. Acoust. Soc. Am."},{"key":"2082_CR17","doi-asserted-by":"crossref","unstructured":"W. Hess, Manual and instrumental pitch determination, voicing determination, in Pitch Determination of Speech Signals. Springer, pp. 92\u2013151 (1983)","DOI":"10.1007\/978-3-642-81926-1_5"},{"issue":"4","key":"2082_CR18","doi-asserted-by":"publisher","first-page":"792","DOI":"10.1016\/j.sigpro.2005.06.011","volume":"86","author":"H Huang","year":"2006","unstructured":"H. Huang, J. Pan, Speech pitch determination based on Hilbert\u2013Huang transform. Signal Process. 86(4), 792\u2013803 (2006)","journal-title":"Signal Process."},{"issue":"1971","key":"2082_CR19","doi-asserted-by":"publisher","first-page":"903","DOI":"10.1098\/rspa.1998.0193","volume":"454","author":"NE Huang","year":"1998","unstructured":"N.E. Huang, Z. Shen, S.R. Long, M.C. Wu, H.H. Shih, Q. Zheng, N.C. Yen, C.C. Tung, H.H. Liu, The empirical mode decomposition and the Hilbert spectrum for nonlinear and non-stationary time series analysis. Proc. R. Soc. Lond. Ser. A Math. Phys. Eng. Sci. 454(1971), 903\u2013995 (1998)","journal-title":"Proc. R. Soc. Lond. Ser. A Math. Phys. Eng. Sci."},{"key":"2082_CR20","doi-asserted-by":"crossref","unstructured":"D. Jouvet, Y. Laprie, Performance analysis of several pitch detection algorithms on simulated and real noisy speech data, in 2017 25th European Signal Processing Conference (EUSIPCO). IEEE, pp. 1614\u20131618 (2017)","DOI":"10.23919\/EUSIPCO.2017.8081482"},{"issue":"2","key":"2082_CR21","doi-asserted-by":"publisher","first-page":"917","DOI":"10.1109\/18.119752","volume":"38","author":"S Kadambe","year":"1992","unstructured":"S. Kadambe, G.F. Boudreaux-Bartels, Application of the wavelet transform for pitch detection of speech signals. IEEE Trans. Inf. Theory 38(2), 917\u2013924 (1992)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"2082_CR22","doi-asserted-by":"crossref","unstructured":"H. Kawahara, Y. Agiomyrgiannakis, H. Zen, Using instantaneous frequency and aperiodicity detection to estimate f0 for high-quality speech synthesis, in 9th ISCA Speech Synthesis Workshop (SSW9), ISCA, pp. 221\u2013228 (2016)","DOI":"10.21437\/SSW.2016-36"},{"key":"2082_CR23","doi-asserted-by":"crossref","unstructured":"A. Kissling, R. Kompe, N. Niemann, A. Batliner, Dp-based determination of f0 contours from speech signals, in Acoustics, Speech, and Signal Processing, 1992. Proceedings. (ICASSP\u201992), IEEE, vol. 1, pp. 1\u20134 (1992)","DOI":"10.1109\/ICASSP.1992.226131"},{"issue":"1","key":"2082_CR24","doi-asserted-by":"publisher","first-page":"19","DOI":"10.12697\/ACUTM.2014.18.03","volume":"18","author":"E Liflyand","year":"2014","unstructured":"E. Liflyand, Interaction between the Fourier transform and the Hilbert transform. Acta et Commentationes Universitatis Tartuensis de Mathematica 18(1), 19\u201332 (2014)","journal-title":"Acta et Commentationes Universitatis Tartuensis de Mathematica"},{"key":"2082_CR25","unstructured":"Z. Mnasri, Proposed algorithm, https:\/\/github.com\/zied-mnasri\/f0_IF_model, last accessed: 31-05-2022 (2021)"},{"key":"2082_CR26","first-page":"23","volume-title":"Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2018","author":"Z Mnasri","year":"2018","unstructured":"Z. Mnasri, H. Amiri, On the relationship between instantaneous frequency and pitch in speech signals, in Studientexte zur Sprachkommunikation: Elektronische Sprachsignalverarbeitung 2018. ed. by A. Berton, U. Haiber, W. Minker (TUDpress, Dresden, 2018), pp. 23\u201329"},{"key":"2082_CR27","doi-asserted-by":"crossref","unstructured":"Z. Mnasri, S. Rovetta, F. Masulli, A novel pitch detection algorithm based on instantaneous frequency, in 2021 29th European Signal Processing Conference (EUSIPCO), IEEE, pp. 16\u201320 (2021). http:\/\/doi.org\/10.23919\/EUSIPCO54536.2021.9616047","DOI":"10.23919\/EUSIPCO54536.2021.9616047"},{"issue":"2","key":"2082_CR28","doi-asserted-by":"publisher","first-page":"293","DOI":"10.1121\/1.1910339","volume":"41","author":"AM Noll","year":"1967","unstructured":"A.M. Noll, Cepstrum pitch determination. J. Acoust. Soc. Am. 41(2), 293\u2013309 (1967)","journal-title":"J. Acoust. Soc. Am."},{"key":"2082_CR29","doi-asserted-by":"crossref","unstructured":"G. Pirker, M. Wohlmayr, S. Petrik, F. Pernkopf, A pitch tracking corpus with evaluation on multipitch tracking scenario, in Twelfth Annual Conference of the International Speech Communication Association. http:\/\/doi.org\/10.21437\/Interspeech.2011 (2011)","DOI":"10.21437\/Interspeech.2011-317"},{"issue":"23","key":"2082_CR30","first-page":"153","volume":"93","author":"B Van der Pol","year":"1946","unstructured":"B. Van der Pol, The fundamental principles of frequency modulation. J. Inst. Electr. Eng. Part III Radio Commun. Eng. 93(23), 153\u2013158 (1946)","journal-title":"J. Inst. Electr. Eng. Part III Radio Commun. Eng."},{"issue":"2","key":"2082_CR31","doi-asserted-by":"publisher","first-page":"233","DOI":"10.1016\/0165-1684(95)00027-B","volume":"44","author":"L Qiu","year":"1995","unstructured":"L. Qiu, H. Yang, S.N. Koh, Fundamental frequency determination based on instantaneous frequency estimation. Signal Process. 44(2), 233\u2013241 (1995)","journal-title":"Signal Process."},{"issue":"1","key":"2082_CR32","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1109\/TASSP.1977.1162905","volume":"25","author":"L Rabiner","year":"1977","unstructured":"L. Rabiner, On the use of autocorrelation analysis for pitch detection. IEEE Trans. Acoust. Speech Signal Process. 25(1), 24\u201333 (1977)","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"issue":"2","key":"2082_CR33","doi-asserted-by":"publisher","first-page":"772","DOI":"10.1007\/s00034-020-01496-6","volume":"40","author":"P Rengaswamy","year":"2021","unstructured":"P. Rengaswamy, K.S. Rao, P. Dasgupta, Songf0: a spectrum-based fundamental frequency estimation for monophonic songs. Circuits Syst. Signal Process. 40(2), 772\u2013797 (2021)","journal-title":"Circuits Syst. Signal Process."},{"issue":"5","key":"2082_CR34","doi-asserted-by":"publisher","first-page":"353","DOI":"10.1109\/TASSP.1974.1162598","volume":"22","author":"M Ross","year":"1974","unstructured":"M. Ross, H. Shaffer, A. Cohen, R. Freudberg, H. Manley, Average magnitude difference function pitch extractor. IEEE Trans. Acoust. Speech Signal Process. 22(5), 353\u2013362 (1974)","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"2082_CR35","doi-asserted-by":"crossref","unstructured":"S. Shimauchi, S. Kudo, Y. Koizumi, K. Furuya, On relationships between amplitude and phase of short-time Fourier transform, in 2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, pp. 676\u2013680 (2017)","DOI":"10.1109\/ICASSP.2017.7952241"},{"key":"2082_CR36","doi-asserted-by":"crossref","unstructured":"Y. Stylianou, Modeling speech based on harmonic plus noise models, in International School on Neural Networks, Initiated by IIASS and EMFCSC. (Springer, 2004), pp. 244\u2013260","DOI":"10.1007\/11520153_11"},{"issue":"4","key":"2082_CR37","doi-asserted-by":"publisher","first-page":"410","DOI":"10.1016\/j.jvoice.2014.09.016","volume":"29","author":"L Sukhostat","year":"2015","unstructured":"L. Sukhostat, Y. Imamverdiyev, A comparative analysis of pitch detection methods under the influence of different noise conditions. J. Voice 29(4), 410\u2013417 (2015)","journal-title":"J. Voice"},{"key":"2082_CR38","doi-asserted-by":"crossref","unstructured":"X. Sun, A pitch determination algorithm based on subharmonic-to-harmonic ratio, in Sixth International Conference on Spoken Language Processing (2000)","DOI":"10.21437\/ICSLP.2000-902"},{"key":"2082_CR39","unstructured":"X. Sun, Pitch determination algorithm. https:\/\/www.mathworks.com\/matlabcentral\/fileexchange\/1230-pitch-determination-algorithm, last accessed: 31-05-2022 (2002)"},{"issue":"1","key":"2082_CR40","doi-asserted-by":"publisher","first-page":"76","DOI":"10.1109\/TSA.2003.819950","volume":"12","author":"J Tabrikian","year":"2004","unstructured":"J. Tabrikian, S. Dubnov, Y. Dickalov, Maximum a-posteriori probability pitch tracking in noisy environments using harmonic model. IEEE Trans. Speech Audio Process. 12(1), 76\u201387 (2004)","journal-title":"IEEE Trans. Speech Audio Process."},{"key":"2082_CR41","first-page":"518","volume":"495","author":"D Talkin","year":"1995","unstructured":"D. Talkin, W.B. Kleijn, A robust algorithm for pitch tracking (rapt). Speech Coding Synth. 495, 518 (1995)","journal-title":"Speech Coding Synth."},{"issue":"7\u20138","key":"2082_CR42","doi-asserted-by":"publisher","first-page":"841","DOI":"10.1016\/j.specom.2013.03.001","volume":"55","author":"LN Tan","year":"2013","unstructured":"L.N. Tan, A. Alwan, Multi-band summary correlogram-based pitch detection for noisy speech. Speech Commun. 55(7\u20138), 841\u2013856 (2013)","journal-title":"Speech Commun."},{"issue":"1","key":"2082_CR43","first-page":"61","volume":"2","author":"J Ville","year":"1948","unstructured":"J. Ville, Theorie et application de la notion de signal analytique. C\u00e2bles et transmissions 2(1), 61\u201374 (1948)","journal-title":"C\u00e2bles et transmissions"},{"key":"2082_CR44","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1016\/j.eswa.2016.08.018","volume":"64","author":"K Wu","year":"2016","unstructured":"K. Wu, D. Zhang, G. Lu, Ipeeh: improving pitch estimation by enhancing harmonics. Expert Syst. Appl. 64, 317\u2013329 (2016)","journal-title":"Expert Syst. Appl."},{"issue":"6","key":"2082_CR45","doi-asserted-by":"publisher","first-page":"4559","DOI":"10.1121\/1.2916590","volume":"123","author":"SA Zahorian","year":"2008","unstructured":"S.A. Zahorian, H. Hu, A spectral\/temporal method for robust fundamental frequency tracking. J. Acoust. Soc. Am. 123(6), 4559\u20134571 (2008)","journal-title":"J. Acoust. Soc. Am."}],"container-title":["Circuits, Systems, and Signal Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-022-02082-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00034-022-02082-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00034-022-02082-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,27]],"date-time":"2024-09-27T20:25:58Z","timestamp":1727468758000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00034-022-02082-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,6,25]]},"references-count":45,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2022,11]]}},"alternative-id":["2082"],"URL":"https:\/\/doi.org\/10.1007\/s00034-022-02082-8","relation":{},"ISSN":["0278-081X","1531-5878"],"issn-type":[{"value":"0278-081X","type":"print"},{"value":"1531-5878","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,6,25]]},"assertion":[{"value":"20 May 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"31 May 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 June 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 June 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}