{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,30]],"date-time":"2025-12-30T03:42:01Z","timestamp":1767066121734,"version":"3.37.3"},"reference-count":89,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2023,3,18]],"date-time":"2023-03-18T00:00:00Z","timestamp":1679097600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,3,18]],"date-time":"2023-03-18T00:00:00Z","timestamp":1679097600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2023,7]]},"DOI":"10.1007\/s10772-023-10028-x","type":"journal-article","created":{"date-parts":[[2023,3,18]],"date-time":"2023-03-18T17:02:35Z","timestamp":1679158955000},"page":"417-432","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Linguistic analysis for emotion recognition: a case of Chinese speakers"],"prefix":"10.1007","volume":"26","author":[{"given":"Carlo","family":"Schirru","sequence":"first","affiliation":[]},{"given":"Shahla","family":"Simin","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0713-6261","authenticated-orcid":false,"given":"Paolo","family":"Mengoni","sequence":"additional","affiliation":[]},{"given":"Alfredo","family":"Milani","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,3,18]]},"reference":[{"key":"10028_CR1","doi-asserted-by":"crossref","unstructured":"Adams, C., & Munro, R. R. (1978). In search of the acoustic correlates of stress: Fundamental frequency, amplitude, and duration in the connected utterance of some native and non-native speakers of English. Phonetica, 35(3), 125\u2013156.","DOI":"10.1159\/000259926"},{"key":"10028_CR2","doi-asserted-by":"crossref","unstructured":"Ak\u00e7ay, M. B., & Og\u0306uz, K. (2020). Speech emotion recognition: Emotional models, databases, features, preprocessing methods, supporting modalities, and classifiers. Speech Communications, 116, 56\u201376.","DOI":"10.1016\/j.specom.2019.12.001"},{"issue":"2","key":"10028_CR3","doi-asserted-by":"crossref","first-page":"886","DOI":"10.1121\/1.1852549","volume":"117","author":"PF Assmann","year":"2005","unstructured":"Assmann, P. F., & Katz, W. F. (2005). Synthesis fidelity and time-varying spectral change in vowels. Journal of the Acoustical Society of America, 117(2), 886\u2013895.","journal-title":"Journal of the Acoustical Society of America"},{"key":"10028_CR4","doi-asserted-by":"publisher","unstructured":"Beckman, M. E. (2012). Stress and non-stress accent. De Gruyter Mouton. https:\/\/doi.org\/10.1515\/9783110874020","DOI":"10.1515\/9783110874020"},{"issue":"1","key":"10028_CR6","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s00221-005-0254-0","volume":"171","author":"C Biele","year":"2006","unstructured":"Biele, C., & Grabowska, A. (2006). Sex differences in perception of emotion intensity in dynamic and static facial expressions. Experimental Brain Research, 171(1), 1\u20136.","journal-title":"Experimental Brain Research"},{"issue":"9","key":"10028_CR7","first-page":"341","volume":"5","author":"P Boersma","year":"2001","unstructured":"Boersma, P. (2001). Praat, a system for doing phonetics by computer. Glot International, 5(9), 341\u2013345.","journal-title":"Glot International"},{"issue":"2\u20133","key":"10028_CR8","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1080\/00437956.1958.11659660","volume":"14","author":"DL Bolinger","year":"1958","unstructured":"Bolinger, D. L. (1958). A theory of pitch accent in English. Word, 14(2\u20133), 109\u2013149.","journal-title":"Word"},{"key":"10028_CR9","doi-asserted-by":"crossref","unstructured":"Burkhardt, F., Paeschke, A., Rolfes, M., Sendlmeier, W.F., & Weiss, B. (2005). A database of German emotional speech. In Ninth European conference on speech communication and technology.","DOI":"10.21437\/Interspeech.2005-446"},{"issue":"4","key":"10028_CR10","doi-asserted-by":"crossref","first-page":"582","DOI":"10.1109\/TASL.2008.2009578","volume":"17","author":"C Busso","year":"2009","unstructured":"Busso, C., Lee, S., & Narayanan, S. (2009). Analysis of emotionally salient aspects of fundamental frequency for emotion detection. IEEE Transactions on Audio, Speech, and Language Processing, 17(4), 582\u2013596.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"key":"10028_CR11","doi-asserted-by":"crossref","unstructured":"Campbell, N. (2008). Individual traits of speaking style and speech rhythm in a spoken discourse. In Verbal and nonverbal features of human-human and human-machine interaction (pp. 107\u2013120). Springer.","DOI":"10.1007\/978-3-540-70872-8_8"},{"key":"10028_CR12","doi-asserted-by":"crossref","unstructured":"Casale, S., Russo, A., Scebba, G., & Serrano, S. (2008). Speech emotion classification using machine learning algorithms. In 2008 IEEE international conference on semantic computing (pp. 158\u2013165).","DOI":"10.1109\/ICSC.2008.43"},{"key":"10028_CR13","volume-title":"A grammar of spoken Chinese","author":"Y Chao","year":"1968","unstructured":"Chao, Y. (1968). A grammar of spoken Chinese. University of California Press."},{"issue":"3","key":"10028_CR14","doi-asserted-by":"crossref","first-page":"129","DOI":"10.1159\/000259312","volume":"22","author":"M Chen","year":"1970","unstructured":"Chen, M. (1970). Vowel length variation as a function of the voicing of the consonant environment. Phonetica, 22(3), 129\u2013159.","journal-title":"Phonetica"},{"issue":"4","key":"10028_CR15","doi-asserted-by":"crossref","first-page":"1681","DOI":"10.1121\/1.1356023","volume":"109","author":"Y Chen","year":"2001","unstructured":"Chen, Y., Robb, M. P., Gilbert, H. R., & Lerman, J. W. (2001). A study of sentence stress production in mandarin speakers of American English. The Journal of the Acoustical Society of America, 109(4), 1681\u20131690.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"1","key":"10028_CR16","doi-asserted-by":"crossref","first-page":"32","DOI":"10.1109\/79.911197","volume":"18","author":"R Cowie","year":"2001","unstructured":"Cowie, R., Douglas-Cowie, E., Tsapatsoulis, N., Votsis, G., Kollias, S., Fellenz, W., & Taylor, J. G. (2001). Emotion recognition in human-computer interaction. IEEE Signal Processing Magazine, 18(1), 32\u201380.","journal-title":"IEEE Signal Processing Magazine"},{"issue":"3","key":"10028_CR17","doi-asserted-by":"crossref","first-page":"217","DOI":"10.3758\/BF03207288","volume":"29","author":"A Cutler","year":"1981","unstructured":"Cutler, A., & Darwin, C. J. (1981). Phoneme-monitoring reaction time and preceding prosody: Effects of stop closure duration and of fundamental frequency. Perception & Psychophysics, 29(3), 217\u2013224.","journal-title":"Perception & Psychophysics"},{"key":"10028_CR18","doi-asserted-by":"crossref","first-page":"91","DOI":"10.1016\/j.procs.2015.08.032","volume":"58","author":"A Davletcharova","year":"2015","unstructured":"Davletcharova, A., Sugathan, S., Abraham, B., & James, A. P. (2015). Detection and analysis of emotion from speech signals. Procedia Computer Science, 58, 91\u201396.","journal-title":"Procedia Computer Science"},{"issue":"8","key":"10028_CR19","doi-asserted-by":"crossref","first-page":"59","DOI":"10.1007\/s00521-016-2712-y","volume":"29","author":"S Demircan","year":"2018","unstructured":"Demircan, S., & Kahramanli, H. (2018). Application of fuzzy c-means clustering algorithm to spectral features for emotion classification from speech. Neural Computing and Applications, 29(8), 59\u201366.","journal-title":"Neural Computing and Applications"},{"key":"10028_CR20","first-page":"2349","volume":"14","author":"J Dem\u0161ar","year":"2013","unstructured":"Dem\u0161ar, J., Curk, T., Erjavec, A., Gorup, \u010crt, Ho\u010devar, T., Milutinovi\u010d, M., & Zupan, B. (2013). Orange: Data mining toolbox in python. Journal of Machine Learning Research, 14, 2349\u20132353.","journal-title":"Journal of Machine Learning Research"},{"key":"10028_CR21","doi-asserted-by":"publisher","unstructured":"Deng, J. J., Leung, C. H. C., Mengoni, P., & Li, Y. (2018). Emotion recognition from human behaviors using attention model. In First IEEE international conference on artificial intelligence and knowledge engineering, AIKE 2018, Laguna Hills, CA, USA, September 26\u201328, 2018 (pp. 249\u2013253). IEEE Computer Society. https:\/\/doi.org\/10.1109\/AIKE.2018.00056","DOI":"10.1109\/AIKE.2018.00056"},{"issue":"1\u20132","key":"10028_CR22","doi-asserted-by":"crossref","first-page":"33","DOI":"10.1016\/S0167-6393(02)00070-5","volume":"40","author":"E Douglas-Cowie","year":"2003","unstructured":"Douglas-Cowie, E., Campbell, N., Cowie, R., & Roach, P. (2003). Emotional speech: Towards a new generation of databases. Speech Communication, 40(1\u20132), 33\u201360.","journal-title":"Speech Communication"},{"key":"10028_CR23","doi-asserted-by":"crossref","DOI":"10.1093\/oso\/9780199215782.001.0001","volume-title":"The phonology of standard Chinese","author":"S Duanmu","year":"2007","unstructured":"Duanmu, S. (2007). The phonology of standard Chinese. OUP Oxford."},{"key":"10028_CR24","unstructured":"Eibe, F., Hall, M. A., Witten, I. H. (2016). The weka workbench. Online appendix for data mining: Practical machine learning tools and techniques. Morgan Kaufmann."},{"issue":"45\u201360","key":"10028_CR25","first-page":"16","volume":"98","author":"P Ekman","year":"1999","unstructured":"Ekman, P. (1999). Basic emotions. Handbook of Cognition and Emotion, 98(45\u201360), 16.","journal-title":"Handbook of Cognition and Emotion"},{"key":"10028_CR26","unstructured":"Ekman, P., & Cole, J. (1972). Universals and cultural differences in facial expressions of emotions. In Nebraska symposium on motivation (Vol. 19, pp. 207\u2013283)."},{"key":"10028_CR27","first-page":"3","volume":"1","author":"C Fan","year":"1982","unstructured":"Fan, C. (1982). Sounds of English and Chinese. Primary and Middle School English Teaching and Research, 1, 3\u20134.","journal-title":"Primary and Middle School English Teaching and Research"},{"key":"10028_CR28","doi-asserted-by":"crossref","unstructured":"Franzoni, V., Li, Y., Mengoni, P., & Milani, A. (2017). Clustering Facebook for biased context extraction. In Computational science and its applications (ICCSA 2017), 17th international conference, Trieste, Italy, July 3\u20136, 2017, proceedings, part I (Vol. 10404, pp. 717\u2013729). Springer.","DOI":"10.1007\/978-3-319-62392-4_52"},{"issue":"4","key":"10028_CR29","doi-asserted-by":"crossref","first-page":"765","DOI":"10.1121\/1.1908022","volume":"27","author":"DB Fry","year":"1955","unstructured":"Fry, D. B. (1955). Duration and intensity as physical correlates of linguistic stress. The Journal of the Acoustical Society of America, 27(4), 765\u2013768.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"2","key":"10028_CR30","doi-asserted-by":"crossref","first-page":"126","DOI":"10.1177\/002383095800100207","volume":"1","author":"DB Fry","year":"1958","unstructured":"Fry, D. B. (1958). Experiments in the perception of stress. Language and Speech, 1(2), 126\u2013152.","journal-title":"Language and Speech"},{"issue":"1","key":"10028_CR31","doi-asserted-by":"crossref","first-page":"505","DOI":"10.1121\/1.423251","volume":"104","author":"Q-J Fu","year":"1998","unstructured":"Fu, Q.-J., Zeng, F.-G., Shannon, R. V., & Soli, S. D. (1998). Importance of tonal envelope cues in Chinese speech recognition. The Journal of the Acoustical Society of America, 104(1), 505\u2013510.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10028_CR32","doi-asserted-by":"crossref","unstructured":"Fukada, T., Tokuda, K., Kobayashi, T., & Imai, S. (1992). An adaptive algorithm for mel-cepstral analysis of speech. In 1992 IEEE international conference on acoustics, speech, and signal processing (ICA\ufeffSSP-92), (Vol. 1, pp. 137\u2013140).","DOI":"10.1109\/ICASSP.1992.225953"},{"key":"10028_CR33","doi-asserted-by":"crossref","unstructured":"Gandour, J. T. (1978). The perception of tone. Tone (pp. 41\u201376). Elsevier.","DOI":"10.1016\/B978-0-12-267350-4.50007-8"},{"key":"10028_CR34","doi-asserted-by":"crossref","unstructured":"Garcia-Garcia, J. M., Penichet, V. M., Lozano, M. D. (2017). Emotion detection: A technology review. In Proceedings of the xviii International conference on human computer interaction (pp. 1\u20138).","DOI":"10.1145\/3123818.3123852"},{"key":"10028_CR35","first-page":"44","volume":"1","author":"C Gui","year":"1978","unstructured":"Gui, C. (1978). A comparison of Chinese and English sound system. Modern Foreign Languages, 1, 44\u201350.","journal-title":"Modern Foreign Languages"},{"key":"10028_CR36","volume-title":"Contrastive analysis of English and Chinese","author":"S He","year":"2002","unstructured":"He, S. (2002). Contrastive analysis of English and Chinese. Shanghai Foreign Language Education Press."},{"key":"10028_CR37","doi-asserted-by":"publisher","unstructured":"Hodari, Z., Watts, O., & King, S. (2019, Sep). Using generative modelling to produce varied intonation for speech synthesis. In 10th ISCA speech synthesis workshop. https:\/\/doi.org\/10.21437\/ssw.2019-43","DOI":"10.21437\/ssw.2019-43"},{"issue":"9","key":"10028_CR38","doi-asserted-by":"crossref","first-page":"1174","DOI":"10.1121\/1.1908941","volume":"33","author":"AS House","year":"1961","unstructured":"House, A. S. (1961). On vowel duration in English. The Journal of the Acoustical Society of America, 33(9), 1174\u20131178.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"5","key":"10028_CR39","doi-asserted-by":"crossref","first-page":"3109","DOI":"10.1121\/1.2188647","volume":"119","author":"V Hozjan","year":"2006","unstructured":"Hozjan, V., & Ka\u010di\u010d, Z. (2006). A rule-based emotion-dependent feature extraction method for emotion analysis from speech. The Journal of the Acoustical Society of America, 119(5), 3109\u20133120.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"S1","key":"10028_CR40","doi-asserted-by":"crossref","first-page":"S21","DOI":"10.1121\/1.2004098","volume":"64","author":"D Isenberg","year":"1978","unstructured":"Isenberg, D., & Gay, T. (1978). Acoustic correlates of perceived stress in an isolated synthetic disyllable. The Journal of the Acoustical Society of America, 64(S1), S21\u2013S21.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"2","key":"10028_CR41","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1515\/iral.1990.28.2.99","volume":"28","author":"A Juffs","year":"1990","unstructured":"Juffs, A. (1990). Tone, syllable structure and interlanguage phonology: Chinese learners\u2019 stress errors. International Review of Applied Linguistics in Language Teaching, 28(2), 99\u2013118. https:\/\/doi.org\/10.1515\/iral.1990.28.2.99","journal-title":"International Review of Applied Linguistics in Language Teaching"},{"key":"10028_CR42","volume-title":"How to teach pronunciation","author":"G Kelly","year":"2000","unstructured":"Kelly, G. (2000). How to teach pronunciation. Longman."},{"key":"10028_CR43","doi-asserted-by":"crossref","unstructured":"Kostoulas, T., Ganchev, T., & Fakotakis, N. (2008). Study on speakerindependent emotion recognition from speech on real-world data. In Verbal and nonverbal features of human-human and human-machine interaction (pp. 235\u2013242). Springer.","DOI":"10.1007\/978-3-540-70872-8_18"},{"key":"10028_CR44","doi-asserted-by":"crossref","unstructured":"Larsen, R.J., & Prizmic-Larsen, Z. (2006). Measuring emotions: Implications of a multimethod perspective. In Handbook of multimethod measurement in psychology (pp. 337\u2013351). American Psychological Association.","DOI":"10.1037\/11383-023"},{"key":"10028_CR45","volume-title":"Suprasegmentals","author":"I Lehiste","year":"1970","unstructured":"Lehiste, I. (1970). Suprasegmentals. MIT Press."},{"key":"10028_CR46","doi-asserted-by":"crossref","unstructured":"Li, Y., & Zhao, Y. (1998). Recognizing emotions in speech using short-term and long-term features. In Fifth international conference on spoken language processing.","DOI":"10.21437\/ICSLP.1998-560"},{"issue":"4","key":"10028_CR47","doi-asserted-by":"crossref","first-page":"451","DOI":"10.1121\/1.1908095","volume":"32","author":"P Lieberman","year":"1960","unstructured":"Lieberman, P. (1960). Some acoustic correlates of word stress in American English. The Journal of the Acoustical Society of America, 32(4), 451\u2013454.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10028_CR48","doi-asserted-by":"publisher","unstructured":"Mao, S., Ching, P. C., & Lee, T. (2019). Deep learning of segment-level feature representation with multiple instance learning for utterance-level speech emotion recognition. In Interspeech 2019, 20th Annual conference of the international speech communication association, Graz, Austria, 15\u201319 September 2019 (pp. 1686\u20131690). ISCA. https:\/\/doi.org\/10.21437\/Interspeech.2019-1968","DOI":"10.21437\/Interspeech.2019-1968"},{"issue":"10","key":"10028_CR49","first-page":"3474","volume":"74","author":"K Mase","year":"1991","unstructured":"Mase, K. (1991). Recognition of facial expression from optical flow. IEICE Transactions on Information and Systems, 74(10), 3474\u20133483.","journal-title":"IEICE Transactions on Information and Systems"},{"issue":"2","key":"10028_CR50","doi-asserted-by":"crossref","first-page":"143","DOI":"10.1007\/BF00992959","volume":"13","author":"D Matsumoto","year":"1989","unstructured":"Matsumoto, D., & Ekman, P. (1989). American-Japanese cultural differences in intensity ratings of facial expressions of emotion. Motivation and Emotion, 13(2), 143\u2013157.","journal-title":"Motivation and Emotion"},{"issue":"2","key":"10028_CR51","doi-asserted-by":"crossref","first-page":"253","DOI":"10.3758\/BF03205547","volume":"62","author":"SL Mattys","year":"2000","unstructured":"Mattys, S. L. (2000). The perception of primary and secondary stress in English. Perception & Psychophysics, 62(2), 253\u2013265.","journal-title":"Perception & Psychophysics"},{"issue":"3","key":"10028_CR52","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1177\/002383096500800303","volume":"8","author":"J Morton","year":"1965","unstructured":"Morton, J., & Jassem, W. (1965). Acoustic correlates of stress. Language and Speech, 8(3), 159\u2013181. https:\/\/doi.org\/10.1177\/002383096500800303","journal-title":"Language and Speech"},{"issue":"4","key":"10028_CR53","doi-asserted-by":"crossref","first-page":"1117","DOI":"10.1109\/TASL.2006.876121","volume":"14","author":"E Navas","year":"2006","unstructured":"Navas, E., Hern\u00e1ez, I., & Luengo, I. (2006). An objective and subjective study of the role of semantics and prosodic features in building corpora for emotional tts. IEEE Transactions on Audio, Speech, and Language Processing, 14(4), 1117\u20131127.","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"issue":"2","key":"10028_CR54","doi-asserted-by":"crossref","first-page":"1072","DOI":"10.1121\/1.1940508","volume":"118","author":"S Nittrouer","year":"2005","unstructured":"Nittrouer, S. (2005). Age-related differences in weighting and masking of two cues to word-final stop voicing in noise. The Journal of the Acoustical Society of America, 118(2), 1072\u20131088.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10028_CR55","unstructured":"Okobi, A.O. (2006). Acoustic correlates of word stress in American English (Unpublished doctoral dissertation). Massachusetts Institute of Technology."},{"issue":"9","key":"10028_CR56","doi-asserted-by":"crossref","first-page":"1370","DOI":"10.1109\/JPROC.2003.817122","volume":"91","author":"M Pantic","year":"2003","unstructured":"Pantic, M., & Rothkrantz, L. J. (2003). Toward an affect-sensitive multimodal human-computer interaction. Proceedings of the IEEE, 91(9), 1370\u20131390.","journal-title":"Proceedings of the IEEE"},{"key":"10028_CR57","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa, F., Varoquaux, G., Gramfort, A., Michel, V., Thirion, B., Grisel, O., & Duchesnay, E. (2011). Scikit-learn: Machine learning in Python. Journal of Machine Learning Research, 12, 2825\u20132830.","journal-title":"Journal of Machine Learning Research"},{"key":"10028_CR58","doi-asserted-by":"crossref","unstructured":"Pervaiz, M., & Ahmed, T. (2016). Emotion recognition from speech using prosodic and linguistic features. International Journal of Advanced Computer Science & Applications, 7(8).","DOI":"10.14569\/IJACSA.2016.070813"},{"issue":"6","key":"10028_CR59","doi-asserted-by":"crossref","first-page":"693","DOI":"10.1121\/1.1908183","volume":"32","author":"GE Peterson","year":"1960","unstructured":"Peterson, G. E., & Lehiste, I. (1960). Duration of syllable nuclei in English. The Journal of the Acoustical Society of America, 32(6), 693\u2013703.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10028_CR60","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/1140.001.0001","volume-title":"Affective computing","author":"RW Picard","year":"1997","unstructured":"Picard, R. W. (1997). Affective computing. MIT Press."},{"key":"10028_CR61","doi-asserted-by":"crossref","first-page":"98","DOI":"10.1016\/j.inffus.2017.02.003","volume":"37","author":"S Poria","year":"2017","unstructured":"Poria, S., Cambria, E., Bajpai, R., & Hussain, A. (2017). A review of affective computing: From unimodal analysis to multimodal fusion. Information Fusion, 37, 98\u2013125.","journal-title":"Information Fusion"},{"key":"10028_CR62","doi-asserted-by":"crossref","first-page":"143","DOI":"10.1007\/s10772-012-9172-2","volume":"16","author":"KS Rao","year":"2013","unstructured":"Rao, K. S., Koolagudi, S. G., & Vempada, R. R. (2013). Emotion recognition from speech using global and local prosodic features. International Journal of Speech Technology, 16, 143\u2013160.","journal-title":"International Journal of Speech Technology"},{"key":"10028_CR63","doi-asserted-by":"crossref","unstructured":"Raphael, L. J. (1972). Preceding vowel duration as a cue to the perception of the voicing characteristic of word-final consonants in American English. The Journal of the Acoustical Society of America, 51(4B), 1296\u20131303.","DOI":"10.1121\/1.1912974"},{"issue":"3","key":"10028_CR64","doi-asserted-by":"crossref","first-page":"217","DOI":"10.1016\/0167-6393(87)90027-6","volume":"6","author":"AC Rietveld","year":"1987","unstructured":"Rietveld, A. C., & Koopmans-van Beinum, F. J. (1987). Vowel reduction and stress. Speech Communication, 6(3), 217\u2013229.","journal-title":"Speech Communication"},{"key":"10028_CR65","doi-asserted-by":"crossref","unstructured":"Salvi, G., Tesser, F., Zovato, E., & Cosi, P. (2010). Cluster analysis of differential spectral envelopes on emotional speech. In Eleventh annual conference of the international speech communication association.","DOI":"10.21437\/Interspeech.2010-121"},{"key":"10028_CR66","unstructured":"Schirru, C. (1992). Premiers \u00e9l\u00e9ments d\u2019analyse prosodique contrastive entre le sarde, l\u2019italien et le francais: R\u00e9sultats statistiques. Travaux de l\u2019Institut de Phon\u00e9tique d\u2019Aix, 14, 77\u2013108."},{"key":"10028_CR67","unstructured":"Schirru, C. (1995). Fenomeni sovrasegmentali: confronto fra comportamento femminile e maschile. In G. Marcato (a cura di): Donna e linguaggio, atti del convegno internazionale di studi su \u201cdialettologia al femminile\u201d (pp. 437\u2013446)."},{"key":"10028_CR68","unstructured":"Schirru, C. (1998). German, Italian and French in a Swiss variety: A first global approach. In Proceedings of the third international symposium on the acquisition of second-language speech (pp. 276\u2013285)."},{"key":"10028_CR69","first-page":"283","volume":"17","author":"C Schirru","year":"2000","unstructured":"Schirru, C. (2000). Sulla durata sillabica nell\u2019italiano della Sardegna. Revista de Filolog\u00eda Rom\u00e1nica, 17, 283\u2013291.","journal-title":"Revista de Filolog\u00eda Rom\u00e1nica"},{"key":"10028_CR70","first-page":"9","volume-title":"Per un\u2019analisi interlinguistica d\u2019epoca: Grazia Deledda e contemporanei","author":"C Schirru","year":"2009","unstructured":"Schirru, C. (2009). Per un\u2019analisi interlinguistica d\u2019epoca: Grazia Deledda e contemporanei (pp. 9\u201332). Anno XI: Rivista Italiana di Linguistica e di Dialettologia."},{"key":"10028_CR71","unstructured":"Schirru, C. (2013). Un autore \u201cin parola\u201d: preliminari fisico-acustici sulla voce di Marinetti: I linguaggi del futurismo. Atti del convegno internazionale di studi (Macerata, 15-17 dicembre 2010). Edizioni Universit\u00e0 di Macerata."},{"issue":"2","key":"10028_CR72","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1111\/j.1467-8535.2005.00459.x","volume":"36","author":"G Sefero\u01e7lu","year":"2005","unstructured":"Sefero\u01e7lu, G. (2005). Improving students\u2019 pronunciation through accent reduction software. British Journal of Educational Technology, 36(2), 303\u2013316. https:\/\/doi.org\/10.1111\/j.1467-8535.2005.00459.x","journal-title":"British Journal of Educational Technology"},{"issue":"4","key":"10028_CR73","doi-asserted-by":"crossref","first-page":"415","DOI":"10.1177\/002383099303600404","volume":"36","author":"XS Shen","year":"1993","unstructured":"Shen, X. S. (1993). Relative duration as a perceptual cue to stress in mandarin. Language and Speech, 36(4), 415\u2013433.","journal-title":"Language and Speech"},{"key":"10028_CR74","unstructured":"Shih, C. E. A. (1988). Tone and intonation in Mandarin. Working Papers, Cornell Phonetics Laboratory, 3 , 83\u2013109."},{"issue":"4","key":"10028_CR75","doi-asserted-by":"crossref","first-page":"2471","DOI":"10.1121\/1.417955","volume":"100","author":"AM Sluijter","year":"1996","unstructured":"Sluijter, A. M., & Van Heuven, V. J. (1996). Spectral balance as an acoustic correlate of linguistic stress. The Journal of the Acoustical Society of America, 100(4), 2471\u20132485.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10028_CR76","unstructured":"Tseng, C.-Y. (1981). An acoustic phonetic study on tones in Mandarin Chinese. Brown University."},{"key":"10028_CR77","unstructured":"Van der Hulst, H. (1999). Word accent. In Word prosodic systems in the languages of Europe, (pp. 3\u2013115). De Gruyter Mouton."},{"issue":"4","key":"10028_CR78","doi-asserted-by":"crossref","first-page":"2439","DOI":"10.1121\/1.417952","volume":"100","author":"VJ Van Heuven","year":"1996","unstructured":"Van Heuven, V. J., & Menert, L. (1996). Why stress position bias? The Journal of the Acoustical Society of America, 100(4), 2439\u20132451.","journal-title":"The Journal of the Acoustical Society of America"},{"issue":"9","key":"10028_CR79","doi-asserted-by":"crossref","first-page":"1162","DOI":"10.1016\/j.specom.2006.04.003","volume":"48","author":"D Ververidis","year":"2006","unstructured":"Ververidis, D., & Kotropoulos, C. (2006). Emotional speech recognition: Resources, features, and methods. Speech Communication, 48(9), 1162\u20131181.","journal-title":"Speech Communication"},{"key":"10028_CR80","doi-asserted-by":"crossref","unstructured":"Vicsi, K., & Sztah\u00f3, D. (2011). Problems of the automatic emotion recognitions in spontaneous speech; an example for the recognition in a dispatcher center. In Toward autonomous, adaptive, and context-aware multimodal interfaces. Theoretical and practical issues (pp. 331\u2013339). Springer.","DOI":"10.1007\/978-3-642-18184-9_28"},{"key":"10028_CR81","volume-title":"An introduction to comparative studies of Chinese and English","author":"Z Wei","year":"2003","unstructured":"Wei, Z. (2003). An introduction to comparative studies of Chinese and English. Shanghai Foreign Language Education Press."},{"key":"10028_CR82","doi-asserted-by":"crossref","unstructured":"Whalen, D. H., & Xu, Y. (1992). Information for Mandarin tones in the amplitude contour and in brief segments. Phonetica, 49(1), 25\u201347.","DOI":"10.1159\/000261901"},{"issue":"1","key":"10028_CR83","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1111\/j.1467-1770.1972.tb00071.x","volume":"22","author":"RL Whitman","year":"1972","unstructured":"Whitman, R. L., & Jackson, K. L. (1972). The unpredictability of constrastive analysis. Language Learning, 22(1), 29\u201341. https:\/\/doi.org\/10.1111\/j.1467-1770.1972.tb00071.x","journal-title":"Language Learning"},{"issue":"4B","key":"10028_CR84","doi-asserted-by":"crossref","first-page":"1238","DOI":"10.1121\/1.1913238","volume":"52","author":"CE Williams","year":"1972","unstructured":"Williams, C. E., & Stevens, K. N. (1972). Emotions and speech: Some acoustical correlates. The Journal of the Acoustical Society of America, 52(4B), 1238\u20131250.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"10028_CR85","doi-asserted-by":"crossref","unstructured":"Wu, C. -H., Lin, J. -C., & Wei, W. -L. (2014). Survey on audiovisual emotion recognition: Databases, features, and data fusion strategies. APSIPA Transactions on Signal and Information Processing, 3.","DOI":"10.1017\/ATSIP.2014.11"},{"key":"10028_CR86","doi-asserted-by":"crossref","unstructured":"Yuan, J., Shen, L., & Chen, F. (2002). The acoustic realization of anger, fear, joy and sadness in Chinese. In Seventh international conference on spoken language processing.","DOI":"10.21437\/ICSLP.2002-556"},{"key":"10028_CR87","doi-asserted-by":"crossref","unstructured":"Zhang, Y., & Francis, A. (2010). The weighting of vowel quality in native and non-native listeners\u2019 perception of English lexical stress. Journal of Phonetics, 38(2), 260\u2013271.","DOI":"10.1016\/j.wocn.2009.11.002"},{"key":"10028_CR88","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Nissen, S. L., & Francis, A. L. (2008). Acoustic characteristics of English lexical stress produced by native Mandarin speakers. The Journal of the Acoustical Society of America, 123(6), 4498\u20134513.","DOI":"10.1121\/1.2902165"},{"key":"10028_CR89","volume-title":"Phonology","author":"Z Zhao","year":"2006","unstructured":"Zhao, Z. (2006). Phonology. Shanghai Foreign Language Education Press."},{"key":"10028_CR90","doi-asserted-by":"publisher","unstructured":"Zhou, J., & Mengoni, P. (2020). Spot gold price prediction using financial news sentiment analysis. In IEEE\/WIC\/ACM International Joint Conference on Web intelligence and intelligent agent technology, WI\/IAT 2020, Melbourne, Australia, December 14\u201317, 2020 (pp. 758\u2013763). IEEE. https:\/\/doi.org\/10.1109\/WIIAT50758.2020.00117","DOI":"10.1109\/WIIAT50758.2020.00117"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-023-10028-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10772-023-10028-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-023-10028-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,16]],"date-time":"2024-10-16T16:50:44Z","timestamp":1729097444000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10772-023-10028-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,3,18]]},"references-count":89,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2023,7]]}},"alternative-id":["10028"],"URL":"https:\/\/doi.org\/10.1007\/s10772-023-10028-x","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"type":"print","value":"1381-2416"},{"type":"electronic","value":"1572-8110"}],"subject":[],"published":{"date-parts":[[2023,3,18]]},"assertion":[{"value":"6 May 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 February 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 March 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"All authors of the manuscript have read and agreed the final manuscript.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}}]}}