{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,14]],"date-time":"2025-03-14T04:28:43Z","timestamp":1741926523702,"version":"3.38.0"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2011,11,11]],"date-time":"2011-11-11T00:00:00Z","timestamp":1320969600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2012,6]]},"DOI":"10.1007\/s10772-011-9124-2","type":"journal-article","created":{"date-parts":[[2011,11,10]],"date-time":"2011-11-10T11:56:35Z","timestamp":1320926195000},"page":"87-98","source":"Crossref","is-referenced-by-count":3,"title":["Automatic stress exaggeration by prosody modification to assist language learners perceive sentence stress"],"prefix":"10.1007","volume":"15","author":[{"given":"Jingli","family":"Lu","sequence":"first","affiliation":[]},{"given":"Ruili","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Liyanage C.","family":"De Silva","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2011,11,11]]},"reference":[{"key":"9124_CR1","doi-asserted-by":"crossref","first-page":"606","DOI":"10.1109\/ICSLP.1996.607434","volume-title":"Proceedings of international conference on spoken language processing","author":"R. Akahane-Yamada","year":"1996","unstructured":"Akahane-Yamada, R., Tohkura, Y., Bradlow, A. R., & Pisoni, D. B. (1996). Does training in speech perception modify speech production. In Proceedings of international conference on spoken language processing (Vols.\u00a01\u20134, pp. 606\u2013609)."},{"issue":"1","key":"9124_CR2","doi-asserted-by":"crossref","first-page":"216","DOI":"10.1109\/TASL.2007.907570","volume":"16","author":"S. Ananthakrishnan","year":"2008","unstructured":"Ananthakrishnan, S., & Narayanan, S. (2008). Automatic prosodic event detection using acoustic, lexical, and syntactic evidence. IEEE Trans. Audio, Speech and Language Processing, 16(1), 216\u2013228.","journal-title":"IEEE Trans. Audio, Speech and Language Processing"},{"key":"9124_CR3","first-page":"464","volume-title":"Proceedings of international conference on spoken language processing","author":"J. Beskow","year":"2000","unstructured":"Beskow, J., & Sj\u00f6lander, K. (2000). WaveSurfer\u2014a public domain speech tool. In Proceedings of international conference on spoken language processing, China, Beijing (Vol.\u00a04, pp. 464\u2013467)."},{"issue":"10","key":"9124_CR4","doi-asserted-by":"crossref","first-page":"933","DOI":"10.1016\/j.specom.2009.03.001","volume":"51","author":"M. P. Bissiri","year":"2009","unstructured":"Bissiri, M. P., & Pfitzinger, H. R. (2009). Italian speakers learn lexical stress of German morphologically complex words. Speech Communication, 51(10), 933\u2013947.","journal-title":"Speech Communication"},{"key":"9124_CR5","first-page":"104","volume-title":"Proceedings of workshop on speech and language technology in education","author":"A. Black","year":"2007","unstructured":"Black, A. (2007). Speech synthesis for educational technology. In Proceedings of workshop on speech and language technology in education (pp. 104\u2013107)."},{"key":"9124_CR6","doi-asserted-by":"crossref","DOI":"10.1163\/9789004653412","volume-title":"Slips of the ear: errors in the perception of casual conversation","author":"Z. Bond","year":"1999","unstructured":"Bond, Z. (1999). Slips of the ear: errors in the perception of casual conversation. San Diego: Academic Press."},{"key":"9124_CR7","doi-asserted-by":"crossref","first-page":"470","DOI":"10.3758\/BF03203063","volume":"34","author":"Z. Bond","year":"1983","unstructured":"Bond, Z., & Small, L. H. (1983). Voicing, vowel and stress mispronunciations in continuous speech. Perception and Psychophysics, 34, 470\u2013474.","journal-title":"Perception and Psychophysics"},{"issue":"4","key":"9124_CR8","doi-asserted-by":"crossref","first-page":"2299","DOI":"10.1121\/1.418276","volume":"101","author":"A. Bradlow","year":"1997","unstructured":"Bradlow, A., Pisoni, D., Akahana-Yamada, R., & Tohkura, Y. (1997). Training Japanese listeners to identify English \/r\/ and \/l\/: Some effects of perceptual learning on speech production. Journal of the Acoustical Society of America, 101(4), 2299\u20132310.","journal-title":"Journal of the Acoustical Society of America"},{"key":"9124_CR9","volume-title":"Pronunciation","author":"C. Dalton","year":"1994","unstructured":"Dalton, C., & Seidlhofer, B. (1994). Pronunciation. Oxford: Oxford University Press."},{"key":"9124_CR10","doi-asserted-by":"crossref","first-page":"51","DOI":"10.1016\/S0095-4470(19)30776-4","volume":"11","author":"R. M. Dauer","year":"1983","unstructured":"Dauer, R. M. (1983). Stress-timing and syllable-timing reanalyzed. Journal of Phonetics, 11, 51\u201362.","journal-title":"Journal of Phonetics"},{"key":"9124_CR11","doi-asserted-by":"crossref","first-page":"145","DOI":"10.1016\/S0167-6393(99)00043-6","volume":"30","author":"R. Delmonte","year":"2000","unstructured":"Delmonte, R. (2000). SLIM prosodic automatic tools for self-learning instruction. Speech Communication, 30, 145\u2013166.","journal-title":"Speech Communication"},{"issue":"4","key":"9124_CR12","doi-asserted-by":"crossref","first-page":"161","DOI":"10.1007\/s10772-010-9065-1","volume":"12","author":"R. Delmonte","year":"2009","unstructured":"Delmonte, R. (2009). Prosodic tools for language learning. International Journal of Speech Technology, 12(4), 161\u2013184.","journal-title":"International Journal of Speech Technology"},{"key":"9124_CR13","doi-asserted-by":"crossref","first-page":"406","DOI":"10.1006\/jmla.1996.2500","volume":"36","author":"E. Dupoux","year":"1997","unstructured":"Dupoux, E., Pallier, C., Sebasti\u00e1n-Gall\u00e9s, N., & Mehler, J. (1997). A\u00a0destressing \u2018deafness\u2019 in French?. Journal of Memory and Language, 36, 406\u2013421.","journal-title":"Journal of Memory and Language"},{"key":"9124_CR14","doi-asserted-by":"crossref","first-page":"1234","DOI":"10.1016\/j.specom.2009.06.007","volume":"51","author":"K. P. Engelbrecht","year":"2009","unstructured":"Engelbrecht, K. P., Quade, M., & M\u00f6ller, S. (2009). Analysis of a new simulation approach to dialog system evaluation. Speech Communication, 51, 1234\u20131252.","journal-title":"Speech Communication"},{"issue":"10","key":"9124_CR15","doi-asserted-by":"crossref","first-page":"832","DOI":"10.1016\/j.specom.2009.04.005","volume":"51","author":"M. Eskenazi","year":"2009","unstructured":"Eskenazi, M. (2009). An overview of spoken language technology for education. Speech Communication, 51(10), 832\u2013844.","journal-title":"Speech Communication"},{"key":"9124_CR16","first-page":"77","volume-title":"Proceedings of speech technology in language learning","author":"M. Eskenazi","year":"1998","unstructured":"Eskenazi, M., & Hansma, S. (1998). The Fluency pronunciation trainer. In Proceedings of speech technology in language learning (pp. 77\u201380)."},{"key":"9124_CR17","volume-title":"Acoustic theory of speech production. Moutons\u2019Gravenhage","author":"G. Fant","year":"1960","unstructured":"Fant, G. (1960). Acoustic theory of speech production. Moutons\u2019Gravenhage."},{"issue":"10","key":"9124_CR18","doi-asserted-by":"crossref","first-page":"920","DOI":"10.1016\/j.specom.2008.11.004","volume":"51","author":"D. Felps","year":"2009","unstructured":"Felps, D., Bortfeld, H., & Gutierrez-Osuna, R. (2009). Foreign accent conversion in computer assisted pronunciation training. Speech Communication, 51(10), 920\u2013932.","journal-title":"Speech Communication"},{"key":"9124_CR19","doi-asserted-by":"crossref","first-page":"399","DOI":"10.2307\/3588487","volume":"39","author":"J. Field","year":"2005","unstructured":"Field, J. (2005). Intelligibility and the listener: the role of lexical stress. TESOL. Quarterly, 39, 399\u2013423.","journal-title":"TESOL. Quarterly"},{"key":"9124_CR20","doi-asserted-by":"crossref","first-page":"765","DOI":"10.1121\/1.1908022","volume":"27","author":"D. B. Fry","year":"1955","unstructured":"Fry, D. B. (1955). Duration and intensity as physical correlates of linguistic stress. Journal of the Acoustical Society of America, 27, 765\u2013768.","journal-title":"Journal of the Acoustical Society of America"},{"issue":"2","key":"9124_CR21","doi-asserted-by":"crossref","first-page":"201","DOI":"10.2307\/3588378","volume":"38","author":"L. D. Hahn","year":"2004","unstructured":"Hahn, L. D. (2004). Primary stress and intelligibility: Research to motivate the teaching of suprasegmentals. TESOL Quarterly, 38(2), 201\u2013223.","journal-title":"TESOL Quarterly"},{"key":"9124_CR22","first-page":"153","volume":"44","author":"R. Hincks","year":"2002","unstructured":"Hincks, R. (2002). Speech synthesis for teaching lexical stress. TMH-QPSR, 44, 153\u2013156.","journal-title":"TMH-QPSR"},{"key":"9124_CR23","first-page":"77","volume-title":"Proceedings of international symposium on tonal aspects of languages","author":"K. Hirose","year":"2004","unstructured":"Hirose, K. (2004). Accent type recognition of Japanese using perceived mora pitch values and its use for pronunciation training system. In Proceedings of international symposium on tonal aspects of languages, Beijing (pp. 77\u201380)."},{"issue":"2","key":"9124_CR24","doi-asserted-by":"crossref","first-page":"97","DOI":"10.1007\/s10772-009-9039-3","volume":"11","author":"M. Kang","year":"2008","unstructured":"Kang, M., Kashiwagi, H., Treviranus, J., & Kaburagi, M. (2008). Synthetic speech in foreign language learning: an evaluation by learners. International Journal of Speech Technology, 11(2), 97\u2013106.","journal-title":"International Journal of Speech Technology"},{"key":"9124_CR25","doi-asserted-by":"crossref","first-page":"606","DOI":"10.21437\/Interspeech.2010-234","volume-title":"InterSpeech","author":"J. Lu","year":"2010","unstructured":"Lu, J., Wang, R., De Silva, L. C., Gao, Y., & Liu, J. (2010). CASTLE: a Computer-assisted stress teaching and learning environment for learners of English as a second language. In InterSpeech, Makuhari, Japan (pp. 606\u2013609)."},{"key":"9124_CR26","unstructured":"MIT courseware (2006). Transcribing Prosodic Structure of Spoken Utterances with ToBI http:\/\/ocw.mit.edu\/OcwWeb . Accessed on 15\/08\/2009."},{"issue":"5\u20136","key":"9124_CR27","doi-asserted-by":"crossref","first-page":"453","DOI":"10.1016\/0167-6393(90)90021-Z","volume":"9","author":"E. Moulines","year":"1990","unstructured":"Moulines, E., & Charpentier, F. (1990). Pitch-synchronous waveform processing techniques for text-to-speech synthesis using diphones. Speech Communication, 9(5\u20136), 453\u2013467.","journal-title":"Speech Communication"},{"issue":"4","key":"9124_CR28","first-page":"362","volume":"1","author":"T. Nagamine","year":"2002","unstructured":"Nagamine, T. (2002). An experimental study on the teachability and learnability of English intonational aspect: Acoustic analysis on F0 and native-speaker judgment task. Journal of Language and Linguistics, 1(4), 362\u2013399.","journal-title":"Journal of Language and Linguistics"},{"key":"9124_CR29","first-page":"771","volume-title":"Proceedings of the 15th international congress of phonetic sciences","author":"F. Nolan","year":"2003","unstructured":"Nolan, F. (2003). Intonational equivalence: an experimental evaluation of pitch scales. In Proceedings of the 15th international congress of phonetic sciences, Barcelona (pp. 771\u2013774)."},{"key":"9124_CR30","unstructured":"Ostendorf, M., Price, P. J., & Shattuck-Hufnagel, S. (1995). The Boston University radio news corpus. Boston Univ., Boston, MA, Tech. Rep. ECS-95-001, Mar."},{"key":"9124_CR31","doi-asserted-by":"crossref","first-page":"203","DOI":"10.1515\/9783110197105.1.203","volume-title":"Laboratory Phonology 7","author":"S. Peperkamp","year":"2002","unstructured":"Peperkamp, S., & Dupoux, E. (2002). A typological study of stress \u2018deafness\u2019. In C. Gussenhoven & N. Warner (Eds.), Laboratory Phonology 7 (pp. 203\u2013240). Berlin: Mouton de Gruyter."},{"key":"9124_CR32","doi-asserted-by":"crossref","first-page":"700","DOI":"10.1109\/ASRU.2003.1318525","volume-title":"Proceedings of IEEE workshop on automatic speech recognition and understanding","author":"A. Raux","year":"2003","unstructured":"Raux, A., & Black, A. W. (2003). A unit selection approach to F0 modeling and its application to emphasis. In Proceedings of IEEE workshop on automatic speech recognition and understanding (pp. 700\u2013705)."},{"key":"9124_CR33","first-page":"867","volume-title":"Proceedings of international conference on spoken language processing","author":"K. Silverman","year":"1992","unstructured":"Silverman, K., Beckman, M., Pitrelli, J., Ostendorf, M., Wightman, C., Price, P., Pierrehumbert, J., & Hirschberg, J. (1992). Tobi: a standard for labeling english prosody. In Proceedings of international conference on spoken language processing (pp.\u00a0867\u2013870)."},{"key":"9124_CR34","doi-asserted-by":"crossref","first-page":"503","DOI":"10.1121\/1.417994","volume":"101","author":"A. M. C. Sluijter","year":"1997","unstructured":"Sluijter, A. M. C., van Heuven, V. J., & Pacilly, J. J. A. (1997). Spectral Balance as a cue in the perception of linguistic stress. J. Acoust. Soc. Amer., 101, 503\u2013513.","journal-title":"J. Acoust. Soc. Amer."},{"key":"9124_CR35","doi-asserted-by":"crossref","first-page":"145","DOI":"10.14198\/raei.1991.4.13","volume":"4","author":"M. J. Sol\u00e9 Sabater","year":"1991","unstructured":"Sol\u00e9 Sabater, M. J. (1991). Stress and Rhythm in English. Revista Alicantina de Estudios Ingleses, 4, 145\u2013162.","journal-title":"Revista Alicantina de Estudios Ingleses"},{"key":"9124_CR36","first-page":"49","volume-title":"Proceedings of ISCA workshop on speech technology in language learning (STILL 98)","author":"A. Sundstr\u00f6m","year":"1998","unstructured":"Sundstr\u00f6m, A. (1998). Automatic prosody modification as a means for foreign language pronunciation training. In Proceedings of ISCA workshop on speech technology in language learning (STILL 98), Marholmen, Sweden (pp. 49\u201352)."},{"issue":"1","key":"9124_CR37","doi-asserted-by":"crossref","first-page":"33","DOI":"10.1007\/s10772-005-4760-z","volume":"8","author":"F. Tamburini","year":"2005","unstructured":"Tamburini, F., & Caini, C. (2005). An automatic system for detecting prosodic prominence in American English continuous speech. International Journal of speech technology, 8(1), 33\u201344.","journal-title":"International Journal of speech technology"},{"issue":"8","key":"9124_CR38","doi-asserted-by":"crossref","first-page":"2222","DOI":"10.1109\/TASL.2007.907344","volume":"15","author":"T. Toda","year":"2007","unstructured":"Toda, T., Black, A. W., & Tokuda, K. (2007). Voice conversion based on maximum likelihood estimation of spectral parameter trajectory. IEEE Transactions on Audio, Speech and Language Processing, 15(8), 2222\u20132235.","journal-title":"IEEE Transactions on Audio, Speech and Language Processing"},{"issue":"2","key":"9124_CR39","first-page":"261","volume":"17","author":"Y. Todaka","year":"1995","unstructured":"Todaka, Y. (1995). A preliminary study of voice quality differences between Japanese and American English: Some pedagogical suggestions. JALT Journal, 17(2), 261\u2013268.","journal-title":"JALT Journal"},{"issue":"2","key":"9124_CR40","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/1149290.1149291","volume":"3","author":"C. Wang","year":"2006","unstructured":"Wang, C., & Seneff, S. (2006). High-quality speech-to-speech translation for computer-aided language learning. ACM Transactions on Speech and Language Processing, 3(2), 1\u201321.","journal-title":"ACM Transactions on Speech and Language Processing"},{"key":"9124_CR41","doi-asserted-by":"crossref","first-page":"175","DOI":"10.1016\/j.specom.2010.08.015","volume":"53","author":"R. Wang","year":"2011","unstructured":"Wang, R., & Lu, J. (2011). Investigation of the golden speaker for a language learner from the imitation preference perspective by voice modification. Speech Communication, 53, 175\u2013184.","journal-title":"Speech Communication"},{"key":"9124_CR42","unstructured":"WWW (2011). Voices materials on http:\/\/www.box.net\/shared\/srmu4tjj9f ."},{"issue":"7","key":"9124_CR43","first-page":"145","volume":"26","author":"H. Xie","year":"2004","unstructured":"Xie, H., Andreae, P., Zhang, M., & Warren, P. (2004). Detecting stress in spoken English using decision trees and support vector machines. Australian Computer Science Communications (Data Mining, CRPIT 32), 26(7), 145\u2013150.","journal-title":"Australian Computer Science Communications (Data Mining, CRPIT 32)"},{"key":"9124_CR44","volume-title":"Proceedings of conference of the association of modern British & American language & literature","author":"K. Yoon","year":"2008","unstructured":"Yoon, K. (2008). Synthesis and evaluation of prosodically exaggerated utterances: a\u00a0preliminary study. In Proceedings of conference of the association of modern British & American language & literature."},{"key":"9124_CR45","doi-asserted-by":"crossref","first-page":"69","DOI":"10.1016\/j.system.2007.11.004","volume":"36","author":"B. W. Zielinski","year":"2008","unstructured":"Zielinski, B. W. (2008). The listener: No longer the silent partner in reduced intelligibility. System, 36, 69\u201384.","journal-title":"System"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-011-9124-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10772-011-9124-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-011-9124-2","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,13]],"date-time":"2025-03-13T23:42:47Z","timestamp":1741909367000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10772-011-9124-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,11,11]]},"references-count":45,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2012,6]]}},"alternative-id":["9124"],"URL":"https:\/\/doi.org\/10.1007\/s10772-011-9124-2","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"type":"print","value":"1381-2416"},{"type":"electronic","value":"1572-8110"}],"subject":[],"published":{"date-parts":[[2011,11,11]]}}}