{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,7,7]],"date-time":"2024-07-07T19:51:28Z","timestamp":1720381888715},"reference-count":39,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2013,12,28]],"date-time":"2013-12-28T00:00:00Z","timestamp":1388188800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["J Multimodal User Interfaces"],"published-print":{"date-parts":[[2014,3]]},"DOI":"10.1007\/s12193-013-0144-x","type":"journal-article","created":{"date-parts":[[2013,12,27]],"date-time":"2013-12-27T14:16:20Z","timestamp":1388153780000},"page":"75-86","source":"Crossref","is-referenced-by-count":16,"title":["Analysis of significant dialog events in realistic human\u2013computer interaction"],"prefix":"10.1007","volume":"8","author":[{"given":"Dmytro","family":"Prylipko","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dietmar","family":"R\u00f6sner","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ingo","family":"Siegert","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Stephan","family":"G\u00fcnther","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rafael","family":"Friesen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Matthias","family":"Haase","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bogdan","family":"Vlasenko","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andreas","family":"Wendemuth","sequence":"additional","affiliation":[],"role":[{"role":"author","
vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2013,12,28]]},"reference":[{"key":"144_CR1","doi-asserted-by":"crossref","unstructured":"Batliner A, Fischer K, Huber R, Spilker J, N\u00f6th E (2003) How to find trouble in communication. Speech Commun 40(1\u20132):117\u2013143","DOI":"10.1016\/S0167-6393(02)00079-1"},{"issue":"1","key":"144_CR2","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1016\/j.csl.2009.12.003","volume":"25","author":"A Batliner","year":"2011","unstructured":"Batliner A, Steidl S, Schuller B, Seppi D, Vogt T, Wagner J, Devillers L, Vidrascu L, Aharonson V, Kessous L (2011) Whodunnit\u2014searching for the most important feature types signalling emotion-related user states in speech. Comput Speech Lang 25(1):4\u201328","journal-title":"Comput Speech Lang"},{"issue":"9\/10","key":"144_CR3","first-page":"341","volume":"5","author":"P Boersma","year":"2001","unstructured":"Boersma P (2001) Praat, a system for doing phonetics by computer. Glot Int 5(9\/10):341\u2013345","journal-title":"Glot Int"},{"key":"144_CR4","doi-asserted-by":"crossref","first-page":"416","DOI":"10.1016\/j.specom.2008.01.001","volume":"50","author":"Z Callejas","year":"2008","unstructured":"Callejas Z, L\u00f3pez-C\u00f3zar R (2008) Influence of contextual information in emotion annotation for spoken dialogue systems. Speech Commun 50:416\u2013433","journal-title":"Speech Commun"},{"key":"144_CR5","first-page":"117","volume-title":"Cost 2012 workshop (Vietri), LNAI","author":"N Campbell","year":"2007","unstructured":"Campbell N (2007) On the use of nonverbal speech sounds in human communication. Cost 2012 workshop (Vietri), LNAI. Springer, Berlin, Heidelberg, pp 117\u2013128"},{"key":"144_CR6","doi-asserted-by":"crossref","unstructured":"Caridakis G, Karpouzis K, Wallace M, Kessous L, Amir N (2010) Multimodal user\u2019s affective state analysis in naturalistic interaction. 
J Multimodal User Interfaces 3(1):49\u201366","DOI":"10.1007\/s12193-009-0030-8"},{"issue":"2","key":"144_CR7","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1142\/S021969130400041X","volume":"2","author":"JF Cohn","year":"2004","unstructured":"Cohn JF, Schmidt K (2004) The timing of facial motion in posed and spontaneous smiles. Int J Wavelets Multiresolut Inf Process 2(2):121\u2013132","journal-title":"Int J Wavelets Multiresolut Inf Process"},{"issue":"1","key":"144_CR8","doi-asserted-by":"crossref","first-page":"32","DOI":"10.1109\/79.911197","volume":"18","author":"R Cowie","year":"2001","unstructured":"Cowie R, Douglas-Cowie E, Tsapatsoulis N, Votsis G, Kollias S, Fellenz W, Taylor J (2001) Emotion recognition in human\u2013computer interaction. IEEE Signal Process Mag 18(1):32\u201380","journal-title":"IEEE Signal Process Mag"},{"key":"144_CR9","doi-asserted-by":"crossref","unstructured":"Douglas-Cowie E, Devillers L, Martin JC, Cowie R, Savvidou S, Abrilian S, Cox C (2005) Multimodal databases of everyday emotion: facing up to complexity. In: Proceedings of Interspeech\u201905, pp 813\u2013816","DOI":"10.21437\/Interspeech.2005-381"},{"issue":"8","key":"144_CR10","doi-asserted-by":"crossref","first-page":"630","DOI":"10.1016\/j.specom.2008.04.002","volume":"50","author":"J Edlund","year":"2008","unstructured":"Edlund J, Gustafson J, Heldner M, Hjalmarsson A (2008) Towards human-like spoken dialogue systems. Speech Commun 50(8):630\u2013645","journal-title":"Speech Commun"},{"key":"144_CR11","volume-title":"Detection and avoidance of failures in dialogues\u2014wizard of Oz experiment operator\u2019s manual","author":"J Frommer","year":"2012","unstructured":"Frommer J, R\u00f6sner D, Haase M, Lange J, Friesen R, Otto M (2012) Detection and avoidance of failures in dialogues\u2014wizard of Oz experiment operator\u2019s manual. 
Pabst Science Publishers, Germany"},{"issue":"598","key":"144_CR12","doi-asserted-by":"crossref","first-page":"2293","DOI":"10.1299\/kikaic.62.2293","volume":"62","author":"S Fukuda","year":"1996","unstructured":"Fukuda S, Matsuura Y (1996) Understanding of emotional feelings in sound. Trans Jpn Soc Mech Eng Part C 62(598):2293\u20132298","journal-title":"Trans Jpn Soc Mech Eng Part C"},{"issue":"1","key":"144_CR13","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1145\/1656274.1656278","volume":"11","author":"M Hall","year":"2009","unstructured":"Hall M, Frank E, Holmes G, Pfahringer B, Reutemann P, Witten IH (2009) The WEKA data mining software: an update. ACM SIGKDD Explor Newslett 11(1):10\u201318","journal-title":"ACM SIGKDD Explor Newslett"},{"key":"144_CR14","unstructured":"Jimenez-Fernandez A, Del Pozo F, Munoz C, Zoreda JL (1987) Pattern recognition in the vocal expression of emotional categories. In: Proceedings of the 25th annual Conference of the IEEE Engineering in Medicine and Biology Society, pp 2090\u20132091"},{"key":"144_CR15","unstructured":"Jurafsky D, Martin JH (2009) Speech and language processing: an introduction to natural language processing, computational linguistics, and speech recognition. Prentice Hall, USA. http:\/\/www.cs.colorado.edu\/%7Emartin\/slp.html"},{"issue":"8","key":"144_CR16","doi-asserted-by":"crossref","first-page":"724","DOI":"10.1016\/j.ijhcs.2007.02.003","volume":"65","author":"A Kapoor","year":"2007","unstructured":"Kapoor A, Burleson W, Picard RW (2007) Automatic prediction of frustration. Int J Hum Comput Stud 65(8):724\u2013736","journal-title":"Int J Hum Comput Stud"},{"key":"144_CR17","doi-asserted-by":"crossref","first-page":"389","DOI":"10.1016\/S0065-2601(08)60241-5","volume":"28","author":"RM Krauss","year":"1996","unstructured":"Krauss RM, Chen Y, Chawla P (1996) Nonverbal behavior and nonverbal communication: what do conversational hand gestures tell us? 
Adv Exp Soc Psychol 28:389\u2013450","journal-title":"Adv Exp Soc Psychol"},{"issue":"2","key":"144_CR18","doi-asserted-by":"crossref","first-page":"293","DOI":"10.1109\/TSA.2004.838534","volume":"13","author":"CM Lee","year":"2005","unstructured":"Lee CM, Narayanan S (2005) Toward detecting emotions in spoken dialogs. IEEE Trans Speech Audio Process 13(2):293\u2013303","journal-title":"IEEE Trans Speech Audio Process"},{"key":"144_CR19","doi-asserted-by":"crossref","unstructured":"Prylipko D, Schuller B, Wendemuth A (2012) Fine-tuning HMMs for nonverbal vocalizations in spontaneous speech: a multicorpus perspective. In: Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP, pp 4625\u20134628","DOI":"10.1109\/ICASSP.2012.6288949"},{"key":"144_CR20","doi-asserted-by":"crossref","unstructured":"R\u00f6sner D, Friesen R, Otto M, Lange J, Haase M, Frommer J (2011) Human\u2013computer Interaction. Towards mobile and intelligent interaction environments. Intentionality in interacting with companion systems: an empirical approach. Springer, Berlin, pp 593\u2013602","DOI":"10.1007\/978-3-642-21616-9_67"},{"key":"144_CR21","unstructured":"R\u00f6sner D, Frommer J, Andrich R, Friesen R, Haase M, Kunze M, Lange J, Otto M (2012) LAST MINUTE: a novel corpus to support emotion, sentiment and social signal processing. In: Conference on Language Resources and Evaluation, LREC\u201912 Abstracts"},{"key":"144_CR22","unstructured":"R\u00f6sner D, Kunze M, Otto M, Frommer J (2012) Linguistic analyses of the LAST MINUTE corpus. In: Proceedings of KONVENS\u201912, \u00d6GAI, pp 145\u2013154"},{"key":"144_CR23","doi-asserted-by":"crossref","first-page":"211","DOI":"10.1023\/A:1024498629430","volume":"21","author":"KR Scherer","year":"1997","unstructured":"Scherer KR, Ceschi G (1997) Lost luggage: a field study of emotion-antecedent appraisal. 
Motiv Emot 21:211\u2013235","journal-title":"Motiv Emot"},{"issue":"3\u20134","key":"144_CR24","doi-asserted-by":"crossref","first-page":"117","DOI":"10.1007\/s12193-012-0093-9","volume":"6","author":"S Scherer","year":"2012","unstructured":"Scherer S, Glodek M, Layher G, Schels M, Schmidt M, Brosch T, Tschechne S, Schwenker F, Neumann H, Palm G (2012) A generic framework for the inference of user states in human computer interaction. J Multimodal User Interfaces 6(3\u20134):117\u2013141","journal-title":"J Multimodal User Interfaces"},{"key":"144_CR25","unstructured":"Schmidt T, Sch\u00fctte W (2010) Folker: An annotation tool for efficient transcription of natural, multi-party interaction. In: Proceedings of LREC\u201910, pp 2091\u20132096"},{"key":"144_CR26","doi-asserted-by":"crossref","unstructured":"Schuller B, Batliner A, Steidl S, Seppi D (2011) Recognising realistic emotions and affect in speech: state of the art and lessons learnt from the first challenge. Speech Commun 53(9\u201310):1062\u20131087","DOI":"10.1016\/j.specom.2011.01.011"},{"key":"144_CR27","unstructured":"Selting M, et al (2009) Gespr\u00e4chsanalytisches Transkriptionssystem 2 (GAT 2)"},{"key":"144_CR28","unstructured":"Siegert I, B\u00f6ck R, Philippou-H\u00fcbner D, Vlasenko B, Wendemuth A (2011) Appropriate emotional labeling of non-acted speech using basic emotions, Geneva emotion wheel and self assessment manikins. In: Proceedings of ICME\u201911"},{"key":"144_CR29","unstructured":"Suwa M, Sugie N, Fujimora K (1978) A preliminary note on pattern recognition of human emotional expression. In: Proceedings of the IEEE International Conference on Pattern Recognition, pp 408\u2013410"},{"key":"144_CR30","doi-asserted-by":"crossref","unstructured":"Vlasenko B, Prylipko D, Philippou-H\u00fcbner D, Wendemuth A (2011) Vowels formants analysis allows straightforward detection of high arousal acted and spontaneous emotions. 
In: Proceedings of Interspeech\u201911, pp 1577\u20131580","DOI":"10.21437\/Interspeech.2011-474"},{"key":"144_CR31","doi-asserted-by":"crossref","unstructured":"Vlasenko B, Prylipko D, B\u00f6ck R, Wendemuth A (2014) Modeling phonetic pattern variability in favor of the creation of robust emotion classifiers for real-life applications. Comput Speech Lang (Article in press)","DOI":"10.1016\/j.csl.2012.11.003"},{"key":"144_CR32","unstructured":"Walker M, Langkilde I, Wright J, Gorin A, Litman D (2000) Learning to predict problematic situations in a spoken dialogue system: experiments with how may I help you? In: Proceedings of NAACL\u201900, pp 210\u2013217"},{"key":"144_CR33","doi-asserted-by":"crossref","DOI":"10.1075\/nlp.8","volume-title":"Close engagements with artificial companions: key social, psychological, ethical and design issues","author":"Y Wilks","year":"2010","unstructured":"Wilks Y (2010) Close engagements with artificial companions: key social, psychological, ethical and design issues. John Benjamins, Amsterdam"},{"issue":"4B","key":"144_CR34","doi-asserted-by":"crossref","first-page":"1238","DOI":"10.1121\/1.1913238","volume":"52","author":"CE Williams","year":"1972","unstructured":"Williams CE, Stevens KN (1972) Emotions and speech: some acoustical correlates. J Acoust Soc Am 52(4B):1238\u20131250","journal-title":"J Acoust Soc Am"},{"key":"144_CR35","doi-asserted-by":"crossref","unstructured":"W\u00f6llmer M, Eyben F, Reiter S, Schuller B, Cox C, Douglas-Cowie E, Cowie R (2008) Abandoning emotion classes\u2014towards continuous emotion recognition with modelling of long-range dependencies. 
In: Proceedings of Interspeech\u201908, pp 597\u2013600","DOI":"10.21437\/Interspeech.2008-192"},{"issue":"1","key":"144_CR36","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/1525840.1525842","volume":"2","author":"M Wolters","year":"2009","unstructured":"Wolters M, Georgila K, Moore JD, MacPherson SE (2009) Being old doesn\u2019t mean acting old: how older users interact with spoken dialog systems. ACM Trans Access Comput 2(1):1\u201339","journal-title":"ACM Trans Access Comput"},{"key":"144_CR37","volume-title":"The HTK book (for HTK Version 3.4)","author":"S Young","year":"2006","unstructured":"Young S, Evermann G, Gales M, Hain T, Kershaw D, Liu X, Moore G, Odell J, Ollason D, Povey D, Valtchev V, Woodland P (2006) The HTK book (for HTK Version 3.4). Cambridge University Press, Cambridge"},{"issue":"2","key":"144_CR38","doi-asserted-by":"crossref","first-page":"424","DOI":"10.1109\/TMM.2006.886310","volume":"9","author":"Z Zeng","year":"2007","unstructured":"Zeng Z, Tu J, Liu M, Huang T, Pianfetti B, Roth D, Levinson S (2007) Audio-visual affect recognition. IEEE Trans Multimed 9(2):424\u2013428","journal-title":"IEEE Trans Multimed"},{"issue":"1","key":"144_CR39","doi-asserted-by":"crossref","first-page":"39","DOI":"10.1109\/TPAMI.2008.52","volume":"31","author":"Z Zeng","year":"2009","unstructured":"Zeng Z, Pantic M, Roisman GI, Huang TS (2009) A survey of affect recognition methods: audio, visual, and spontaneous expressions. 
IEEE Trans Pattern Anal Mach Intell 31(1):39\u201358","journal-title":"IEEE Trans Pattern Anal Mach Intell"}],"container-title":["Journal on Multimodal User Interfaces"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s12193-013-0144-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s12193-013-0144-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s12193-013-0144-x","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,3,20]],"date-time":"2022-03-20T18:04:27Z","timestamp":1647799467000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s12193-013-0144-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,12,28]]},"references-count":39,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2014,3]]}},"alternative-id":["144"],"URL":"https:\/\/doi.org\/10.1007\/s12193-013-0144-x","relation":{},"ISSN":["1783-7677","1783-8738"],"issn-type":[{"value":"1783-7677","type":"print"},{"value":"1783-8738","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,12,28]]}}}