{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,2]],"date-time":"2026-05-02T15:31:34Z","timestamp":1777735894192,"version":"3.51.4"},"reference-count":58,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2020,1,22]],"date-time":"2020-01-22T00:00:00Z","timestamp":1579651200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,1,22]],"date-time":"2020-01-22T00:00:00Z","timestamp":1579651200000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Cogn Comput"],"published-print":{"date-parts":[[2021,3]]},"DOI":"10.1007\/s12559-019-09704-5","type":"journal-article","created":{"date-parts":[[2020,1,22]],"date-time":"2020-01-22T02:02:34Z","timestamp":1579658554000},"page":"277-289","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":21,"title":["Emotion Aided Dialogue Act Classification for Task-Independent Conversations in a Multi-modal Framework"],"prefix":"10.1007","volume":"13","author":[{"given":"Tulika","family":"Saha","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dhawal","family":"Gupta","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sriparna","family":"Saha","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pushpak","family":"Bhattacharyya","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2020,1,22]]},"reference":[{"key":"9704_CR1","unstructured":"Jurafsky D, Bates R, Coccaro N, Martin R, Meteer M, Ries K, Shriberg E, Stolcke A, Taylor P, Van 
Ess-Dykema C. 1997. Automatic detection of discourse structure for speech recognition and understanding. In: 1997 IEEE workshop on automatic speech recognition and understanding proceedings, IEEE, pp 88\u201395."},{"issue":"3","key":"9704_CR2","doi-asserted-by":"publisher","first-page":"339","DOI":"10.1162\/089120100561737","volume":"26","author":"A Stolcke","year":"2000","unstructured":"Stolcke A, Ries K, Coccaro N, Shriberg E, Bates R, Jurafsky D, Taylor P, Martin R, Ess-Dykema C V, Meteer M. Dialogue act modeling for automatic tagging and recognition of conversational speech. Computational linguistics 2000;26(3):339\u2013373.","journal-title":"Computational linguistics"},{"key":"9704_CR3","unstructured":"Verbree D, Rienks R, Heylen D. 2006. Dialogue-act tagging using smart feature selection; results on multiple corpora. In: Spoken Language Technology Workshop, 2006. IEEE, IEEE, pp 70\u201373."},{"key":"9704_CR4","doi-asserted-by":"crossref","unstructured":"Kalchbrenner N, Blunsom P. 2013. Recurrent convolutional neural networks for discourse compositionality. arXiv:13063584.","DOI":"10.3115\/v1\/P14-1062"},{"key":"9704_CR5","unstructured":"Papalampidi P, Iosif E, Potamianos A. 2017. Dialogue act semantic representation and classification using recurrent neural networks. SEMDIAL 2017 SaarDial, pp 104."},{"key":"9704_CR6","unstructured":"Liu Y, Han K, Tan Z, Lei Y. 2017. Using context information for dialog act classification in dnn framework. In: Proceedings of the 2017 conference on empirical methods in natural language processing, pp 2170\u20132178."},{"issue":"3","key":"9704_CR7","doi-asserted-by":"publisher","first-page":"94","DOI":"10.3390\/info10030094","volume":"10","author":"E Ribeiro","year":"2019","unstructured":"Ribeiro E, Ribeiro R, de Matos D M. A multilingual and multidomain study on dialog act recognition using character-level tokenization. 
Information 2019;10(3):94.","journal-title":"Information"},{"key":"9704_CR8","doi-asserted-by":"publisher","DOI":"10.1007\/0-387-36921-X","volume-title":"Handbook of social psychology","author":"JD DeLamater","year":"2006","unstructured":"DeLamater JD, Ward A. Handbook of social psychology. Berlin: Springer; 2006."},{"key":"9704_CR9","first-page":"447","volume":"11","author":"KS Fleckenstein","year":"1991","unstructured":"Fleckenstein K S. Defining affect in relation to cognition: A response to susan mcleod. J Adv Comp 1991;11: 447\u2013453.","journal-title":"J Adv Comp"},{"key":"9704_CR10","volume-title":"Handbook of emotions","author":"LF Barrett","year":"1993","unstructured":"Barrett L F, Lewis M, Haviland-Jones JM. Handbook of emotions. New York: The Guilford Press; 1993."},{"key":"9704_CR11","unstructured":"Zadeh AB, Liang PP, Poria S, Cambria E, Morency LP. 2018. Multimodal language analysis in the wild: Cmu-mosei data-set and interpretable dynamic fusion graph. In: Proceedings of the 56th annual meeting of the association for computational linguistics (vol 1: Long Papers), pp 2236\u20132246."},{"issue":"1","key":"9704_CR12","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1109\/79.911197","volume":"18","author":"R Cowie","year":"2001","unstructured":"Cowie R, Douglas-Cowie E, Tsapatsoulis N, Votsis G, Kollias S, Fellenz W, Taylor J G. Emotion recognition in human-computer interaction. IEEE Signal Proc Mag 2001;18(1):32\u201380.","journal-title":"IEEE Signal Proc Mag"},{"key":"9704_CR13","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1016\/j.patrec.2018.04.010","volume":"115","author":"N Jain","year":"2018","unstructured":"Jain N, Kumar S, Kumar A, Shamsolmoali P, Zareapoor M. Hybrid deep neural networks for face emotion recognition. 
Pattern Recogn Lett 2018;115:101\u2013106.","journal-title":"Pattern Recogn Lett"},{"issue":"10","key":"9704_CR14","doi-asserted-by":"publisher","first-page":"3030","DOI":"10.1109\/TCSVT.2017.2719043","volume":"28","author":"S Zhang","year":"2018","unstructured":"Zhang S, Zhang S, Huang T, Gao W, Tian Q. Learning affective features with a hybrid deep model for audio\u2013visual emotion recognition. IEEE Trans Circuits Syst Video Technol 2018;28(10):3030\u20133043.","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"9704_CR15","unstructured":"Huang C, Zaiane O, Trabelsi A, Dziri N. 2018. Automatic dialogue generation with expressed emotions. In: Proceedings of the 2018 conference of the north american chapter of the association for computational linguistics: Human language technologies, vol 2 (Short Papers), pp 49\u201354."},{"key":"9704_CR16","doi-asserted-by":"crossref","unstructured":"Zhou H, Huang M, Zhang T, Zhu X, Liu B. 2018. Emotional chatting machine: Emotional conversation generation with internal and external memory. In: 32nd AAAI conference on artificial intelligence.","DOI":"10.1609\/aaai.v32i1.11325"},{"key":"9704_CR17","unstructured":"Fung P, Bertero D, Xu P, Park J H, Wu C S, Madotto A. 2018. Empathetic dialog systems. In: The international conference on language resources and evaluation. European Language Resources Association."},{"issue":"4","key":"9704_CR18","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1109\/T-AFFC.2013.20","volume":"4","author":"N Novielli","year":"2013","unstructured":"Novielli N, Strapparava C. The role of affect analysis in dialogue act identification. IEEE Trans Affect Comput 2013;4(4):439\u2013451.","journal-title":"IEEE Trans Affect Comput"},{"key":"9704_CR19","unstructured":"Bosma W, Andr\u00e9 E. 2004. Exploiting emotions to disambiguate dialogue acts. 
In: Proceedings of the 9th international conference on Intelligent user interfaces, ACM, pp 85\u201392."},{"key":"9704_CR20","unstructured":"Poria S, Cambria E, Hazarika D, Mazumder N, Zadeh A, Morency LP. 2017. Multi-level multiple attentions for contextual multimodal sentiment analysis. In: 2017 IEEE international conference on data mining (ICDM), IEEE, pp 1033\u20131038."},{"key":"9704_CR21","unstructured":"Poria S, Cambria E, Hazarika D, Majumder N, Zadeh A, Morency LP. 2017. Context-dependent sentiment analysis in user-generated videos. In: Proceedings of the 55th annual meeting of the association for computational linguistics (vol 1: Long Papers), pp 873\u2013883."},{"issue":"4","key":"9704_CR22","doi-asserted-by":"publisher","first-page":"335","DOI":"10.1007\/s10579-008-9076-6","volume":"42","author":"C Busso","year":"2008","unstructured":"Busso C, Bulut M, Lee C C, Kazemzadeh A, Mower E, Kim S, Chang J N, Lee S, Narayanan S S. Iemocap: Interactive emotional dyadic motion capture database. Language resources and evaluation 2008;42(4):335.","journal-title":"Language resources and evaluation"},{"key":"9704_CR23","doi-asserted-by":"crossref","unstructured":"Reithinger N, Klesen M. 1997. Dialogue act classification using language models. In: 5th European conference on speech communication and technology.","DOI":"10.21437\/Eurospeech.1997-589"},{"key":"9704_CR24","unstructured":"Stolcke A, Shriberg E, Bates R, Coccaro N, Jurafsky D, Martin R, Meteer M, Ries K, Taylor P, Van Ess-Dykema C, et al. 1998. Dialog act modeling for conversational speech. In: AAAI spring symposium on applying machine learning to discourse processing, pp 98\u2013105."},{"key":"9704_CR25","unstructured":"Grau S, Sanchis E, Castro MJ, Vilar D. 2004. Dialogue act classification using a bayesian approach. In: 9th Conference Speech and Computer."},{"key":"9704_CR26","unstructured":"Godfrey J J, Holliman E C, McDaniel J. 1992. Switchboard: Telephone speech corpus for research and development. 
In: 1992 IEEE international conference on acoustics, speech, and signal processing, 1992. ICASSP-92, IEEE, vol 1, pp 517-520."},{"key":"9704_CR27","unstructured":"Khanpour H, Guntakandla N, Nielsen R. 2016. Dialogue act classification in domain-independent conversations using a deep recurrent neural network. In: Proceedings of COLING 2016, The 26th international conference on computational linguistics: Technical Papers, pp 2012\u20132021."},{"key":"9704_CR28","unstructured":"Lee JY, Dernoncourt F. 2016. Sequential short-text classification with recurrent and convolutional neural networks. In: Proceedings of the 2016 Conference of the North American chapter of the association for computational linguistics: Human language technologies, association for computational linguistics, pp 515\u2013520. http:\/\/aclweb.org\/anthology\/N16-1062."},{"key":"9704_CR29","doi-asserted-by":"crossref","unstructured":"Kumar H, Agarwal A, Dasgupta R, Joshi S. 2018. Dialogue act sequence labeling using hierarchical encoder with crf. In: 32nd AAAI conference on artificial intelligence.","DOI":"10.1609\/aaai.v32i1.11701"},{"key":"9704_CR30","unstructured":"Raheja V, Tetreault J. 2019. Dialogue act classification with context-aware self-attention. arXiv:190402594."},{"key":"9704_CR31","doi-asserted-by":"crossref","unstructured":"Yu Y, Peng S, Yang GH. 2019. Modeling long-range context for concurrent dialogue acts recognition. arXiv:190900521.","DOI":"10.1145\/3357384.3358145"},{"issue":"2","key":"9704_CR32","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1016\/0306-4573(92)90044-Z","volume":"28","author":"S Sitter","year":"1992","unstructured":"Sitter S, Stein A. Modeling the illocutionary aspects of information-seeking dialogues. Inf Process Manag 1992;28(2):165\u2013180.","journal-title":"Inf Process Manag"},{"key":"9704_CR33","unstructured":"Ortega D, Li C Y, Vallejo G, Denisov P, Vu NT. 2019. 
Context-aware neural-based dialog act classification on automatically generated transcriptions. In: ICASSP 2019-2019 IEEE international conference on acoustics, speech and signal processing (ICASSP). IEEE, pp 7265\u20137269."},{"key":"9704_CR34","doi-asserted-by":"publisher","unstructured":"Saha T, Srivastava S, Firdaus M, Saha S, Ekbal A, Bhattacharyya P. 2019. Exploring machine learning and deep learning frameworks for task-oriented dialogue act classification. In: International joint conference on neural networks, IJCNN 2019 Budapest, Hungary, July 14-19, 2019, pp 1\u20138. https:\/\/doi.org\/10.1109\/IJCNN.2019.8851943.","DOI":"10.1109\/IJCNN.2019.8851943"},{"key":"9704_CR35","unstructured":"Boyer KE, Grafsgaard JF, Ha EY, Phillips R, Lester JC. 2011. An affect-enriched dialogue act classification model for task-oriented dialogue. In: Proceedings of the 49th annual meeting of the association for computational linguistics: Human language technologies vol 1, Association for Computational Linguistics, pp 1190\u20131199."},{"key":"9704_CR36","unstructured":"Ihasz P L, Kryssanov V. 2018. Emotions and intentions mediated with dialogue acts. In: 2018 5th international conference on business and industrial research (ICBIR), IEEE, pp 125\u2013130."},{"key":"9704_CR37","unstructured":"Cerisara C, Jafaritazehjani S, Oluokun A, Le H. 2018. Multi-task dialog act and sentiment recognition on mastodon. arXiv:180705013."},{"key":"9704_CR38","doi-asserted-by":"crossref","unstructured":"Vosoughi S, Roy D. 2016. Tweet acts: A speech act classifier for twitter. In: 10th international AAAI conference on web and social media.","DOI":"10.1609\/icwsm.v10i1.14821"},{"issue":"4","key":"9704_CR39","doi-asserted-by":"publisher","first-page":"625","DOI":"10.1007\/s12559-018-9548-y","volume":"10","author":"P Lauren","year":"2018","unstructured":"Lauren P, Qu G, Yang J, Watta P, Huang G B, Lendasse A. 
Generating word embeddings from an extreme learning machine for sentiment analysis and sequence labeling tasks. Cogn Comput 2018;10(4):625\u2013638.","journal-title":"Cogn Comput"},{"key":"9704_CR40","doi-asserted-by":"crossref","unstructured":"Wang Z, Lin Z. 2019. Optimal feature selection for learning-based algorithms for sentiment classification. Cognitive Computation pp 1\u201311.","DOI":"10.1007\/s12559-019-09669-5"},{"issue":"3","key":"9704_CR41","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1007\/s12559-017-9539-4","volume":"10","author":"X Sun","year":"2018","unstructured":"Sun X, Peng X, Ding S. Emotional human-machine conversation generation based on long short-term memory. Cogn Comput 2018;10(3):389\u2013397. https:\/\/doi.org\/10.1007\/s12559-017-9539-4.","journal-title":"Cogn Comput"},{"issue":"2","key":"9704_CR42","doi-asserted-by":"publisher","first-page":"336","DOI":"10.1007\/s12559-015-9352-x","volume":"8","author":"D Griol","year":"2016","unstructured":"Griol D, Callejas Z. Mobile conversational agents for context-aware care applications. Cogn Comput 2016;8(2):336\u2013356. https:\/\/doi.org\/10.1007\/s12559-015-9352-x.","journal-title":"Cogn Comput"},{"issue":"3","key":"9704_CR43","doi-asserted-by":"publisher","first-page":"351","DOI":"10.1007\/s12559-013-9244-x","volume":"6","author":"LF Rodr\u00edguez","year":"2014","unstructured":"Rodr\u00edguez LF, Ramos F. Development of computational models of emotions for autonomous agents: A review. Cogn Comput 2014;6(3):351\u2013375. https:\/\/doi.org\/10.1007\/s12559-013-9244-x.","journal-title":"Cogn Comput"},{"key":"9704_CR44","doi-asserted-by":"crossref","unstructured":"Shriberg E, Dhillon R, Bhagat S, Ang J, Carvey H. The icsi meeting recorder dialog act (mrda) corpus. Proceedings of the 5th SIGdial Workshop on Discourse and Dialogue at HLT-NAACL; 2004.","DOI":"10.21236\/ADA460980"},{"key":"9704_CR45","doi-asserted-by":"crossref","unstructured":"Heeman P A, Allen J F. 1995. 
The trains 93 dialogues. Tech. rep., Rochester Univ NY Dept of Computer Science.","DOI":"10.21236\/ADA301012"},{"issue":"4","key":"9704_CR46","doi-asserted-by":"publisher","first-page":"351","DOI":"10.1177\/002383099103400404","volume":"34","author":"AH Anderson","year":"1991","unstructured":"Anderson A H, Bader M, Bard E G, Boyle E, Doherty G, Garrod S, Isard S, Kowtko J, McAllister J, Miller J, et al. The hcrc map task corpus. Language and speech 1991;34(4):351\u2013366.","journal-title":"Language and speech"},{"key":"9704_CR47","unstructured":"Jurafsky D. 1997. Switchboard swbd-damsl shallow-discourse-function annotation coders manual. Institute of Cognitive Science Technical Report."},{"issue":"10","key":"9704_CR48","first-page":"1995","volume":"3361","author":"Y LeCun","year":"1995","unstructured":"LeCun Y, Bengio Y, et al. Convolutional networks for images, speech, and time series. The handbook of brain theory and neural networks 1995;3361(10):1995.","journal-title":"The handbook of brain theory and neural networks"},{"key":"9704_CR49","unstructured":"Pennington J, Socher R, Manning C. 2014. Glove: Global vectors for word representation. In: Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP), pp 1532\u20131543."},{"key":"9704_CR50","unstructured":"Eyben F, W\u00f6llmer M, Schuller B. 2010. Opensmile: The munich versatile and fast open-source audio feature extractor. In: Proceedings of the 18th ACM international conference on Multimedia, ACM, pp 1459\u20131462."},{"issue":"3","key":"9704_CR51","doi-asserted-by":"publisher","first-page":"994","DOI":"10.1109\/TASL.2011.2170835","volume":"20","author":"T Drugman","year":"2011","unstructured":"Drugman T, Thomas M, Gudnason J, Naylor P, Dutoit T. Detection of glottal closure instants from speech signals: A quantitative review. 
IEEE Trans Audio, Speech, Language Process 2011;20(3):994\u20131006.","journal-title":"IEEE Trans Audio, Speech, Language Process"},{"issue":"6","key":"9704_CR52","doi-asserted-by":"publisher","first-page":"1170","DOI":"10.1109\/TASL.2013.2245653","volume":"21","author":"J Kane","year":"2013","unstructured":"Kane J, Gobl C. Wavelet maxima dispersion for breathy to tense voice discrimination. IEEE Trans Audio, Speech, Language Process 2013;21(6):1170\u20131179.","journal-title":"IEEE Trans Audio, Speech, Language Process"},{"key":"9704_CR53","doi-asserted-by":"crossref","unstructured":"Drugman T, Alwan A. 2011. Joint robust voicing detection and pitch estimation based on residual harmonics. In: 12th annual conference of the international speech communication association.","DOI":"10.21437\/Interspeech.2011-519"},{"issue":"4","key":"9704_CR54","doi-asserted-by":"publisher","first-page":"1738","DOI":"10.1121\/1.399423","volume":"87","author":"H Hermansky","year":"1990","unstructured":"Hermansky H. Perceptual linear predictive (plp) analysis of speech. The Journal of the Acoustical Society of America 1990;87(4):1738\u20131752.","journal-title":"The Journal of the Acoustical Society of America"},{"key":"9704_CR55","unstructured":"Fastl H. 2005. Psycho-acoustics and sound quality. In: Communication acoustics, Springer, pp 139\u2013162."},{"issue":"9","key":"9704_CR56","doi-asserted-by":"publisher","first-page":"1055","DOI":"10.1109\/PROC.1982.12433","volume":"70","author":"DJ Thomson","year":"1982","unstructured":"Thomson D J. Spectrum estimation and harmonic analysis. Proc IEEE 1982;70(9):1055\u20131096.","journal-title":"Proc IEEE"},{"issue":"8","key":"9704_CR57","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter S, Schmidhuber J. Long short-term memory. 
Neural Comput 1997;9(8):1735\u20131780.","journal-title":"Neural Comput"},{"issue":"1\/2","key":"9704_CR58","doi-asserted-by":"publisher","first-page":"28","DOI":"10.2307\/2332510","volume":"34","author":"BL Welch","year":"1947","unstructured":"Welch B L. The generalization of \u2018Student\u2019s\u2019 problem when several different population variances are involved. Biometrika 1947;34(1\/2):28\u201335.","journal-title":"Biometrika"}],"container-title":["Cognitive Computation"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s12559-019-09704-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s12559-019-09704-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s12559-019-09704-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,25]],"date-time":"2023-09-25T12:56:31Z","timestamp":1695646591000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s12559-019-09704-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,1,22]]},"references-count":58,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2021,3]]}},"alternative-id":["9704"],"URL":"https:\/\/doi.org\/10.1007\/s12559-019-09704-5","relation":{},"ISSN":["1866-9956","1866-9964"],"issn-type":[{"value":"1866-9956","type":"print"},{"value":"1866-9964","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,1,22]]},"assertion":[{"value":"30 August 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 November 2019","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article 
History"}},{"value":"22 January 2020","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with Ethical Standards"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of Interest"}},{"value":"This article does not contain any studies with human participants or animals performed by any of the authors.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical Approval"}}]}}