{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T12:26:24Z","timestamp":1778243184036,"version":"3.51.4"},"reference-count":26,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2012,12,7]],"date-time":"2012-12-07T00:00:00Z","timestamp":1354838400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2013,12]]},"DOI":"10.1007\/s00371-012-0768-y","type":"journal-article","created":{"date-parts":[[2012,12,6]],"date-time":"2012-12-06T07:29:17Z","timestamp":1354778957000},"page":"1269-1275","source":"Crossref","is-referenced-by-count":39,"title":["Human emotion recognition from videos using spatio-temporal and audio features"],"prefix":"10.1007","volume":"29","author":[{"given":"Munaf","family":"Rashid","sequence":"first","affiliation":[]},{"given":"S. A. R.","family":"Abu-Bakar","sequence":"additional","affiliation":[]},{"given":"Musa","family":"Mokji","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,12,7]]},"reference":[{"key":"768_CR1","doi-asserted-by":"crossref","first-page":"1468","DOI":"10.1109\/ICME.2005.1521709","volume-title":"IEEE International Conference on Multimedia and Expo, ICME 2005","author":"C.Y. Chen","year":"2005","unstructured":"Chen, C.Y., et al.: Visual\/acoustic emotion recognition. In: IEEE International Conference on Multimedia and Expo, ICME 2005, pp. 1468\u20131471 (2005)"},{"key":"768_CR2","first-page":"15","volume-title":"Proceedings of IEEE 6th Workshop on Multimedia Signal","author":"W. Yongjin","year":"2004","unstructured":"Yongjin, W., Ling, G.: An investigation of speech-based human emotion recognition. In: Proceedings of IEEE 6th Workshop on Multimedia Signal, pp. 15\u201318 (2004)"},{"key":"768_CR3","doi-asserted-by":"crossref","first-page":"1162","DOI":"10.1016\/j.specom.2011.06.004","volume":"53","author":"C.-C. Lee","year":"2011","unstructured":"Lee, C.-C., et al.: Emotion recognition using a hierarchical binary decision tree approach. Speech Commun. 53, 1162\u20131171 (2011)","journal-title":"Speech Commun."},{"key":"768_CR4","doi-asserted-by":"crossref","first-page":"390","DOI":"10.1109\/AFGR.1998.670980","volume-title":"Proceedings of Third IEEE International Conference on Automatic Face and Gesture Recognition","author":"J.J. Lien","year":"1998","unstructured":"Lien, J.J., et al.: Automated facial expression recognition based on FACS action units. In: Proceedings of Third IEEE International Conference on Automatic Face and Gesture Recognition, pp. 390\u2013395 (1998)"},{"key":"768_CR5","first-page":"III-549","volume-title":"Proceedings of International Conference on Multimedia and Expo, ICME\u201903","author":"L. Devillers","year":"2003","unstructured":"Devillers, L., et al.: Emotion detection in task-oriented spoken dialogues. In: Proceedings of International Conference on Multimedia and Expo, ICME\u201903, vol. 3, pp.\u00a0III-549\u2013III-552 (2003)."},{"key":"768_CR6","doi-asserted-by":"crossref","first-page":"737","DOI":"10.1109\/ICME.2002.1035887","volume-title":"Proceedings of IEEE International Conference on Multimedia and Expo, ICME\u201902","author":"L. Chul Min","year":"2002","unstructured":"Chul Min, L., et al.: Classifying emotions in human\u2013machine spoken dialogs. In: Proceedings of IEEE International Conference on Multimedia and Expo, ICME\u201902, vol. 1, pp. 737\u2013740 (2002)"},{"key":"768_CR7","doi-asserted-by":"crossref","first-page":"32","DOI":"10.1109\/79.911197","volume":"18","author":"R. Cowie","year":"2001","unstructured":"Cowie, R., et al.: Emotion recognition in human\u2013computer interaction. IEEE Signal Process. Mag. 18, 32\u201380 (2001)","journal-title":"IEEE Signal Process. Mag."},{"key":"768_CR8","doi-asserted-by":"crossref","first-page":"582","DOI":"10.1109\/TASL.2008.2009578","volume":"17","author":"C. Busso","year":"2009","unstructured":"Busso, C., et al.: Analysis of emotionally salient aspects of fundamental frequency for emotion detection. IEEE Trans. Audio Speech Lang. Process. 17, 582\u2013596 (2009)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"768_CR9","doi-asserted-by":"crossref","first-page":"213","DOI":"10.1016\/S0167-6393(02)00083-3","volume":"40","author":"T.B. Louis","year":"2003","unstructured":"Louis, T.B.: Emotions, speech and the ASR framework. Speech Commun. 40, 213\u2013225 (2003)","journal-title":"Speech Commun."},{"key":"768_CR10","first-page":"2483","volume-title":"SICE 2004 Annual Conference","author":"B. Kwang-Sub","year":"2004","unstructured":"Kwang-Sub, B., et al.: Emotion recognition from facial expression using hybrid-feature extraction. In: SICE 2004 Annual Conference, vol. 3, pp. 2483\u20132487 (2004)"},{"key":"768_CR11","doi-asserted-by":"crossref","first-page":"653","DOI":"10.1109\/ICETET.2008.22","volume-title":"First International Conference on Emerging Trends in Engineering and Technology, ICETET\u201908","author":"G.U. Kharat","year":"2008","unstructured":"Kharat, G.U., Dudul, S.V.: Neural network classifier for human emotion recognition from facial expressions using discrete cosine transform. In: First International Conference on Emerging Trends in Engineering and Technology, ICETET\u201908, pp. 653\u2013658 (2008)"},{"key":"768_CR12","volume-title":"Unmasking the Face: A Guide to Recognizing Emotions from Facial Clues","author":"P. Ekman","year":"1975","unstructured":"Ekman, P., Friesen, W.V.: Unmasking the Face: A Guide to Recognizing Emotions from Facial Clues. Prentice-Hall, Englewood Cliffs (1975)"},{"key":"768_CR13","first-page":"853","volume-title":"Proceedings of Computer Society Conference on Computer Vision and Pattern Recognition","author":"J.J.J. Lien","year":"1998","unstructured":"Lien, J.J.J., et al.: Subtly different facial expression recognition and expression intensity estimation. In: Proceedings of Computer Society Conference on Computer Vision and Pattern Recognition, pp. 853\u2013859 (1998)"},{"key":"768_CR14","doi-asserted-by":"crossref","first-page":"23","DOI":"10.1023\/A:1007977618277","volume":"25","author":"M.J. Black","year":"1997","unstructured":"Black, M.J., Yacoob, Y.: Recognizing facial expressions in image sequences using local parameterized models of image motion. Int. J. Comput. Vis. 25, 23\u201348 (1997)","journal-title":"Int. J. Comput. Vis."},{"key":"768_CR15","doi-asserted-by":"crossref","first-page":"65","DOI":"10.1109\/VSPETS.2005.1570899","volume-title":"2nd Joint IEEE International Workshop on Visual Surveillance and Performance Evaluation of Tracking and Surveillance","author":"P. Dollar","year":"2005","unstructured":"Dollar, P., et al.: Behavior recognition via sparse spatio-temporal features. In: 2nd Joint IEEE International Workshop on Visual Surveillance and Performance Evaluation of Tracking and Surveillance, pp. 65\u201372 (2005)"},{"key":"768_CR16","volume-title":"Facial Action Coding System: A Technique for the Measurement of Facial Movement","author":"P. Ekman","year":"1978","unstructured":"Ekman, P., Friesen, W.V.: Facial Action Coding System: A Technique for the Measurement of Facial Movement. Consulting Psychologists Press, Palo Alto (1978)"},{"key":"768_CR17","doi-asserted-by":"crossref","first-page":"757","DOI":"10.1109\/34.598232","volume":"17","author":"I. Essa","year":"1997","unstructured":"Essa, I., Pentland, A.: Coding, analysis, interpretation and recognition off acial expressions. IEEE Trans. Pattern Anal. Mach. Intell. 17, 757\u2013763 (1997)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"768_CR18","first-page":"85","volume-title":"10th International Conference on Information Science, Signal Processing and Their Applications (ISSPA 2010)","author":"S. Omid","year":"2010","unstructured":"Omid, S., et al.: Facial expression recognition using image orientation field in limited regions and MLP neural network. In: 10th International Conference on Information Science, Signal Processing and Their Applications (ISSPA 2010), pp. 85\u201388 (2010)"},{"key":"768_CR19","first-page":"502","volume":"65","author":"R. Munaf","year":"2012","unstructured":"Munaf, R., et al.: Incorporating interactive genetic algorithm (IGA) for real world human action retrievals. Arch. Sci. 65, 502\u2013515 (2012)","journal-title":"Arch. Sci."},{"key":"768_CR20","doi-asserted-by":"crossref","first-page":"446","DOI":"10.1016\/j.patrec.2011.05.001","volume":"33","author":"S. Jones","year":"2012","unstructured":"Jones, S., et al.: Relevance feedback for real-world human action retrieval. Pattern Recognit. Lett. 33, 446\u2013452 (2012)","journal-title":"Pattern Recognit. Lett."},{"key":"768_CR21","first-page":"II-181","volume-title":"Proceedings of the International Symposium on Circuits and Systems, ISCAS\u201904","author":"M.W. Bhatti","year":"2004","unstructured":"Bhatti, M.W., et al.: A neural network approach for human emotion recognition in speech. In: Proceedings of the International Symposium on Circuits and Systems, ISCAS\u201904, vol. 2, pp.\u00a0II-181\u2013II-184 (2004)"},{"key":"768_CR22","doi-asserted-by":"crossref","first-page":"676","DOI":"10.1109\/TSMCC.2010.2050476","volume":"40","author":"R.M. Jiang","year":"2010","unstructured":"Jiang, R.M., et al.: Multimodal biometric human recognition for perceptual human computer interaction. IEEE Trans. Syst. Man Cybern., Part C, Appl. Rev. 40, 676\u2013681 (2010)","journal-title":"IEEE Trans. Syst. Man Cybern., Part C, Appl. Rev."},{"key":"768_CR23","doi-asserted-by":"crossref","first-page":"523","DOI":"10.1109\/TMM.2010.2051871","volume":"12","author":"G. Irie","year":"2010","unstructured":"Irie, G., et al.: Affective audio-visual words and latent topic driving model for realizing movie affective scene classification. IEEE Trans. Multimed. 12, 523\u2013535 (2010)","journal-title":"IEEE Trans. Multimed."},{"key":"768_CR24","volume-title":"10th International Workshop on Frontiers in Handwriting Recognition","author":"M.C.J. Milgram","year":"2006","unstructured":"Milgram, M.C.J., Sabourin, R.: One-against-one or one-against-all: which one is better for handwriting recognition with SVMs? In: 10th International Workshop on Frontiers in Handwriting Recognition (2006)"},{"key":"768_CR25","first-page":"27:1","volume":"2","author":"C.-C. Chang","year":"2011","unstructured":"Chang, C.-C., Lin, C.-J.: LIBSVM: A library for support vector machines. ACM Trans. Intell. Syst. Technol. 2, 27:1\u201327:27 (2011)","journal-title":"ACM Trans. Intell. Syst. Technol."},{"key":"768_CR26","first-page":"8","volume-title":"Proceedings of the 22nd International Conference on Data Engineering Workshops","author":"O. Martin","year":"2006","unstructured":"Martin, O., et al.: The eNTERFACE\u201905 audio-visual emotion database. In: Proceedings of the 22nd International Conference on Data Engineering Workshops, p. 8 (2006)"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-012-0768-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00371-012-0768-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-012-0768-y","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,28]],"date-time":"2019-05-28T10:59:31Z","timestamp":1559041171000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00371-012-0768-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,12,7]]},"references-count":26,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2013,12]]}},"alternative-id":["768"],"URL":"https:\/\/doi.org\/10.1007\/s00371-012-0768-y","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,12,7]]}}}