{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T16:10:51Z","timestamp":1775578251652,"version":"3.50.1"},"reference-count":49,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2015,11,18]],"date-time":"2015-11-18T00:00:00Z","timestamp":1447804800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities of China","doi-asserted-by":"crossref","award":["2012YBXS10"],"award-info":[{"award-number":["2012YBXS10"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities of China","doi-asserted-by":"crossref","award":["2014KJJCA15"],"award-info":[{"award-number":["2014KJJCA15"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"crossref"}]},{"name":"National Education Science Twelfth Five-Year Plan Key Issues of the Ministry of Education","award":["DCA140229"],"award-info":[{"award-number":["DCA140229"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Multimodal User Interfaces"],"published-print":{"date-parts":[[2016,6]]},"DOI":"10.1007\/s12193-015-0203-6","type":"journal-article","created":{"date-parts":[[2015,11,18]],"date-time":"2015-11-18T14:20:50Z","timestamp":1447856450000},"page":"125-137","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":40,"title":["Combining feature-level and decision-level fusion in a hierarchical classifier for emotion recognition in the wild"],"prefix":"10.1007","volume":"10","author":[{"given":"Bo","family":"Sun","sequence":"first","affiliation":[]},{"given":"Liandong","family":"Li","sequence":"additional","affiliation":[]},{"given":"Xuewen","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Tian","family":"Zuo","sequence":"additional","affiliation":[]},{"given":"Ying","family":"Chen","sequence":"additional","affiliation":[]},{"given":"Guoyan","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"Jun","family":"He","sequence":"additional","affiliation":[]},{"given":"Xiaoming","family":"Zhu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,11,18]]},"reference":[{"key":"203_CR1","volume-title":"Nonverbal communication in human interaction","author":"M Knapp","year":"2013","unstructured":"Knapp M, Hall J, Horgan T (2013) Nonverbal communication in human interaction. Cengage Learning, Oklahoma"},{"issue":"12","key":"203_CR2","doi-asserted-by":"crossref","first-page":"1424","DOI":"10.1109\/34.895976","volume":"22","author":"M Pantic","year":"2000","unstructured":"Pantic M, Rothkrantz LJM (2000) Automatic analysis of facial expressions: the state of the art. Pattern Anal Mach Intell IEEE Trans 22(12):1424\u20131445","journal-title":"Pattern Anal Mach Intell IEEE Trans"},{"key":"203_CR3","doi-asserted-by":"crossref","unstructured":"Wu T, Bartlett MS, Movellan JR (2010) Facial expression recognition using Gabor motion energy filters. In: Computer vision and pattern recognition workshops (CVPRW), 2010 IEEE computer society conference on IEEE, pp 42\u201347","DOI":"10.1109\/CVPRW.2010.5543267"},{"issue":"7","key":"203_CR4","doi-asserted-by":"crossref","first-page":"971","DOI":"10.1109\/TPAMI.2002.1017623","volume":"24","author":"T Ojala","year":"2002","unstructured":"Ojala T, Pietikainen M, Maenpaa T (2002) Multiresolution gray-scale and rotation invariant texture classification with local binary patterns. Pattern Anal Mach Intell IEEE Trans 24(7):971\u2013987","journal-title":"Pattern Anal Mach Intell IEEE Trans"},{"key":"203_CR5","doi-asserted-by":"crossref","unstructured":"Dalal N, Triggs B (2005) Histograms of oriented gradients for human detection. In: Computer vision and pattern recognition. CVPR 2005. IEEE computer society conference, vol 1. IEEE, pp 886\u2013893","DOI":"10.1109\/CVPR.2005.177"},{"issue":"6","key":"203_CR6","doi-asserted-by":"crossref","first-page":"681","DOI":"10.1109\/34.927467","volume":"23","author":"TF Cootes","year":"2001","unstructured":"Cootes TF, Edwards GJ, Taylor CJ (2001) Active appearance models. IEEE Trans Pattern Anal Mach Intell 23(6):681\u2013685","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"203_CR7","first-page":"2211","volume":"12","author":"M G\u00f6nen","year":"2011","unstructured":"G\u00f6nen M, Alpayd\u0131n E (2011) Multiple kernel learning algorithms. J Mach Learn Res 12:2211\u20132268","journal-title":"J Mach Learn Res"},{"key":"203_CR8","doi-asserted-by":"crossref","unstructured":"Dhall A, Goecke R, Joshi J, Sikka K, Gedeon T (2014) Emotion recognition in the wild challenge 2014: Baseline, data and protocol. In: Proceedings of the 16th international conference on multimodal interaction. ACM, pp 461\u2013466","DOI":"10.1145\/2663204.2666275"},{"key":"203_CR9","unstructured":"Zhu X, Ramanan D (2012) Face detection, pose estimation, and landmark localization in the wild. In: Computer vision and pattern recognition (CVPR), 2012 IEEE conference on IEEE, pp 2879\u20132886"},{"key":"203_CR10","doi-asserted-by":"crossref","unstructured":"Xiong X, De la Torre F (2013) Supervised descent method and its applications to face alignment. In: Computer vision and pattern recognition (CVPR), IEEE conference on IEEE, pp 532\u2013539","DOI":"10.1109\/CVPR.2013.75"},{"issue":"3","key":"203_CR11","doi-asserted-by":"crossref","first-page":"34","DOI":"10.1109\/MMUL.2012.26","volume":"19","author":"A Dhall","year":"2012","unstructured":"Dhall A, Goecke R, Lucey S, Gedeon T (2012) Collecting large, richly annotated facial-expression databases from movies. IEEE Multimed 19(3):34\u201341","journal-title":"IEEE Multimed"},{"key":"203_CR12","doi-asserted-by":"crossref","unstructured":"Vedaldi A, Fulkerson B (2010) VLFeat: an open and portable library of computer vision algorithms. In: Proceedings of the international conference on multimedia. ACM, pp 1469\u20131472","DOI":"10.1145\/1873951.1874249"},{"issue":"2","key":"203_CR13","doi-asserted-by":"crossref","first-page":"213","DOI":"10.1007\/s11263-006-9794-4","volume":"73","author":"J Zhang","year":"2007","unstructured":"Zhang J, Marsza\u0142ek M, Lazebnik S, Schmid C (2007) Local features and kernels for classification of texture and object categories: a comprehensive study. Int J Comput Vis 73(2):213\u2013238","journal-title":"Int J Comput Vis"},{"key":"203_CR14","doi-asserted-by":"crossref","unstructured":"Sikka K, Wu T, Susskind J, Bartlett M (2012) Exploring bag of words architectures in the facial expression domain. In: Computer vision-ECCV 2012. Workshops and demonstrations. Springer, Berlin, pp 250\u2013259","DOI":"10.1007\/978-3-642-33868-7_25"},{"key":"203_CR15","doi-asserted-by":"crossref","unstructured":"Wang J, Yang J, Yu K, Lv F, Huang T, Gong Y (2010) Locality-constrained linear coding for image classification. In: Computer Vision and pattern recognition (CVPR), 2010 IEEE conference on IEEE, pp 3360\u20133367","DOI":"10.1109\/CVPR.2010.5540018"},{"key":"203_CR16","doi-asserted-by":"crossref","unstructured":"Lazebnik S, Schmid C, Ponce J (2006) Beyond bags of features: spatial pyramid matching for recognizing natural scene categories. In: Computer vision and pattern recognition, IEEE computer society conference on IEEE, vol. 2, pp 2169\u20132178","DOI":"10.1109\/CVPR.2006.68"},{"key":"203_CR17","doi-asserted-by":"crossref","unstructured":"Yang J, Yu K, Gong Y, Huang T (2009) Linear spatial pyramid matching using sparse coding for image classification. In: Computer vision and pattern recognition, CVPR 2009. IEEE conference on IEEE, pp 1794\u20131801","DOI":"10.1109\/CVPR.2009.5206757"},{"key":"203_CR18","doi-asserted-by":"crossref","unstructured":"Chatfield K, Lempitsky V, Vedaldi A, Zisserman A (2011) The devil is in the details: an evaluation of recent feature encoding methods. BMVC 2(4):239\u2013259","DOI":"10.5244\/C.25.76"},{"key":"203_CR19","doi-asserted-by":"crossref","unstructured":"Bosch A, Zisserman A, Munoz X (2007) Representing shape with a spatial pyramid kernel. In: Proceedings of the 6th ACM international conference on image and video retrieval. ACM, pp 401\u2013408","DOI":"10.1145\/1282280.1282340"},{"key":"203_CR20","doi-asserted-by":"crossref","unstructured":"Grauman K, Darrell T (2005) The pyramid match kernel: discriminative classification with sets of image features. In: Computer vision, ICCV 2005. Tenth IEEE international conference on IEEE, vol. 2, pp 1458\u20131465","DOI":"10.1109\/ICCV.2005.239"},{"key":"203_CR21","doi-asserted-by":"crossref","unstructured":"Dhall A, Asthana A, Goecke R, Gedeon T (2011) Emotion recognition using PHOG and LPQ features. In: Automatic face & gesture recognition and workshops (FG 2011), IEEE international conference on IEEE, pp 878\u2013883","DOI":"10.1109\/FG.2011.5771366"},{"issue":"6","key":"203_CR22","doi-asserted-by":"crossref","first-page":"915","DOI":"10.1109\/TPAMI.2007.1110","volume":"29","author":"G Zhao","year":"2007","unstructured":"Zhao G, Pietikainen M (2007) Dynamic texture recognition using local binary patterns with an application to facial expressions. Pattern Anal Mach Intell IEEE Trans 29(6):915\u2013928","journal-title":"Pattern Anal Mach Intell IEEE Trans"},{"key":"203_CR23","doi-asserted-by":"crossref","unstructured":"P\u00e4iv\u00e4rinta J, Rahtu E, Heikkil\u00e4 J (2011) Volume local phase quantization for blur-insensitive dynamic texture classification. In: Image analysis. Springer, Berlin, pp 360\u2013369","DOI":"10.1007\/978-3-642-21227-7_34"},{"key":"203_CR24","doi-asserted-by":"crossref","unstructured":"Eyben F, W\u00f6llmer M, Schuller B (2010) Opensmile: the Munich versatile and fast open-source audio feature extractor. In: Proceedings of the international conference on multimedia. ACM, pp 1459\u20131462","DOI":"10.1145\/1873951.1874246"},{"issue":"2","key":"203_CR25","first-page":"2","volume":"2","author":"S Young","year":"2006","unstructured":"Young S, Evermann G, Gales M, Hain T, Kershaw D, Liu X, Woodland P (2006) The HTK book (for HTK version 3.4). Camb Univ Eng Dep 2(2):2\u20133","journal-title":"Camb Univ Eng Dep"},{"issue":"3","key":"203_CR26","first-page":"27","volume":"2","author":"CC Chang","year":"2011","unstructured":"Chang CC, Lin CJ (2011) LIBSVM: a library for support vector machines. ACM Trans Intell Syst Technol (TIST) 2(3):27","journal-title":"ACM Trans Intell Syst Technol (TIST)"},{"key":"203_CR27","first-page":"1871","volume":"9","author":"RE Fan","year":"2008","unstructured":"Fan RE, Chang KW, Hsieh CJ, Wang XR, Lin CJ (2008) LIBLINEAR: a library for large linear classification. J Mach Learn Res 9:1871\u20131874","journal-title":"J Mach Learn Res"},{"key":"203_CR28","doi-asserted-by":"crossref","unstructured":"Liu M, Wang R, Huang Z, Shan S, Chen X (2013) Partial least squares regression on grassmannian manifold for emotion recognition. In: Proceedings of the 15th ACM on international conference on multimodal interaction. ACM, pp 525\u2013530","DOI":"10.1145\/2522848.2531738"},{"key":"203_CR29","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/j.cviu.2015.03.015","volume":"138","author":"S Zafeiriou","year":"2015","unstructured":"Zafeiriou S, Zhang C, Zhang Z (2015) A survey on face detection in the wild: past, present and future. Comput Vis Image Underst 138:1\u201324","journal-title":"Comput Vis Image Underst"},{"issue":"11","key":"203_CR30","doi-asserted-by":"crossref","first-page":"2233","DOI":"10.1109\/TPAMI.2011.282","volume":"34","author":"Y Peng","year":"2012","unstructured":"Peng Y, Ganesh A, Wright J, Xu W, Ma Y (2012) RASL: robust alignment by sparse and low-rank decomposition for linearly correlated images. Pattern Anal Mach Intell IEEE Trans 34(11):2233\u20132246","journal-title":"Pattern Anal Mach Intell IEEE Trans"},{"key":"203_CR31","unstructured":"Hassner T, Harel S, Paz E, Enbar R (2014) Effective face frontalization in unconstrained images. Preprint arXiv:1411.7964"},{"key":"203_CR32","volume-title":"Anthropology of the body","author":"P Ekman","year":"1977","unstructured":"Ekman P, Friesen WV (1977) Facial action coding system. In: Blacking J (ed) Anthropology of the body. Academic Press, New York"},{"key":"203_CR33","doi-asserted-by":"crossref","unstructured":"Sikka K, Dykstra K, Sathyanarayana S, Littlewort G, Bartlett M (2013) Multiple kernel learning for emotion recognition in the wild. In: Proceedings of the 15th ACM on international conference on multimodal interaction. ACM, pp 517\u2013524","DOI":"10.1145\/2522848.2531741"},{"key":"203_CR34","doi-asserted-by":"crossref","unstructured":"Kahou SE, Pal C, Bouthillier X, Froumenty P, G\u00fcl\u00e7ehre \u00c7, Memisevic R, Wu Z (2013) Combining modality specific deep neural networks for emotion recognition in video. In: Proceedings of the 15th ACM on international conference on multimodal interaction. ACM, pp 543\u2013550","DOI":"10.1145\/2522848.2531745"},{"key":"203_CR35","doi-asserted-by":"crossref","unstructured":"Liu M, Wang R, Li S, Shan S, Huang Z, Chen X (2014) Combining multiple kernel methods on iemannian manifold for emotion recognition in the wild. In: Proceedings of the 16th international conference on multimodal interaction. ACM, pp 494\u2013501","DOI":"10.1145\/2663204.2666274"},{"key":"203_CR36","doi-asserted-by":"crossref","unstructured":"Chen J, Chen Z, Chi Z, Fu H (2014) Emotion recognition in the wild with feature fusion and multiple kernel learning. In: Proceedings of the 16th international conference on multimodal interaction. ACM, pp 508\u2013513","DOI":"10.1145\/2663204.2666277"},{"issue":"3","key":"203_CR37","doi-asserted-by":"crossref","first-page":"572","DOI":"10.1016\/j.patcog.2010.09.020","volume":"44","author":"M Ayadi El","year":"2011","unstructured":"El Ayadi M, Kamel MS, Karray F (2011) Survey on speech emotion recognition: features, classification schemes, and databases. Pattern Recognit 44(3):572\u2013587","journal-title":"Pattern Recognit"},{"key":"203_CR38","doi-asserted-by":"crossref","first-page":"377","DOI":"10.1007\/978-0-85729-997-0_19","volume-title":"Visual analysis of humans","author":"F Torre De la","year":"2011","unstructured":"De la Torre F, Cohn JF (2011) Facial expression analysis. In: Moeslund TB, Hilton A, Kr\u00fcger V, Sigal L (eds) Visual analysis of humans. Springer, London, pp 377\u2013409"},{"key":"203_CR39","doi-asserted-by":"crossref","unstructured":"Huang X, He Q, Hong X, Zhao G, Pietikainen M (2014) Improved spatiotemporal local monogenic binary pattern for emotion recognition in the wild. In: Proceedings of the 16th international conference on multimodal interaction. ACM, pp 514\u2013520","DOI":"10.1145\/2663204.2666278"},{"issue":"7","key":"203_CR40","doi-asserted-by":"crossref","first-page":"1574","DOI":"10.1109\/TKDE.2012.89","volume":"25","author":"H Xia","year":"2013","unstructured":"Xia H, Hoi SC (2013) Mkboost: a framework of multiple kernel boosting. Knowl Data Eng IEEE Trans 25(7):1574\u20131586","journal-title":"Knowl Data Eng IEEE Trans"},{"issue":"7","key":"203_CR41","doi-asserted-by":"crossref","first-page":"1354","DOI":"10.1109\/TPAMI.2013.212","volume":"36","author":"SS Bucak","year":"2014","unstructured":"Bucak SS, Jin R, Jain AK (2014) Multiple kernel learning for visual object recognition: a review. Pattern Anal Mach Intell IEEE Trans 36(7):1354\u20131369","journal-title":"Pattern Anal Mach Intell IEEE Trans"},{"key":"203_CR42","doi-asserted-by":"crossref","unstructured":"Valstar M, Girard J, Almaev T, McKeown G, Mehu M, Yin L, Cohn J (2015) Fera 2015-second facial expression recognition and analysis challenge. Proceeding of the IEEE ICFG","DOI":"10.1109\/FG.2015.7284874"},{"key":"203_CR43","doi-asserted-by":"crossref","unstructured":"Almaev TR, Valstar MF (2013) Local gabor binary patterns from three orthogonal planes for automatic facial expression recognition. In: Affective computing and intelligent interaction (ACII), humaine association conference on IEEE, pp 356\u2013361","DOI":"10.1109\/ACII.2013.65"},{"key":"203_CR44","doi-asserted-by":"crossref","unstructured":"Valstar MF, Jiang B, Mehu M, Pantic M, Scherer K (2011) The first facial expression recognition and analysis challenge. In: Automatic face & gesture recognition and workshops (FG 2011), IEEE international conference on IEEE, pp 921\u2013926","DOI":"10.1109\/FG.2011.5771374"},{"issue":"2","key":"203_CR45","doi-asserted-by":"crossref","first-page":"97","DOI":"10.1109\/34.908962","volume":"23","author":"YL Tian","year":"2001","unstructured":"Tian YL, Kanade T, Cohn JF (2001) Recognizing action units for facial expression analysis. Pattern Anal Mach Intell IEEE Trans 23(2):97\u2013115","journal-title":"Pattern Anal Mach Intell IEEE Trans"},{"key":"203_CR46","doi-asserted-by":"crossref","unstructured":"Sun B, Li L, Zuo T, Chen Y, Zhou G, Wu X (2014) Combining multimodal features with hierarchical classifier fusion for emotion recognition in the wild. In: Proceedings of the 16th international conference on multimodal interaction. ACM, pp 481\u2013486","DOI":"10.1145\/2663204.2666272"},{"key":"203_CR47","doi-asserted-by":"crossref","unstructured":"Day M (2013) Emotion recognition with boosted tree classifiers. In: Proceedings of the 15th ACM on international conference on multimodal interaction. ACM, pp 531\u2013534","DOI":"10.1145\/2522848.2531740"},{"key":"203_CR48","doi-asserted-by":"crossref","unstructured":"Tariq U, Lin KH, Li Z, Zhou X, Wang Z, Le V, Han TX (2011) Emotion recognition from an ensemble of features. In: Automatic face & gesture recognition and workshops (FG 2011), IEEE international conference on IEEE, pp 872\u2013877","DOI":"10.1109\/FG.2011.5771365"},{"key":"203_CR49","doi-asserted-by":"crossref","unstructured":"Meudt S, Zharkov D, K\u00e4chele M, Schwenker F (2013) Multi classifier systems and forward backward feature selection algorithms to classify emotional coloured speech. In: Proceedings of the 15th ACM on international conference on multimodal interaction. ACM, pp 551\u2013556","DOI":"10.1145\/2522848.2531743"}],"container-title":["Journal on Multimodal User Interfaces"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s12193-015-0203-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s12193-015-0203-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s12193-015-0203-6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,15]],"date-time":"2023-08-15T22:16:01Z","timestamp":1692137761000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s12193-015-0203-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,11,18]]},"references-count":49,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2016,6]]}},"alternative-id":["203"],"URL":"https:\/\/doi.org\/10.1007\/s12193-015-0203-6","relation":{},"ISSN":["1783-7677","1783-8738"],"issn-type":[{"value":"1783-7677","type":"print"},{"value":"1783-8738","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,11,18]]}}}