{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T17:04:50Z","timestamp":1765040690527,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":28,"publisher":"ACM","license":[{"start":{"date-parts":[[2015,11,9]],"date-time":"2015-11-09T00:00:00Z","timestamp":1447027200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"the Fundamental Research Funds for the Central Universities of China","award":["2014KJJCA15, 2012YBXS10"],"award-info":[{"award-number":["2014KJJCA15, 2012YBXS10"]}]},{"name":"the National Education Science Twelfth Five-Year Plan Key Issues of the Ministry of Education","award":["DCA140229"],"award-info":[{"award-number":["DCA140229"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2015,11,9]]},"DOI":"10.1145\/2818346.2830586","type":"proceedings-article","created":{"date-parts":[[2016,11,9]],"date-time":"2016-11-09T20:43:27Z","timestamp":1478724207000},"page":"497-502","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":37,"title":["Combining Multimodal Features within a Fusion Network for Emotion Recognition in the Wild"],"prefix":"10.1145","author":[{"given":"Bo","family":"Sun","sequence":"first","affiliation":[{"name":"Beijing Normal University, Beijing, China"}]},{"given":"Liandong","family":"Li","sequence":"additional","affiliation":[{"name":"Beijing Normal University, Beijing, China"}]},{"given":"Guoyan","family":"Zhou","sequence":"additional","affiliation":[{"name":"Beijing Normal University, Beijing, China"}]},{"given":"Xuewen","family":"Wu","sequence":"additional","affiliation":[{"name":"Beijing Normal University, Beijing, China"}]},{"given":"Jun","family":"He","sequence":"additional","affiliation":[{"name":"Beijing Normal University, Beijing, China"}]},{"given":"Lejun","family":"Yu","sequence":"additional","affiliation":[{"name":"Beijing Normal University, Beijing, China"}]},{"given":"Dongxue","family":"Li","sequence":"additional","affiliation":[{"name":"Beijing Normal University, Beijing, China"}]},{"given":"Qinglan","family":"Wei","sequence":"additional","affiliation":[{"name":"Beijing Normal University, Beijing, China"}]}],"member":"320","published-online":{"date-parts":[[2015,11,9]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Communication without words. Psychological today,2, 53--55","author":"Mehrabian A.","year":"1968","unstructured":"Mehrabian , A. ( 1968 ). Communication without words. Psychological today,2, 53--55 . Mehrabian, A. (1968). Communication without words. Psychological today,2, 53--55."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/34.895976"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2007.1110"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"crossref","unstructured":"P\u00e4iv\u00e4rinta J. Rahtu E. & Heikkil\u00e4 J. (2011). Volume local phase quantization for blur-insensitive dynamic texture classification. In Image Analysis (pp. 360--369). Springer Berlin Heidelberg.   P\u00e4iv\u00e4rinta J. Rahtu E. & Heikkil\u00e4 J. (2011). Volume local phase quantization for blur-insensitive dynamic texture classification. In Image Analysis (pp. 360--369). Springer Berlin Heidelberg.","DOI":"10.1007\/978-3-642-21227-7_34"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2005.177"},{"key":"e_1_3_2_1_6_1","first-page":"1150","volume-title":"The proceedings of the seventh IEEE international conference on (Vol. 2","author":"Lowe D. G.","year":"1999","unstructured":"Lowe , D. G. ( 1999 ). Object recognition from local scale-invariant features. In Computer vision, 1999 . The proceedings of the seventh IEEE international conference on (Vol. 2 , pp. 1150 -- 1157 ). Ieee. Lowe, D. G. (1999). Object recognition from local scale-invariant features. In Computer vision, 1999. The proceedings of the seventh IEEE international conference on (Vol. 2, pp. 1150--1157). Ieee."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5946910"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/MMUL.2012.26"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2011.6130508"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33868-7_25"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"crossref","first-page":"312","DOI":"10.21437\/Interspeech.2009-103","volume-title":"The INTERSPEECH 2009 emotion challenge. In INTERSPEECH (Vol.","author":"Schuller B.","year":"2009","unstructured":"Schuller , B. , Steidl , S. , & Batliner , A. ( 2009 , September) . The INTERSPEECH 2009 emotion challenge. In INTERSPEECH (Vol. 2009, pp. 312 -- 315 ). Schuller, B., Steidl, S., & Batliner, A. (2009, September). The INTERSPEECH 2009 emotion challenge. In INTERSPEECH (Vol. 2009, pp. 312--315)."},{"key":"e_1_3_2_1_12_1","volume-title":"Advances in neural information processing systems (pp. 1097--1105).","author":"Krizhevsky A.","year":"2012","unstructured":"Krizhevsky , A. , Sutskever , I. , & Hinton , G. E. ( 2012 ). Imagenet classification with deep convolutional neural networks . In Advances in neural information processing systems (pp. 1097--1105). Krizhevsky, A., Sutskever, I., & Hinton, G. E. (2012). Imagenet classification with deep convolutional neural networks. In Advances in neural information processing systems (pp. 1097--1105)."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/1873951.1874246"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/2818346.2829994"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.68"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33868-7_25"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/2522848.2531741"},{"key":"e_1_3_2_1_19_1","volume-title":"Computer Vision and Pattern Recognition (CVPR), 2010 IEEE Conference on (pp. 3360--3367)","author":"Wang J.","year":"2010","unstructured":"Wang , J. , Yang , J. , Yu , K. , Lv , F. , Huang , T. , & Gong , Y. ( 2010 , June). Locality-constrained linear coding for image classification . In Computer Vision and Pattern Recognition (CVPR), 2010 IEEE Conference on (pp. 3360--3367) . IEEE. Wang, J., Yang, J., Yu, K., Lv, F., Huang, T., & Gong, Y. (2010, June). Locality-constrained linear coding for image classification. In Computer Vision and Pattern Recognition (CVPR), 2010 IEEE Conference on (pp. 3360--3367). IEEE."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/1873951.1874249"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1038\/nature14539"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.5555\/1390681.1442794"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/2663204.2666272"},{"key":"e_1_3_2_1_26_1","volume-title":"EmoNets: Multimodal deep learning approaches for emotion recognition in video. arXiv preprint arXiv:1503.01800","author":"Kahou S. E.","year":"2015","unstructured":"Kahou , S. E. , Bouthillier , X. , Lamblin , P. , Gulcehre , C. , Michalski , V. , Konda , K. , ... & Bengio , Y. ( 2015 ). EmoNets: Multimodal deep learning approaches for emotion recognition in video. arXiv preprint arXiv:1503.01800 . Kahou, S. E., Bouthillier, X., Lamblin, P., Gulcehre, C., Michalski, V., Konda, K., ... & Bengio, Y. (2015). EmoNets: Multimodal deep learning approaches for emotion recognition in video. arXiv preprint arXiv:1503.01800."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654889"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553510"}],"event":{"name":"ICMI '15: INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"],"location":"Seattle Washington USA","acronym":"ICMI '15"},"container-title":["Proceedings of the 2015 ACM on International Conference on Multimodal Interaction"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2818346.2830586","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2818346.2830586","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T05:43:39Z","timestamp":1750225419000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2818346.2830586"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,11,9]]},"references-count":28,"alternative-id":["10.1145\/2818346.2830586","10.1145\/2818346"],"URL":"https:\/\/doi.org\/10.1145\/2818346.2830586","relation":{},"subject":[],"published":{"date-parts":[[2015,11,9]]},"assertion":[{"value":"2015-11-09","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}