{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T05:17:13Z","timestamp":1776835033302,"version":"3.51.2"},"publisher-location":"Cham","reference-count":39,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030778729","type":"print"},{"value":"9783030778736","type":"electronic"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-77873-6_16","type":"book-chapter","created":{"date-parts":[[2021,7,2]],"date-time":"2021-07-02T23:04:56Z","timestamp":1625267096000},"page":"219-233","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":14,"title":["Measuring and Integrating Facial Expressions and Head Pose as Indicators of Engagement and Affect in Tutoring Systems"],"prefix":"10.1007","author":[{"given":"Hao","family":"Yu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ankit","family":"Gupta","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Will","family":"Lee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ivon","family":"Arroyo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Margrit","family":"Betke","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Danielle","family":"Allesio","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tom","family":"Murray","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"John","family":"Magee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Beverly P.","family":"Woolf","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,7,3]]},"reference":[{"issue":"4","key":"16_CR1","doi-asserted-by":"publisher","first-page":"387","DOI":"10.1007\/s40593-014-0023-y","volume":"24","author":"I Arroyo","year":"2014","unstructured":"Arroyo, I., Woolf, B.P., Burelson, W., Muldner, K., Rai, D., Tai, M.: A multimedia adaptive tutoring system for mathematics that addresses cognition, metacognition and affect. Int. J. Artif. Intell. Educ. 24(4), 387\u2013426 (2014)","journal-title":"Int. J. Artif. Intell. Educ."},{"issue":"4","key":"16_CR2","doi-asserted-by":"publisher","first-page":"223","DOI":"10.1016\/j.ijhcs.2009.12.003","volume":"68","author":"RS Baker","year":"2010","unstructured":"Baker, R.S., D\u2019Mello, S.K., Rodrigo, M.M.T., Graesser, A.C.: Better to be frustrated than bored: The incidence, persistence, and impact of learners\u2019 cognitive-affective states during interactions with three different computer-based learning environments. Int. J. Hum.-Comput. Stud. 68(4), 223\u2013241 (2010)","journal-title":"Int. J. Hum.-Comput. Stud."},{"issue":"2","key":"16_CR3","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2946837","volume":"6","author":"N Bosch","year":"2016","unstructured":"Bosch, N., D\u2019mello, S.K., Ocumpaugh, J., Baker, R.S., Shute, V.: Using video to automatically detect learner affect in computer-enabled classrooms. ACM Trans. Inter. Intell. Syst. (TiiS) 6(2), 1\u201326 (2016)","journal-title":"ACM Trans. Inter. Intell. Syst. (TiiS)"},{"key":"16_CR4","doi-asserted-by":"crossref","unstructured":"Bulat, A., Tzimiropoulos, G.: How far are we from solving the 2d & 3d face alignment problem?(and a dataset of 230,000 3D facial landmarks). In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1021\u20131030 (2017)","DOI":"10.1109\/ICCV.2017.116"},{"key":"16_CR5","doi-asserted-by":"crossref","unstructured":"Chang, F.J., Tuan Tran, A., Hassner, T., Masi, I., Nevatia, R., Medioni, G.: Faceposenet: making a case for landmark-free face alignment. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp. 1599\u20131608 (2017)","DOI":"10.1109\/ICCVW.2017.188"},{"key":"16_CR6","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"92","DOI":"10.1007\/978-3-319-20267-9_8","volume-title":"User Modeling, Adaptation and Personalization","author":"S Corrigan","year":"2015","unstructured":"Corrigan, S., Barkley, T., Pardos, Z.: Dynamic approaches to modeling student affect and its changing role in learning and performance. In: Ricci, F., Bontcheva, K., Conlan, O., Lawless, S. (eds.) UMAP 2015. LNCS, vol. 9146, pp. 92\u2013103. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-20267-9_8"},{"issue":"2","key":"16_CR7","doi-asserted-by":"publisher","first-page":"104","DOI":"10.1080\/00461520.2017.1281747","volume":"52","author":"S D\u2019Mello","year":"2017","unstructured":"D\u2019Mello, S., Dieterle, E., Duckworth, A.: Advanced, analytic, automated (AAA) measurement of engagement during learning. Educ. Psychol. 52(2), 104\u2013123 (2017)","journal-title":"Educ. Psychol."},{"issue":"5","key":"16_CR8","doi-asserted-by":"publisher","first-page":"377","DOI":"10.1016\/j.ijhcs.2012.01.004","volume":"70","author":"S D\u2019Mello","year":"2012","unstructured":"D\u2019Mello, S., Olney, A., Williams, C., Hays, P.: Gaze tutor: a gaze-reactive intelligent tutoring system. Int. J. Hum.-Comput. Stud. 70(5), 377\u2013398 (2012)","journal-title":"Int. J. Hum.-Comput. Stud."},{"key":"16_CR9","doi-asserted-by":"publisher","first-page":"153","DOI":"10.1016\/j.learninstruc.2012.05.003","volume":"29","author":"S D\u2019Mello","year":"2014","unstructured":"D\u2019Mello, S., Lehman, B., Pekrun, R., Graesser, A.: Confusion can be beneficial for learning. Learn. Instr. 29, 153\u2013170 (2014)","journal-title":"Learn. Instr."},{"key":"16_CR10","series-title":"Educational Communications and Technology: Issues and Innovations","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1007\/978-3-030-02631-8_6","volume-title":"Mind, Brain and Technology","author":"SK D\u2019Mello","year":"2019","unstructured":"D\u2019Mello, S.K.: Gaze-based attention-aware cyberlearning technologies. In: Parsons, T.D., Lin, L., Cockerham, D. (eds.) Mind, Brain and Technology. ECTII, pp. 87\u2013105. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-02631-8_6"},{"key":"16_CR11","unstructured":"Ekman, P., Friesen, W.V., Hager, J.C.: Facial action coding system. Research Nexus, Salt Lake City (2002)"},{"issue":"2","key":"16_CR12","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1037\/h0030377","volume":"17","author":"P Ekman","year":"1971","unstructured":"Ekman, P., Friesen, W.V.: Constants across cultures in the face and emotion. J. Pers. Soc. Psychol. 17(2), 124 (1971)","journal-title":"J. Pers. Soc. Psychol."},{"key":"16_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1007\/978-3-642-23123-0_11","volume-title":"Pattern Recognition","author":"G Fanelli","year":"2011","unstructured":"Fanelli, G., Weise, T., Gall, J., Van Gool, L.: Real time head pose estimation from consumer depth cameras. In: Mester, R., Felsberg, M. (eds.) DAGM 2011. LNCS, vol. 6835, pp. 101\u2013110. Springer, Heidelberg (2011). https:\/\/doi.org\/10.1007\/978-3-642-23123-0_11"},{"key":"16_CR14","doi-asserted-by":"crossref","unstructured":"Gou, C., Wu, Y., Wang, F.Y., Ji, Q.: Coupled cascade regression for simultaneous facial landmark detection and head pose estimation. In: 2017 IEEE International Conference on Image Processing (ICIP), pp. 2906\u20132910. IEEE (2017)","DOI":"10.1109\/ICIP.2017.8296814"},{"key":"16_CR15","doi-asserted-by":"crossref","unstructured":"Grafsgaard, J.F., Wiggins, J.B., Vail, A.K., Boyer, K.E., Wiebe, E.N., Lester, J.C.: The additive value of multimodal features for predicting engagement, frustration, and learning during tutoring. In: Proceedings of the 16th International Conference on Multimodal Interaction, pp. 42\u201349 (2014)","DOI":"10.1145\/2663204.2663264"},{"issue":"6","key":"16_CR16","doi-asserted-by":"publisher","first-page":"787","DOI":"10.3758\/BF03206794","volume":"57","author":"JE Hoffman","year":"1995","unstructured":"Hoffman, J.E., Subramaniam, B.: The role of visual attention in saccadic eye movements. Percept. Psychophysics. 57(6), 787\u2013795 (1995)","journal-title":"Percept. Psychophysics."},{"key":"16_CR17","unstructured":"Hu, Y., Chen, L., Zhou, Y., Zhang, H.: Estimating face pose by facial asymmetry and geometry. In: Proceedings of Sixth IEEE International Conference on Automatic Face and Gesture Recognition, 2004, pp. 651\u2013656. IEEE (2004)"},{"key":"16_CR18","doi-asserted-by":"crossref","unstructured":"Hutt, S., Mills, C., Bosch, N., Krasich, K., Brockmole, J., D\u2019mello, S.: Out of the fr-eye-ing pan towards gaze-based models of attention during learning with technology in the classroom. In: Proceedings of the 25th Conference on User Modeling, Adaptation and Personalization, pp. 94\u2013103 (2017)","DOI":"10.1145\/3079628.3079669"},{"issue":"1","key":"16_CR19","doi-asserted-by":"publisher","first-page":"198","DOI":"10.1152\/jn.90815.2008","volume":"101","author":"AZ Khan","year":"2009","unstructured":"Khan, A.Z., Blohm, G., McPeek, R.M., Lefevre, P.: Differential influence of attention on gaze and head movements. J. Neurophysiol. 101(1), 198\u2013206 (2009)","journal-title":"J. Neurophysiol."},{"key":"16_CR20","doi-asserted-by":"crossref","unstructured":"Khorrami, P., Paine, T., Huang, T.: Do deep neural networks learn facial action units when doing expression recognition? In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp. 19\u201327 (2015)","DOI":"10.1109\/ICCVW.2015.12"},{"key":"16_CR21","doi-asserted-by":"crossref","unstructured":"Kumar, A., Alavi, A., Chellappa, R.: Kepler: keypoint and pose estimation of unconstrained faces by learning efficient H-CNN regressors. In: 2017 12th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2017), pp. 258\u2013265. IEEE (2017)","DOI":"10.1109\/FG.2017.149"},{"key":"16_CR22","doi-asserted-by":"crossref","unstructured":"Martins, P., Batista, J.: Accurate single view model-based head pose estimation. In: 2008 8th IEEE International Conference on Automatic Face & Gesture Recognition, pp. 1\u20136. IEEE (2008)","DOI":"10.1109\/AFGR.2008.4813369"},{"key":"16_CR23","doi-asserted-by":"crossref","unstructured":"Meng, Z., Liu, P., Cai, J., Han, S., Tong, Y.: Identity-aware convolutional neural network for facial expression recognition. In: 2017 12th IEEE International Conference on Automatic Face & Gesture Recognition (FG 2017), pp. 558\u2013565. IEEE (2017)","DOI":"10.1109\/FG.2017.140"},{"issue":"11","key":"16_CR24","doi-asserted-by":"publisher","first-page":"2094","DOI":"10.1109\/TMM.2015.2482819","volume":"17","author":"SS Mukherjee","year":"2015","unstructured":"Mukherjee, S.S., Robertson, N.M.: Deep head pose: Gaze-direction estimation in multimodal video. IEEE Trans. Multimedia. 17(11), 2094\u20132107 (2015)","journal-title":"IEEE Trans. Multimedia."},{"issue":"1","key":"16_CR25","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1109\/TPAMI.2017.2781233","volume":"41","author":"R Ranjan","year":"2017","unstructured":"Ranjan, R., Patel, V.M., Chellappa, R.: Hyperface: a deep multi-task learning framework for face detection, landmark localization, pose estimation, and gender recognition. IEEE Trans. Pattern Anal. Mach. Intell. 41(1), 121\u2013135 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"3","key":"16_CR26","doi-asserted-by":"publisher","first-page":"372","DOI":"10.1037\/0033-2909.124.3.372","volume":"124","author":"K Rayner","year":"1998","unstructured":"Rayner, K.: Eye movements in reading and information processing: 20 years of research. Psychol. Bull. 124(3), 372 (1998)","journal-title":"Psychol. Bull."},{"key":"16_CR27","doi-asserted-by":"crossref","unstructured":"Ruiz, N., Chong, E., Rehg, J.M.: Fine-grained head pose estimation without keypoints. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, pp. 2074\u20132083 (2018)","DOI":"10.1109\/CVPRW.2018.00281"},{"issue":"6","key":"16_CR28","doi-asserted-by":"publisher","first-page":"803","DOI":"10.1016\/j.imavis.2008.08.005","volume":"27","author":"C Shan","year":"2009","unstructured":"Shan, C., Gong, S., McOwan, P.W.: Facial expression recognition based on local binary patterns: A comprehensive study. Image Vis. Comput. 27(6), 803\u2013816 (2009)","journal-title":"Image Vis. Comput."},{"key":"16_CR29","doi-asserted-by":"crossref","unstructured":"Sharma, K., Alavi, H.S., Jermann, P., Dillenbourg, P.: A gaze-based learning analytics model: in-video visual feedback to improve learner\u2019s attention in MOOCs. In: Proceedings of the Sixth International Conference on Learning Analytics & Knowledge, pp. 417\u2013421 (2016)","DOI":"10.1145\/2883851.2883902"},{"issue":"1","key":"16_CR30","doi-asserted-by":"publisher","first-page":"86","DOI":"10.1109\/TAFFC.2014.2316163","volume":"5","author":"J Whitehill","year":"2014","unstructured":"Whitehill, J., Serpell, Z., Lin, Y.C., Foster, A., Movellan, J.R.: The faces of engagement: automatic recognition of student engagement from facial expressions. IEEE Trans. Affect. Comput. 5(1), 86\u201398 (2014)","journal-title":"IEEE Trans. Affect. Comput."},{"key":"16_CR31","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"471","DOI":"10.1007\/978-3-319-08786-3_42","volume-title":"User Modeling, Adaptation, and Personalization","author":"M Wixon","year":"2014","unstructured":"Wixon, M., Arroyo, I.: When the question is part of the answer: examining the impact of emotion self-reports on student emotion. In: Dimitrova, V., Kuflik, T., Chin, D., Ricci, F., Dolog, P., Houben, G.-J. (eds.) UMAP 2014. LNCS, vol. 8538, pp. 471\u2013477. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-08786-3_42"},{"issue":"3\u20134","key":"16_CR32","doi-asserted-by":"publisher","first-page":"129","DOI":"10.1504\/IJLT.2009.028804","volume":"4","author":"B Woolf","year":"2009","unstructured":"Woolf, B., Burleson, W., Arroyo, I., Dragon, T., Cooper, D., Picard, R.: Affect-aware tutors: recognising and responding to student affect. Int. J. Learn. Technol. 4(3\u20134), 129\u2013164 (2009)","journal-title":"Int. J. Learn. Technol."},{"key":"16_CR33","doi-asserted-by":"crossref","unstructured":"Yang, T.Y., Chen, Y.T., Lin, Y.Y., Chuang, Y.Y.: FSA-net: learning fine-grained structure aggregation for head pose estimation from a single image. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1087\u20131096 (2019)","DOI":"10.1109\/CVPR.2019.00118"},{"key":"16_CR34","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-3-319-09339-0_1","volume-title":"Intelligent Computing Methodologies","author":"R Zatarain-Cabada","year":"2014","unstructured":"Zatarain-Cabada, R., Barr\u00f3n-Estrada, M.L., Camacho, J.L.O., Reyes-Garc\u00eda, C.A.: Affective tutoring system for android mobiles. In: Huang, D.-S., Jo, K.-H., Wang, L. (eds.) ICIC 2014. LNCS (LNAI), vol. 8589, pp. 1\u201310. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-09339-0_1"},{"key":"16_CR35","doi-asserted-by":"crossref","unstructured":"Zhang, F., Zhang, T., Mao, Q., Xu, C.: Joint pose and expression modeling for facial expression recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3359\u20133368 (2018)","DOI":"10.1109\/CVPR.2018.00354"},{"issue":"1","key":"16_CR36","first-page":"38","volume":"41","author":"R Zhi","year":"2010","unstructured":"Zhi, R., Flierl, M., Ruan, Q., Kleijn, W.B.: Graph-preserving sparse nonnegative matrix factorization with application to facial expression recognition. IEEE Trans. Syst. Man Cybern. B Cybern. 41(1), 38\u201352 (2010)","journal-title":"IEEE Trans. Syst. Man Cybern. B Cybern."},{"key":"16_CR37","doi-asserted-by":"crossref","unstructured":"Zhong, L., Liu, Q., Yang, P., Liu, B., Huang, J., Metaxas, D.N.: Learning active facial patches for expression analysis. In: 2012 IEEE Conference on Computer Vision and Pattern Recognition, pp. 2562\u20132569. IEEE (2012)","DOI":"10.1109\/CVPR.2012.6247974"},{"key":"16_CR38","doi-asserted-by":"crossref","unstructured":"Zhu, X., Lei, Z., Liu, X., Shi, H., Li, S.Z.: Face alignment across large poses: a 3D solution. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 146\u2013155 (2016)","DOI":"10.1109\/CVPR.2016.23"},{"issue":"1","key":"16_CR39","doi-asserted-by":"publisher","first-page":"78","DOI":"10.1109\/TPAMI.2017.2778152","volume":"41","author":"X Zhu","year":"2017","unstructured":"Zhu, X., Liu, X., Lei, Z., Li, S.Z.: Face alignment in full pose range: a 3D total solution. IEEE Trans. Pattern Anal. Mach. Intell. 41(1), 78\u201392 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."}],"container-title":["Lecture Notes in Computer Science","Adaptive Instructional Systems. Adaptation Strategies and Methods"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-77873-6_16","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,2]],"date-time":"2025-07-02T22:13:20Z","timestamp":1751494400000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-77873-6_16"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030778729","9783030778736"],"references-count":39,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-77873-6_16","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"3 July 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"HCII","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Human-Computer Interaction","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24 July 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 July 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"hcii2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/2021.hci.international\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}