{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T15:47:14Z","timestamp":1762530434289,"version":"build-2065373602"},"reference-count":63,"publisher":"Springer Science and Business Media LLC","issue":"15","license":[{"start":{"date-parts":[[2025,9,30]],"date-time":"2025-09-30T00:00:00Z","timestamp":1759190400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,30]],"date-time":"2025-09-30T00:00:00Z","timestamp":1759190400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100019065","name":"Tianjin Science and Technology Planning Project","doi-asserted-by":"crossref","award":["20JCYBJC00300"],"award-info":[{"award-number":["20JCYBJC00300"]}],"id":[{"id":"10.13039\/501100019065","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["11404240, 62001328"],"award-info":[{"award-number":["11404240, 62001328"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1007\/s10489-025-06893-5","type":"journal-article","created":{"date-parts":[[2025,9,30]],"date-time":"2025-09-30T08:32:06Z","timestamp":1759221126000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Balancing act: engagement detection in online learning through master-assistant models with an enhanced hierarchical attention mechanism"],"prefix":"10.1007","volume":"55","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8326-3839","authenticated-orcid":false,"given":"Tingting","family":"Han","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ruqian","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shuwei","family":"Dou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wei","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaoming","family":"Ding","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wenxia","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jihao","family":"Lang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wenxuan","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jixing","family":"Han","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,9,30]]},"reference":[{"key":"6893_CR1","unstructured":"Means B, Toyama Y, Murphy R, Bakia M, Jones K (2009) Evaluation of evidence-based practices in online learning: A meta-analysis and review of online learning studies"},{"key":"6893_CR2","unstructured":"Onah DF, Sinclair J, Boyatt R (2014) Dropout rates of massive open online courses: behavioural patterns. EDULEARN14 proceedings, pp 5825\u20135834"},{"key":"6893_CR3","doi-asserted-by":"publisher","first-page":"593","DOI":"10.1007\/s11423-010-9177-y","volume":"59","author":"Y Lee","year":"2011","unstructured":"Lee Y, Choi J (2011) A review of online course dropout research: implications for practice and future research. Edu Technol Res Dev 59:593\u2013618","journal-title":"Edu Technol Res Dev"},{"key":"6893_CR4","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1007\/s12528-019-09241-y","volume":"32","author":"H Aldowah","year":"2020","unstructured":"Aldowah H, Al-Samarraie H, Alzahrani AI, Alalwan N (2020) Factors affecting student dropout in moocs: a cause and effect decision-making model. J Comput Higher Edu 32:429\u2013454","journal-title":"J Comput Higher Edu"},{"key":"6893_CR5","doi-asserted-by":"crossref","unstructured":"Li Y-Y, Hung Y-P (2019) Feature fusion of face and body for engagement intensity detection. In: 2019 IEEE international conference on image processing (ICIP), pp 3312\u20133316. IEEE","DOI":"10.1109\/ICIP.2019.8803488"},{"key":"6893_CR6","doi-asserted-by":"crossref","unstructured":"Chang C, Zhang C, Chen L, Liu Y (2018) An ensemble model using face and body tracking for engagement detection. In: Proceedings of the 20th ACM international conference on multimodal interaction, pp 616\u2013622","DOI":"10.1145\/3242969.3264986"},{"issue":"10","key":"6893_CR7","doi-asserted-by":"publisher","first-page":"6609","DOI":"10.1007\/s10489-020-02139-8","volume":"51","author":"J Liao","year":"2021","unstructured":"Liao J, Liang Y, Pan J (2021) Deep facial spatiotemporal network for engagement prediction in online learning. Appl Intell 51(10):6609\u20136621","journal-title":"Appl Intell"},{"issue":"3","key":"6893_CR8","first-page":"107","volume":"11","author":"X Ma","year":"2021","unstructured":"Ma X, Xu M, Dong Y, Sun Z (2021) Automatic student engagement in online learning environment based on neural turing machine. Int J Inf Edu Technol 11(3):107\u2013111","journal-title":"Int J Inf Edu Technol"},{"issue":"12","key":"6893_CR9","doi-asserted-by":"publisher","first-page":"13803","DOI":"10.1007\/s10489-022-03200-4","volume":"52","author":"NK Mehta","year":"2022","unstructured":"Mehta NK, Prasad SS, Saurav S, Saini R, Singh S (2022) Three-dimensional densenet self-attention neural network for automatic detection of student\u2019s engagement. Appl Intell 52(12):13803\u201313823","journal-title":"Appl Intell"},{"key":"6893_CR10","doi-asserted-by":"crossref","unstructured":"Copur O, Nak\u0131p M, Scardapane S, Slowack J (2022) Engagement detection with multi-task training in e-learning environments. In: International conference on image analysis and processing, pp 411\u2013422. Springer","DOI":"10.1007\/978-3-031-06433-3_35"},{"key":"6893_CR11","unstructured":"Abedi A, Khan S (2021) Affect-driven ordinal engagement measurement from video. arXiv:2106.10882"},{"issue":"1","key":"6893_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s00530-023-01244-1","volume":"30","author":"A Abedi","year":"2024","unstructured":"Abedi A, Thomas C, Jayagopi DB, Khan SS (2024) Bag of states: a non-sequential approach to video-based engagement measurement. Multimed Syst 30(1):1\u201316","journal-title":"Multimed Syst"},{"key":"6893_CR13","doi-asserted-by":"crossref","unstructured":"Coelli S, Sclocco R, Barbieri R, Reni G, Zucca C, Bianchi AM (2015) Eeg-based index for engagement level monitoring during sustained attention. In: 2015 37th Annual international conference of the ieee engineering in medicine and biology society (EMBC), pp 1512\u20131515. IEEE","DOI":"10.1109\/EMBC.2015.7318658"},{"issue":"7","key":"6893_CR14","doi-asserted-by":"publisher","first-page":"509","DOI":"10.3390\/bios12070509","volume":"12","author":"M Bustos-Lopez","year":"2022","unstructured":"Bustos-Lopez M, Cruz-Ram\u00edrez N, Guerra-Hern\u00e1ndez A, S\u00e1nchez-Morales LN, Cruz-Ramos NA, Alor-Hern\u00e1ndez G (2022) Wearables for engagement detection in learning environments: a review. Biosensors 12(7):509","journal-title":"Biosensors"},{"key":"6893_CR15","doi-asserted-by":"crossref","unstructured":"Slov\u00e1k P, Tennent P, Reeves S, Fitzpatrick G (2014) Exploring skin conductance synchronisation in everyday interactions. In: Proceedings of the 8th Nordic Conference on Human-computer Interaction: Fun, Fast, Foundational, pp 511\u2013520","DOI":"10.1145\/2639189.2639206"},{"issue":"9","key":"6893_CR16","doi-asserted-by":"publisher","first-page":"3294","DOI":"10.3390\/s22093294","volume":"22","author":"X Sol\u00e9-Beteta","year":"2022","unstructured":"Sol\u00e9-Beteta X, Navarro J, Gaj\u0161ek B, Guadagni A, Zaballos A (2022) A data-driven approach to quantify and measure students\u2019 engagement in synchronous virtual learning environments. Sensors 22(9):3294","journal-title":"Sensors"},{"issue":"1","key":"6893_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1177\/2042753019882567","volume":"17","author":"BY Rajabalee","year":"2020","unstructured":"Rajabalee BY, Santally MI, Rennie F (2020) A study of the relationship between students\u2019 engagement and their academic performances in an elearning environment. E-learning and Digital Media 17(1):1\u201320","journal-title":"E-learning and Digital Media"},{"key":"6893_CR18","unstructured":"Gupta A, D\u2019Cunha A, Awasthi K, Balasubramanian V (2016) Daisee: Towards user engagement recognition in the wild. arXiv:1609.01885"},{"key":"6893_CR19","doi-asserted-by":"crossref","unstructured":"Kaur A, Mustafa A, Mehta L, Dhall A (2018) Prediction and localization of student engagement in the wild. In: 2018 Digital image computing: techniques and applications (DICTA), pp 1\u20138. IEEE","DOI":"10.1109\/DICTA.2018.8615851"},{"key":"6893_CR20","doi-asserted-by":"publisher","first-page":"99573","DOI":"10.1109\/ACCESS.2022.3206779","volume":"10","author":"T Selim","year":"2022","unstructured":"Selim T, Elkabani I, Abdou MA (2022) Students engagement level detection in online e-learning using hybrid efficientnetb7 together with tcn, lstm, and bi-lstm. IEEE Access 10:99573\u201399583","journal-title":"IEEE Access"},{"key":"6893_CR21","doi-asserted-by":"crossref","unstructured":"Zhang H, Xiao X, Huang T, Liu S, Xia Y, Li J (2019) An novel end-to-end network for automatic student engagement recognition. In: 2019 IEEE 9th international conference on electronics information and emergency communication (ICEIEC), pp 342\u2013345. IEEE","DOI":"10.1109\/ICEIEC.2019.8784507"},{"key":"6893_CR22","doi-asserted-by":"crossref","unstructured":"Abedi A, Khan SS (2021) Improving state-of-the-art in detecting student engagement with resnet and tcn hybrid network. In: 2021 18th Conference on Robots and vision (CRV), pp 151\u2013157. IEEE","DOI":"10.1109\/CRV52889.2021.00028"},{"key":"6893_CR23","unstructured":"Malekshahi S, Kheyridoost JM, Fatemi O (2024) A general model for detecting learner engagement: Implementation and evaluation. arXiv:2405.04251"},{"key":"6893_CR24","doi-asserted-by":"crossref","unstructured":"Hafiz AM, Parah SA, Bhat RUA (2021) Attention mechanisms and deep learning for machine vision: A survey of the state of the art. arXiv:2106.07550","DOI":"10.21203\/rs.3.rs-510910\/v1"},{"key":"6893_CR25","doi-asserted-by":"crossref","unstructured":"Wang Q, Wu B, Zhu P, Li P, Zuo W, Hu Q (2020) Eca-net: Efficient channel attention for deep convolutional neural networks. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 11534\u201311542","DOI":"10.1109\/CVPR42600.2020.01155"},{"key":"6893_CR26","doi-asserted-by":"crossref","unstructured":"Woo S, Park J, Lee J-Y, Kweon IS (2018) Cbam: Convolutional block attention module. In: Proceedings of the european conference on computer vision (ECCV), pp 3\u201319","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"6893_CR27","doi-asserted-by":"publisher","first-page":"220","DOI":"10.1016\/j.eswa.2016.12.035","volume":"73","author":"G Haixiang","year":"2017","unstructured":"Haixiang G, Yijing L, Shang J, Mingyun G, Yuanyue H, Bing G (2017) Learning from class-imbalanced data: review of methods and applications. Expert Syst Appl 73:220\u2013239","journal-title":"Expert Syst Appl"},{"key":"6893_CR28","unstructured":"Hinton G, Vinyals O, Dean J (2015) Distilling the knowledge in a neural network. arXiv:1503.02531"},{"issue":"1","key":"6893_CR29","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1111\/j.0824-7935.2004.t01-1-00228.x","volume":"20","author":"A Estabrooks","year":"2004","unstructured":"Estabrooks A, Jo T, Japkowicz N (2004) A multiple resampling method for learning from imbalanced data sets. Comput Intell 20(1):18\u201336","journal-title":"Comput Intell"},{"key":"6893_CR30","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) Smote: synthetic minority over-sampling technique. J Artif Intell Res 16:321\u2013357","journal-title":"J Artif Intell Res"},{"key":"6893_CR31","doi-asserted-by":"crossref","unstructured":"Tahir M.A, Kittler J, Mikolajczyk K, Yan F (2009) A multiple expert approach to the class imbalance problem using inverse random under sampling. In: Multiple classifier systems: 8th international workshop, MCS 2009, Reykjavik, Iceland, June 10-12, 2009. Proceedings 8, pp 82\u201391. Springer","DOI":"10.1007\/978-3-642-02326-2_9"},{"key":"6893_CR32","unstructured":"Guyon I, Elisseeff A (2003) An introduction to variable and feature selection. J Mach Learn Res 3(Mar):1157\u20131182"},{"issue":"12","key":"6893_CR33","doi-asserted-by":"publisher","first-page":"3358","DOI":"10.1016\/j.patcog.2007.04.009","volume":"40","author":"Y Sun","year":"2007","unstructured":"Sun Y, Kamel MS, Wong AK, Wang Y (2007) Cost-sensitive boosting for classification of imbalanced data. Pattern Recogn 40(12):3358\u20133378","journal-title":"Pattern Recogn"},{"key":"6893_CR34","doi-asserted-by":"crossref","unstructured":"Sarfraz F, Arani E, Zonooz B (2021) Knowledge distillation beyond model compression. In: 2020 25th International conference on pattern recognition (ICPR), pp 6136\u20136143. IEEE","DOI":"10.1109\/ICPR48806.2021.9413016"},{"key":"6893_CR35","doi-asserted-by":"crossref","unstructured":"Xing X, Hou Y, Li H, Yuan Y, Li H, Meng MQ-H (2021) Categorical relation-preserving contrastive knowledge distillation for medical image classification. In: Medical Image Computing and Computer Assisted Intervention\u2013MICCAI 2021: 24th International Conference, Strasbourg, France, September 27\u2013October 1, 2021, Proceedings, Part V 24, pp 163\u2013173. Springer","DOI":"10.1007\/978-3-030-87240-3_16"},{"key":"6893_CR36","doi-asserted-by":"publisher","unstructured":"Xiao Z, Tong H (2025) Federated contrastive learning with feature-based distillation for human activity recognition. IEEE Transactions on Computational Social Systems, pp 1\u201314. https:\/\/doi.org\/10.1109\/TCSS.2024.3510428","DOI":"10.1109\/TCSS.2024.3510428"},{"issue":"8","key":"6893_CR37","doi-asserted-by":"publisher","first-page":"4101","DOI":"10.1109\/TAI.2024.3360180","volume":"5","author":"Z Xiao","year":"2024","unstructured":"Xiao Z, Xing H, Qu R, Li H, Feng L, Zhao B, Yang J (2024) Self-bidirectional decoupled distillation for time series classification. IEEE Trans Artif Intell 5(8):4101\u20134110. https:\/\/doi.org\/10.1109\/TAI.2024.3360180","journal-title":"IEEE Trans Artif Intell"},{"issue":"3","key":"6893_CR38","doi-asserted-by":"publisher","first-page":"3735","DOI":"10.1007\/s13369-023-08159-z","volume":"49","author":"A Abed","year":"2024","unstructured":"Abed A, Akrout B, Amous I (2024) Convolutional neural network for head segmentation and counting in crowded retail environment using top-view depth images. Arab J Sci Eng 49(3):3735\u20133749","journal-title":"Arab J Sci Eng"},{"key":"6893_CR39","doi-asserted-by":"crossref","unstructured":"Baltru\u0161aitis T, Robinson P, Morency L-P (2016) Openface: an open source facial behavior analysis toolkit. In: 2016 IEEE Winter conference on applications of computer vision (WACV), pp 1\u201310. IEEE","DOI":"10.1109\/WACV.2016.7477553"},{"key":"6893_CR40","doi-asserted-by":"crossref","unstructured":"Cao Z, Simon T, Wei S-E, Sheikh Y (2017) Realtime multi-person 2d pose estimation using part affinity fields. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 7291\u20137299","DOI":"10.1109\/CVPR.2017.143"},{"key":"6893_CR41","doi-asserted-by":"publisher","unstructured":"Abed A, Akrout B, Amous I (2022) Shoppers interaction classification based on an improved densenet model using rgb-d data. In: 2022 8th International conference on systems and informatics (ICSAI), pp 1\u20136. https:\/\/doi.org\/10.1109\/ICSAI57119.2022.10005508","DOI":"10.1109\/ICSAI57119.2022.10005508"},{"issue":"7","key":"6893_CR42","doi-asserted-by":"publisher","first-page":"2786","DOI":"10.1109\/TIP.2013.2258353","volume":"22","author":"M Mueller","year":"2013","unstructured":"Mueller M, Karasev P, Kolesov I, Tannenbaum A (2013) Optical flow estimation for flame detection in videos. IEEE Trans Image Process 22(7):2786\u20132797","journal-title":"IEEE Trans Image Process"},{"key":"6893_CR43","doi-asserted-by":"crossref","unstructured":"Sun S, Kuang Z, Sheng L, Ouyang W, Zhang W (2018) Optical flow guided feature: A fast and robust motion representation for video action recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1390\u20131399","DOI":"10.1109\/CVPR.2018.00151"},{"key":"6893_CR44","doi-asserted-by":"crossref","unstructured":"Ramadass A, Suk M, Prabhakaran B (2010) Feature extraction method for video based human action recognitions: extended optical flow algorithm. In: 2010 IEEE international conference on acoustics, speech and signal processing, pp 1106\u20131109. IEEE","DOI":"10.1109\/ICASSP.2010.5495352"},{"issue":"31","key":"6893_CR45","doi-asserted-by":"publisher","first-page":"19365","DOI":"10.1007\/s00521-024-10239-6","volume":"36","author":"A Abed","year":"2024","unstructured":"Abed A, Akrout B, Amous I (2024) Deep learning-based few-shot person re-identification from top-view rgb and depth images. Neural Comput Appl 36(31):19365\u201319382","journal-title":"Neural Comput Appl"},{"key":"6893_CR46","doi-asserted-by":"crossref","unstructured":"Tan C, Gao Z, Wu L, Xu Y, Xia J, Li S, Li SZ (2023) Temporal attention unit: Towards efficient spatiotemporal predictive learning. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 18770\u201318782","DOI":"10.1109\/CVPR52729.2023.01800"},{"key":"6893_CR47","first-page":"1755","volume":"10","author":"DE King","year":"2009","unstructured":"King DE (2009) Dlib-ml: a machine learning toolkit. J Mach Learn Res 10:1755\u20131758","journal-title":"J Mach Learn Res"},{"key":"6893_CR48","doi-asserted-by":"crossref","unstructured":"Wei S-E, Ramakrishna V, Kanade T, Sheikh Y (2016) Convolutional pose machines. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4724\u20134732","DOI":"10.1109\/CVPR.2016.511"},{"key":"6893_CR49","doi-asserted-by":"crossref","unstructured":"Simon T, Joo H, Matthews I, Sheikh Y (2017) Hand keypoint detection in single images using multiview bootstrapping. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 1145\u20131153","DOI":"10.1109\/CVPR.2017.494"},{"key":"6893_CR50","doi-asserted-by":"crossref","unstructured":"Cao Z, Simon T, Wei S-E, Sheikh Y (2017) Realtime multi-person 2d pose estimation using part affinity fields. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 7291\u20137299","DOI":"10.1109\/CVPR.2017.143"},{"key":"6893_CR51","doi-asserted-by":"crossref","unstructured":"Chen Q, Ge T, Xu Y, Zhang Z, Yang X, Gai K (2018) Semantic human matting. In: Proceedings of the 26th ACM international conference on multimedia, pp 618\u2013626","DOI":"10.1145\/3240508.3240610"},{"issue":"1\u20133","key":"6893_CR52","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1016\/0004-3702(81)90024-2","volume":"17","author":"BK Horn","year":"1981","unstructured":"Horn BK, Schunck BG (1981) Determining optical flow. Artif Intell 17(1\u20133):185\u2013203","journal-title":"Artif Intell"},{"key":"6893_CR53","doi-asserted-by":"publisher","first-page":"117007","DOI":"10.1016\/j.image.2023.117007","volume":"117","author":"X Liao","year":"2023","unstructured":"Liao X, Cai Z, Chen J, Liu T, Lai J (2023) Physics-based optical flow estimation under varying illumination conditions. Signal Process Image Commun 117:117007","journal-title":"Signal Process Image Commun"},{"key":"6893_CR54","doi-asserted-by":"crossref","unstructured":"Hui T-W, Tang X, Loy CC (2018) Liteflownet: A lightweight convolutional neural network for optical flow estimation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 8981\u20138989","DOI":"10.1109\/CVPR.2018.00936"},{"issue":"8","key":"6893_CR55","doi-asserted-by":"publisher","first-page":"2555","DOI":"10.1109\/TPAMI.2020.2976928","volume":"43","author":"T-W Hui","year":"2020","unstructured":"Hui T-W, Tang X, Loy CC (2020) A lightweight optical flow cnn\u2014revisiting data fidelity and regularization. IEEE Trans Pattern Anal Mach Intell 43(8):2555\u20132569","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"6893_CR56","doi-asserted-by":"crossref","unstructured":"Hui T-W, Loy CC (2020) Liteflownet3: Resolving correspondence ambiguity for more accurate optical flow estimation. In: Computer vision\u2013ECCV 2020: 16th european conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XX 16, pp 169\u2013184. Springer","DOI":"10.1007\/978-3-030-58565-5_11"},{"key":"6893_CR57","doi-asserted-by":"crossref","unstructured":"Hara K, Kataoka H, Satoh Y (2017) Learning spatio-temporal features with 3d residual networks for action recognition. In: Proceedings of the IEEE international conference on computer vision workshops, pp 3154\u20133160","DOI":"10.1109\/ICCVW.2017.373"},{"key":"6893_CR58","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Goyal P, Girshick R, He K, Doll\u00e1r P (2017) Focal loss for dense object detection. In: Proceedings of the IEEE international conference on computer vision, pp 2980\u20132988","DOI":"10.1109\/ICCV.2017.324"},{"key":"6893_CR59","doi-asserted-by":"crossref","unstructured":"Cui Y, Jia M, Lin T-Y, Song Y, Belongie S (2019) Class-balanced loss based on effective number of samples. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 9268\u20139277","DOI":"10.1109\/CVPR.2019.00949"},{"key":"6893_CR60","doi-asserted-by":"crossref","unstructured":"Saurav S, Saini R, Singh S (2022) A dual-stream fused neural network for fall detection in multi-camera and 360$$\\circ$$ videos. Neural Comput Appl 34(2):1455\u20131482","DOI":"10.1007\/s00521-021-06495-5"},{"key":"6893_CR61","unstructured":"Grandini M, Bagli E, Visani G (2020) Metrics for multi-class classification: an overview. arXiv:2008.05756"},{"key":"6893_CR62","doi-asserted-by":"crossref","unstructured":"Lyons M, Akamatsu S, Kamachi M, Gyoba J (1998) Coding facial expressions with gabor wavelets. In: Proceedings third IEEE international conference on automatic face and gesture recognition, pp 200\u2013205. IEEE","DOI":"10.1109\/AFGR.1998.670949"},{"issue":"8","key":"6893_CR63","doi-asserted-by":"publisher","first-page":"1377","DOI":"10.1080\/02699930903485076","volume":"24","author":"O Langner","year":"2010","unstructured":"Langner O, Dotsch R, Bijlstra G, Wigboldus DH, Hawk ST, Van Knippenberg A (2010) Presentation and validation of the radboud faces database. Cogn Emotion 24(8):1377\u20131388","journal-title":"Cogn Emotion"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-025-06893-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-025-06893-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-025-06893-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T15:41:55Z","timestamp":1762530115000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-025-06893-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,30]]},"references-count":63,"journal-issue":{"issue":"15","published-print":{"date-parts":[[2025,10]]}},"alternative-id":["6893"],"URL":"https:\/\/doi.org\/10.1007\/s10489-025-06893-5","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"type":"print","value":"0924-669X"},{"type":"electronic","value":"1573-7497"}],"subject":[],"published":{"date-parts":[[2025,9,30]]},"assertion":[{"value":"5 July 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 September 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 September 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no relevant, financial or non-financial interests to disclose.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interests"}},{"value":"The datasets used in this study (DAiSEE, EmotiW-EP, JAFFE, and RaFD) are publicly available and were obtained from previously published studies.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical and informed consent for data used"}}],"article-number":"992"}}