{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,14]],"date-time":"2026-05-14T00:04:39Z","timestamp":1778717079205,"version":"3.51.4"},"reference-count":119,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T00:00:00Z","timestamp":1769558400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T00:00:00Z","timestamp":1775174400000},"content-version":"vor","delay-in-days":65,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62307025"],"award-info":[{"award-number":["62307025"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62477026"],"award-info":[{"award-number":["62477026"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62407022"],"award-info":[{"award-number":["62407022"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J. King Saud Univ. Comput. Inf. Sci."],"published-print":{"date-parts":[[2026,4]]},"DOI":"10.1007\/s44443-026-00489-w","type":"journal-article","created":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T05:20:04Z","timestamp":1769577604000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Intelligent recognition and analysis of student behavior in real-classroom scenarios: a comprehensive survey, exploration, and future perspectives"],"prefix":"10.1007","volume":"38","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7067-6108","authenticated-orcid":false,"given":"Wanru","family":"Song","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tong","family":"He","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haopeng","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zheng","family":"Shi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Huaruo","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chenyu","family":"Shangguan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chuanyan","family":"Hao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,1,28]]},"reference":[{"key":"489_CR1","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1109\/TLT.2023.3314610","volume":"17","author":"K Ahmad","year":"2024","unstructured":"Ahmad K, Iqbal W, El-Hassan A, Qadir J, Benhaddou D, Ayyash M, Al-Fuqaha A (2024) Data-driven artificial intelligence in education: A comprehensive review. IEEE Trans Learn Technol 17:12\u201331","journal-title":"IEEE Trans Learn Technol"},{"key":"489_CR2","doi-asserted-by":"publisher","first-page":"102601","DOI":"10.1016\/j.lindif.2024.102601","volume":"118","author":"A Bewersdorff","year":"2025","unstructured":"Bewersdorff A, Hartmann C, Hornberger M, Se\u00dfler K, Bannert M, Kasneci E, Kasneci G, Zhai X, Nerdel C (2025) Taking the next step with generative artificial intelligence: The transformative role of multimodal large language models in science education. Learn Ind Diff 118:102601","journal-title":"Learn Ind Diff"},{"key":"489_CR3","unstructured":"Bochkovskiy A, Wang C, Liao HM (2020) Yolov4: Optimal speed and accuracy of object detection. arXiv:2004.10934"},{"key":"489_CR4","doi-asserted-by":"crossref","unstructured":"Cai Z, Vasconcelos N (2018) Cascade r-cnn: Delving into high quality object detection. In: CVPR","DOI":"10.1109\/CVPR.2018.00644"},{"issue":"5","key":"489_CR5","first-page":"104","volume":"15","author":"Y Cao","year":"2024","unstructured":"Cao Y, Liu D (2024) Optimization of student behavior detection algorithm based on improved ssd algorithm. Int J Adv Comput Sci Appl 15(5):104\u2013114","journal-title":"Int J Adv Comput Sci Appl"},{"key":"489_CR6","doi-asserted-by":"crossref","unstructured":"Cao Y, Cao Q, Qian C, Chen D (2025) Yolo-amm: A real-time classroom behavior detection algorithm based on multi-dimensional feature optimization. Sensors 25(4)","DOI":"10.3390\/s25041142"},{"key":"489_CR7","unstructured":"Cao Z, Hidalgo G, Simon T, Wei S-E, Sheikh Y (2019) OpenPose: realtime multi-person 2D pose estimation using part affinity fields"},{"key":"489_CR8","doi-asserted-by":"crossref","unstructured":"Carion N, Massa F, Synnaeve G, Usunier N, Kirillov A, Zagoruyko S (2020) End-to-end object detection with transformers. In: Computer vision \u2013 ECCV 2020, Cham, pp 213\u2013229","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"489_CR9","doi-asserted-by":"crossref","unstructured":"Chai X, Yang J, Liu Y (2024) Influential factors for medical students\u2019 classroom concentration\u2014evaluation with speech recognition and face recognition technology. BMC Med Educ 14(1236)","DOI":"10.21203\/rs.3.rs-4600797\/v1"},{"issue":"21","key":"489_CR10","doi-asserted-by":"publisher","first-page":"25310","DOI":"10.1007\/s10489-023-04858-0","volume":"53","author":"Z Chen","year":"2023","unstructured":"Chen Z, Liang M, Xue Z, Yu W (2023) Stran: Student expression recognition based on spatio-temporal residual attention network in classroom teaching videos. Appl Intell 53(21):25310\u201325329","journal-title":"Appl Intell"},{"issue":"11","key":"489_CR11","first-page":"13467","volume":"45","author":"G Cheng","year":"2023","unstructured":"Cheng G, Yuan X, Yao X, Yan K, Zeng Q, Xie X, Han J (2023) Towards large-scale small object detection: Survey and benchmarks. IEEE Trans Pattern Anal Mach Intell 45(11):13467\u201313488","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"489_CR12","doi-asserted-by":"crossref","unstructured":"Chen L, Gu L, Zheng D, Fu Y (2024) Frequency-adaptive dilated convolution for semantic segmentation. In: 2024 IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 3414\u20133425","DOI":"10.1109\/CVPR52733.2024.00328"},{"key":"489_CR13","doi-asserted-by":"crossref","unstructured":"Chen G, Ji J, Huang C (2022) Student classroom behavior recognition based on openpose and deep learning. In: 2022 7th International conference on intelligent computing and signal processing (ICSP), pp 576\u2013579","DOI":"10.1109\/ICSP54964.2022.9778501"},{"key":"489_CR14","doi-asserted-by":"crossref","unstructured":"Chen J, Kao S-h, He H, Zhuo W, Wen S, Lee C-H (2023) Run, don\u2019t walk: Chasing higher flops for faster neural networks. In: 2023 IEEE\/CVF conference on computer vision and pattern recognition (CVPR)","DOI":"10.1109\/CVPR52729.2023.01157"},{"key":"489_CR15","doi-asserted-by":"crossref","unstructured":"Chen Z, Liang M, Yu W, Huang Y, Wang X (2021) Intelligent teaching evaluation system integrating facial expression and behavior recognition in teaching video. In: 2021 IEEE international conference on big data and smart computing (BIGCOMP 2021), pp 52\u201359","DOI":"10.1109\/BigComp51126.2021.00019"},{"key":"489_CR16","doi-asserted-by":"crossref","unstructured":"Chen Z, Zhang Y, Gu J, Zhang Y, Kong L, Yuan X (2022) Cross aggregation transformer for image restoration. In: Advances in neural information processing systems, vol 35","DOI":"10.52202\/068431-1847"},{"key":"489_CR17","doi-asserted-by":"crossref","unstructured":"Crompton H, Burke D (2023) Artificial intelligence in higher education: the state of the field. Int J Educ Technol Higher Educ 20(22)","DOI":"10.1186\/s41239-023-00392-8"},{"key":"489_CR18","doi-asserted-by":"publisher","first-page":"168106","DOI":"10.1109\/ACCESS.2024.3473990","volume":"12","author":"K Cui","year":"2024","unstructured":"Cui K, Huang M, Lv W, Liu S, Zhou W, You Q (2024) Research on intelligent recognition algorithm of college students\u2019 classroom behavior based on improved single shot multibox detector. IEEE Access 12:168106\u2013168119","journal-title":"IEEE Access"},{"issue":"2","key":"489_CR19","first-page":"533","volume":"19","author":"J Dai","year":"2025","unstructured":"Dai J, Xie A, Yu D (2025) Classroom behavior recognition through joint improvement of faster rcnn algorithm under the construction of smart education. KSII Trans Int Inf Syst 19(2):533\u2013554","journal-title":"KSII Trans Int Inf Syst"},{"key":"489_CR20","doi-asserted-by":"publisher","first-page":"4935","DOI":"10.1007\/s10489-024-05409-x","volume":"54","author":"M Dang","year":"2024","unstructured":"Dang M, Liu G, Li H et al (2024) Multi-object behaviour recognition based on object detection cascaded image classification in classroom scenes. Appl Intell 54:4935\u20134951","journal-title":"Appl Intell"},{"key":"489_CR21","doi-asserted-by":"crossref","unstructured":"Dang M, Liu G, Li X, Wan B, Zhang Y, Pan R (2025) Object detector based on center keypoints for behavior recognition in classroom scenes. IEEE Trans Comput Soc Syst 1\u201313","DOI":"10.1109\/TCSS.2025.3552067"},{"key":"489_CR22","doi-asserted-by":"crossref","unstructured":"Dong C, Liu J, Xie S (2025) Dmsa-net: a deformable multiscale adaptive classroom behavior recognition network. PeerJ Comput Sci","DOI":"10.7717\/peerj-cs.2876"},{"key":"489_CR23","doi-asserted-by":"crossref","unstructured":"Duan H, Zhao Y, Chen K, Lin D, Dai B (2022) Revisiting skeleton-based action recognition. In: 2022 IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 2959\u20132968","DOI":"10.1109\/CVPR52688.2022.00298"},{"key":"489_CR24","unstructured":"El-Nouby A, Touvron H, Caron M, Bojanowski P, Douze M, Joulin A, Laptev I, Neverova N, Synnaeve G, Verbeek J, J\u00e9gou H (2021) Xcit: Cross-covariance image transformers"},{"issue":"2","key":"489_CR25","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham M, Van Gool L, Williams CKI, Winn J, Zisserman A (2010) The pascal visual object classes (voc) challenge. Int J Comput Vis 88(2):303\u2013338","journal-title":"Int J Comput Vis"},{"key":"489_CR26","doi-asserted-by":"crossref","unstructured":"Faure GJ, Chen M-H, Lai S-H (2023) Holistic interaction transformer network for action detection. In: 2023 IEEE\/CVF winter conference on applications of computer vision (WACV), pp 3329\u20133339","DOI":"10.1109\/WACV56688.2023.00334"},{"key":"489_CR27","doi-asserted-by":"publisher","first-page":"7457","DOI":"10.1007\/s10639-024-13085-0","volume":"30","author":"C Feng","year":"2025","unstructured":"Feng C, Liu J, Wang J et al (2025) Bisap: A student academic performance prediction model based on the fusion of classroom behavior images and educational information. Educ Inf Technol 30:7457\u20137483","journal-title":"Educ Inf Technol"},{"key":"489_CR28","volume-title":"Analyzing Teaching Behavior","author":"NA Flanders","year":"1970","unstructured":"Flanders NA (1970) Analyzing Teaching Behavior. Addison-Wesley Publishing Company, MA"},{"key":"489_CR29","doi-asserted-by":"crossref","unstructured":"Fu R, Wu T, Luo Z, Duan F, Qiao X, Guo P (2019) Learning behavior analysis in classroom based on deep learning. In: 2019 Tenth international conference on intelligent control and information processing (ICICIP), pp 206\u2013212","DOI":"10.1109\/ICICIP47338.2019.9012177"},{"issue":"1","key":"489_CR30","doi-asserted-by":"publisher","first-page":"142","DOI":"10.1109\/TPAMI.2015.2437384","volume":"38","author":"R Girshick","year":"2016","unstructured":"Girshick R, Donahue J, Darrell T, Malik J (2016) Region-based convolutional networks for accurate object detection and segmentation. IEEE Trans Pattern Anal Mach Intell 38(1):142\u2013158","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"489_CR31","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1007\/s10648-019-09514-z","volume":"33","author":"P Goldberg","year":"2021","unstructured":"Goldberg P, Suemer O, Stuermer K, Wagner W, Goellner R, Gerjets P, Kasneci E, Trautwein U (2021) Attentive or not? toward a machine learning approach to assessing students\u2019 visible engagement in classroom instruction. Educ Psychol Rev 33:27\u201349","journal-title":"Educ Psychol Rev"},{"issue":"6","key":"489_CR32","doi-asserted-by":"publisher","first-page":"16525","DOI":"10.1007\/s11042-023-16115-0","volume":"83","author":"M Gu","year":"2024","unstructured":"Gu M, Feng J, Chu Y (2024) A novel multi-scale facial expression recognition algorithm based on improved res2net for classroom scenes. Multimed Tools Appl 83(6):16525\u201316542","journal-title":"Multimed Tools Appl"},{"key":"489_CR33","unstructured":"Gu A, Dao T (2024) Mamba: linear-time sequence modeling with selective state spaces. arxiv:2312.00752"},{"key":"489_CR34","unstructured":"Han K, Wang Y, Guo J, Tang Y, Wu E (2022) Vision gnn: An image is worth graph of nodes. In: Advances in neural information processing systems, vol 35"},{"key":"489_CR35","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2015) Spatial pyramid pooling in deep convolutional networks for visual recognition. IEEE Trans Pattern Anal Mach Intell 37(9)","DOI":"10.1109\/TPAMI.2015.2389824"},{"key":"489_CR36","unstructured":"Howard AG, Zhu M, Chen B, Kalenichenko D, Wang W, Weyand T, Andreetto M, Adam H (2017) MobileNets: efficient convolutional neural networks for mobile vision applications"},{"key":"489_CR37","first-page":"1","volume":"63","author":"L Hu","year":"2025","unstructured":"Hu L, Yuan J, Cheng B, Xu Q (2025) Csfpr-rtdetr: Real-time small object detection network for uav images based on cross-spatial-frequency domain and position relation. IEEE Trans Geosci Remote Sens 63:1\u201319","journal-title":"IEEE Trans Geosci Remote Sens"},{"key":"489_CR38","doi-asserted-by":"crossref","unstructured":"Huang L, Yu X, Yan H, Huang L, An Z, Xu Y (2025) Af-yolo: Asymptotic feature extraction and fusion for aerial object detection. IEEE Trans Circ Syst Video Technol 1\u20131","DOI":"10.1109\/TCSVT.2025.3595740"},{"key":"489_CR39","doi-asserted-by":"publisher","first-page":"6321","DOI":"10.1007\/s10462-022-10155-y","volume":"55","author":"P Jiao","year":"2022","unstructured":"Jiao P, Ouyang F, Zhang Q et al (2022) Artificial intelligence-enabled prediction model of student academic performance in online engineering education. Artif Intell Rev 55:6321\u20136344","journal-title":"Artif Intell Rev"},{"issue":"1","key":"489_CR40","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1007\/s13563-024-00472-9","volume":"38","author":"B Jin","year":"2025","unstructured":"Jin B, Xu X (2025) Forecasts of coking coal futures price indices through gaussian process regressions. Mineral Econ 38(1):203\u2013217","journal-title":"Mineral Econ"},{"issue":"3","key":"489_CR41","doi-asserted-by":"publisher","first-page":"595","DOI":"10.1108\/FS-01-2023-0016","volume":"27","author":"B Jin","year":"2025","unstructured":"Jin B, Xu X, Zhang Y (2025) Peanut oil price change forecasts through the neural network. Foresight 27(3):595\u2013612","journal-title":"Foresight"},{"key":"489_CR42","doi-asserted-by":"crossref","unstructured":"Jin B, Xu X (2025) A study of contemporaneous residential real estate price causation across major jiangsu province cities: Methodology using vector error-correction models and directed acyclic graphs. Econ Open 2550008","DOI":"10.1142\/S308284142550008X"},{"key":"489_CR43","doi-asserted-by":"crossref","unstructured":"Jin B, Xu X (2025) China commodity price index (ccpi) forecasting via the neural network. Int J Financial Eng 1\u201327","DOI":"10.1142\/S2424786325500033"},{"key":"489_CR44","doi-asserted-by":"publisher","first-page":"388","DOI":"10.3389\/fnhum.2017.00388","volume":"11","author":"L-W Ko","year":"2017","unstructured":"Ko L-W, Komarov O, Hairston WD, Jung T-P, Lin C-T (2017) Sustained attention in real classroom settings: An EEG study. Front Human Neurosci 11:388","journal-title":"Front Human Neurosci"},{"key":"489_CR45","doi-asserted-by":"publisher","first-page":"143050","DOI":"10.1109\/ACCESS.2023.3340510","volume":"11","author":"L Li","year":"2023","unstructured":"Li L, Yao D (2023) Emotion recognition in complex classroom scenes based on improved convolutional block attention module algorithm. IEEE Access 11:143050\u2013143059","journal-title":"IEEE Access"},{"key":"489_CR46","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Doll\u00e1r P, Girshick R, He K, Hariharan B, Belongie S (2017) Feature pyramid networks for object detection. In: 2017 IEEE conference on computer vision and pattern recognition (CVPR), pp 936\u2013944","DOI":"10.1109\/CVPR.2017.106"},{"key":"489_CR47","doi-asserted-by":"crossref","unstructured":"Lin F, Ngo H, Dow C, Lam K, Le H (2021) Student behavior recognition system for the classroom environment based on skeleton pose estimation and person detection. Sensors 21(16)","DOI":"10.3390\/s21165314"},{"key":"489_CR48","doi-asserted-by":"crossref","unstructured":"Lin L, Yang H, Xu Q, Xue Y, Li D (2024) Research on student classroom behavior detection based on the real-time detection transformer algorithm. Appl Sci 14","DOI":"10.3390\/app14146153"},{"key":"489_CR49","doi-asserted-by":"crossref","unstructured":"Li Y, Qi X, Saudagar AKJ, Badshah AM, Muhammad K, Liu S (2023) Student behavior recognition for interaction detection in the classroom environment. Image Vis Comput 136","DOI":"10.1016\/j.imavis.2023.104726"},{"key":"489_CR50","doi-asserted-by":"publisher","first-page":"36391","DOI":"10.1109\/ACCESS.2024.3373536","volume":"12","author":"Q Liu","year":"2024","unstructured":"Liu Q, Jiang R, Xu Q, Wang D, Sang Z, Jiang X, Wu L (2024) Yolov8n-bt: Research on classroom learning behavior recognition algorithm based on improved yolov8n. IEEE Access 12:36391\u201336403","journal-title":"IEEE Access"},{"key":"489_CR51","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu C-Y, Berg AC (2016) Ssd: Single shot multibox detector. In: Computer Vision - ECCV 2016, pp 21\u201337","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"489_CR52","doi-asserted-by":"crossref","unstructured":"Liu Q, Jiang X, Jiang R (2025) Classroom behavior recognition using computer vision: A systematic review. Sensors 25(2)","DOI":"10.3390\/s25020373"},{"key":"489_CR53","unstructured":"Li S, Wang Z, Liu Z, Tan C, Lin H, Wu D, Chen Z, Zheng J, Li SZ (2024) Moganet: Multi-order gated aggregation network. In: 12th International conference on learning representations, ICLR 2024"},{"key":"489_CR54","doi-asserted-by":"crossref","unstructured":"Li J, Wen Y, He L (2023) Scconv: Spatial and channel reconstruction convolution for feature redundancy. In: 2023 IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 6153\u20136162","DOI":"10.1109\/CVPR52729.2023.00596"},{"key":"489_CR55","doi-asserted-by":"crossref","unstructured":"Li M, Zhuang X, Bai L, Ding W (2024) Multimodal graph learning based on 3d haar semi-tight framelet for student engagement prediction. Inf Fusion 105","DOI":"10.1016\/j.inffus.2024.102224"},{"key":"489_CR56","doi-asserted-by":"publisher","first-page":"129965","DOI":"10.1016\/j.neucom.2025.129965","volume":"635","author":"W Lu","year":"2025","unstructured":"Lu W, Liu S, Ding B, Chen P, Lu F (2025) Student behavior detection model based on multilevel residual networks and hybrid attention mechanisms. Neurocomputing 635:129965","journal-title":"Neurocomputing"},{"key":"489_CR57","first-page":"1","volume":"74","author":"W Lu","year":"2025","unstructured":"Lu W, Liu X, Peng Y, Kyrarini M, An K, Cheng Y (2025) Pacr-detr: A real-time end-to-end object detector for behavior recognition in various classroom scenarios. IEEE Trans Instrum Meas 74:1\u201320","journal-title":"IEEE Trans Instrum Meas"},{"key":"489_CR58","doi-asserted-by":"publisher","first-page":"105453","DOI":"10.1016\/j.compedu.2025.105453","volume":"240","author":"X Ma","year":"2026","unstructured":"Ma X, Li C, Xu J, Zhu S, Li Y (2026) Exploring characteristics of primary school students\u2019 self-regulated learning (srl) behaviors in human-genai collaborative programming learning environments: Insights from a proposed framework. Comput Educ 240:105453","journal-title":"Comput Educ"},{"key":"489_CR59","doi-asserted-by":"crossref","unstructured":"Ma X, Dai X, Bai Y, Wang Y, Fu Y (2024) Rewrite the stars. In: 2024 IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 5694\u20135703","DOI":"10.1109\/CVPR52733.2024.00544"},{"key":"489_CR60","doi-asserted-by":"crossref","unstructured":"Ma L, Zhou T, Yu B, Li Z, Fang R, Liu X (2024) Improving yolov7 for large target classroom behavior recognition of teachers in smart classroom scenarios. Electronics 13(18)","DOI":"10.3390\/electronics13183726"},{"issue":"4","key":"489_CR61","doi-asserted-by":"publisher","first-page":"388","DOI":"10.1001\/jama.2017.19163","volume":"319","author":"MDF McInnes","year":"2018","unstructured":"McInnes MDF, Moher D, Thombs BD, McGrath TA, Bossuyt PM (2018) PRISMA-DTA Group: Preferred reporting items for a systematic review and meta-analysis of diagnostic test accuracy studies: The prisma-dta statement. JAMA 319(4):388\u2013396","journal-title":"JAMA"},{"issue":"12","key":"489_CR62","doi-asserted-by":"publisher","first-page":"36975","DOI":"10.1007\/s11042-023-16388-5","volume":"83","author":"C Pabba","year":"2024","unstructured":"Pabba C, Bhardwaj V, Kumar P (2024) A visual intelligent system for students\u2019 behavior classification using body pose and facial features in a smart classroom. Multimed Tools Appl 83(12):36975\u201337005","journal-title":"Multimed Tools Appl"},{"key":"489_CR63","doi-asserted-by":"crossref","unstructured":"Pan J, Bulat A, Tan F, Zhu X, Dudziak L, Li H, Tzimiropoulos G, Martinez B (2022) Edgevits: competing light-weight cnns on mobile devices with vision transformers. In: Computer vision \u2013 ECCV 2022, pp 294\u2013311","DOI":"10.1007\/978-3-031-20083-0_18"},{"key":"489_CR64","doi-asserted-by":"crossref","unstructured":"Pandya D, Rana K, Padhiyar A (2025) Comparative analysis of deep learning approach to identify usage of mobile phone in the classroom environment. Educ Inf Technol","DOI":"10.1007\/s10639-025-13351-9"},{"key":"489_CR65","doi-asserted-by":"publisher","first-page":"100174","DOI":"10.1016\/j.caeai.2023.100174","volume":"5","author":"S Pang","year":"2023","unstructured":"Pang S, Lai S, Zhang A, Yang Y, Sun D (2023) Graph convolutional network for automatic detection of teachers\u2019 nonverbal behavior. Comput Educ Artif Intell 5:100174","journal-title":"Comput Educ Artif Intell"},{"issue":"6","key":"489_CR66","doi-asserted-by":"publisher","first-page":"557","DOI":"10.18280\/ts.360611","volume":"36","author":"J Pei","year":"2019","unstructured":"Pei J, Shan P (2019) A micro-expression recognition algorithm for students in classroom learning based on convolutional neural network. Traitement du Signal 36(6):557\u2013563","journal-title":"Traitement du Signal"},{"key":"489_CR67","doi-asserted-by":"crossref","unstructured":"Peng S, Zhang X, Zhou L, Wang P (2025)Yolo-cbd: Classroom behavior detection method based on behavior feature extraction and aggregation. Sensors 25(10)","DOI":"10.3390\/s25103073"},{"key":"489_CR68","doi-asserted-by":"crossref","unstructured":"Qi F, Gao Y, Wang M, Jiang T, Li Z (2024) Data mining of online teaching evaluation based on deep learning. Mathematics 12(17)","DOI":"10.3390\/math12172692"},{"key":"489_CR69","doi-asserted-by":"crossref","unstructured":"Qin Y, Liao Y, Wang Z (2024) Improved yolov8 algorithm for classroom student behavior detection. In: 2024 IEEE 6th advanced information management, communicates, electronic and automation control conference (IMCEC), vol 6, pp 757\u2013761","DOI":"10.1109\/IMCEC59810.2024.10575569"},{"key":"489_CR70","unstructured":"Radford A, Kim JW, Hallacy C et al (2021) Learning transferable visual models from natural language supervision. In: International conference on machine learning"},{"key":"489_CR71","doi-asserted-by":"crossref","unstructured":"Ramadevi Y, Krishna JA, Rafay A (2026) A review on student behavior detection. In: Advances in smart computing and applications. Springer, Cham, pp 255\u2013268","DOI":"10.1007\/978-3-032-00350-8_19"},{"key":"489_CR72","doi-asserted-by":"crossref","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: Unified, real-time object detection. In: 2016 IEEE conference on computer vision and pattern recognition (CVPR), pp 779\u2013788","DOI":"10.1109\/CVPR.2016.91"},{"key":"489_CR73","unstructured":"Redmon J, Farhadi A (2018) Yolov3: An incremental improvement"},{"issue":"6","key":"489_CR74","doi-asserted-by":"publisher","first-page":"1137","DOI":"10.1109\/TPAMI.2016.2577031","volume":"39","author":"S Ren","year":"2017","unstructured":"Ren S, He K, Girshick R, Sun J (2017) Faster r-cnn: Towards real-time object detection with region proposal networks. IEEE Trans Pattern Anal Mach Intell 39(6):1137\u20131149","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"1\u20133","key":"489_CR75","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1007\/s11263-007-0090-8","volume":"77","author":"BC Russell","year":"2008","unstructured":"Russell BC, Torralba A, Murphy KP, Freeman WT (2008) Labelme: A database and web-based tool for image annotation. Int J Comput Vis 77(1\u20133):157\u2013173","journal-title":"Int J Comput Vis"},{"key":"489_CR76","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1016\/j.neucom.2019.05.031","volume":"359","author":"J Si","year":"2019","unstructured":"Si J, Lin J, Jiang F, Shen R (2019) Hand-raising gesture detection in real classrooms using improved r-fcn. Neurocomputing 359:69\u201376","journal-title":"Neurocomputing"},{"key":"489_CR77","unstructured":"Solawetz J (2020) Yolov5 new version - improvements and evaluation"},{"key":"489_CR78","doi-asserted-by":"publisher","first-page":"8335","DOI":"10.1007\/s00521-020-05587-y","volume":"33","author":"B Sun","year":"2021","unstructured":"Sun B, Wu Y, Zhao K et al (2021) Student class behavior dataset: a video dataset for recognizing, detecting, and captioning students\u2019 behaviors in classroom scenes. Neural Comput Applic 33:8335\u20138354","journal-title":"Neural Comput Applic"},{"key":"489_CR79","first-page":"1","volume":"74","author":"Z Tang","year":"2025","unstructured":"Tang Z, Fang L, Sun S, Gong Y, Li Q (2025) Ml-detr: Multiscale-lite detection transformer for identification of mature cherry tomatoes. IEEE Trans Instrum Meas 74:1\u201318","journal-title":"IEEE Trans Instrum Meas"},{"key":"489_CR80","doi-asserted-by":"crossref","unstructured":"Tang W, Cheng Y, Ai M, Yi X (2022) Case study on a high-quality information technology lesson based on ifias. In: ACM international conference proceeding series, pp 327\u2013332","DOI":"10.1145\/3582580.3582637"},{"key":"489_CR81","doi-asserted-by":"crossref","unstructured":"Tang J, Mai F, Xie X (2024) Intelligent recognition of teaching behaviors in smart classroom. In: 2024 International conference on informatics education and computer technology applications, pp 54\u201360","DOI":"10.1109\/IECA62822.2024.00017"},{"key":"489_CR82","unstructured":"Tian Y, Ye Q, Doermann D (2025) YOLOv12: attention-centric real-time object detectors. arxiv:2502.12524"},{"key":"489_CR83","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser L, Polosukhin I (2017) Attention is all you need"},{"key":"489_CR84","doi-asserted-by":"crossref","unstructured":"Wang C (2021) Analysis of students\u2019 behavior in english online education based on data mining. Mobile Inf Syst 2021(1)","DOI":"10.1155\/2021\/1856690"},{"key":"489_CR85","doi-asserted-by":"crossref","unstructured":"Wang C-Y, Bochkovskiy A, Liao H-YM (2022) YOLOv7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"489_CR86","doi-asserted-by":"publisher","first-page":"111996","DOI":"10.1016\/j.patcog.2025.111996","volume":"169","author":"L Wang","year":"2026","unstructured":"Wang L, Xu X (2026) Db-sbr: A dual-backbone model for student behavior recognition. Pattern Recognit 169:111996","journal-title":"Pattern Recognit"},{"key":"489_CR87","doi-asserted-by":"publisher","first-page":"125392","DOI":"10.1016\/j.eswa.2024.125392","volume":"260","author":"Z Wang","year":"2025","unstructured":"Wang Z, Li L, Zeng C, Dong S, Sun J (2025) Slbdetection-net: Towards closed-set and open-set student learning behavior detection in smart classroom of k-12 education. Expert Syst Appl 260:125392","journal-title":"Expert Syst Appl"},{"key":"489_CR88","doi-asserted-by":"crossref","unstructured":"Wang D, Chen G (2025) Evaluating the use of bert and llama to analyse classroom dialogue for teachers\u2019 learning of dialogic pedagogy. British J Educ Technol","DOI":"10.1111\/bjet.13604"},{"key":"489_CR89","doi-asserted-by":"crossref","unstructured":"Wang A, Chen H, Liu L, Chen K, Lin Z, Han J, Ding G (2024) YOLOv10: real-time end-to-end object detection","DOI":"10.52202\/079017-3429"},{"key":"489_CR90","doi-asserted-by":"crossref","unstructured":"Wang Z, Ji Y, Xue K, Lin S, Yang L, Jin Y, Tan S (2023) Multi-scale classroom behavior recognition study based on ca-yolov7. In: 2023 International conference on image processing, computer vision and machine learning (ICICML), pp 294\u2013301","DOI":"10.1109\/ICICML60161.2023.10424952"},{"key":"489_CR91","unstructured":"Wang Z, Wang M, Zeng C, Li L (2024) Multi-scale deformable transformers for student learning behavior detection in smart classroom arxiv:2410.07834"},{"key":"489_CR92","doi-asserted-by":"crossref","unstructured":"Wang Z, Yao J, Zeng C, Li L, Tan C (2023) Students\u2019 classroom behavior detection system incorporating deformable detr with swin transformer and light-weight feature pyramid network. Systems 11(7)","DOI":"10.3390\/systems11070372"},{"key":"489_CR93","doi-asserted-by":"crossref","unstructured":"Wang Z, Zhou Z, Chen Y, Zheng T, He Y (2024) Classroom behavior recognition model for elementary and middle school students based on improved yolopose and feature fusion. In: 2024 International joint conference on neural networks (IJCNN), pp 1\u20138","DOI":"10.1109\/IJCNN60899.2024.10651244"},{"issue":"1","key":"489_CR94","first-page":"8269683","volume":"2020","author":"D Wu","year":"2020","unstructured":"Wu D, Chen J, Deng W, Wei Y, Luo H, Wei Y (2020) The recognition of teacher behavior based on multimodal information fusion. Math Probl Eng 2020(1):8269683","journal-title":"Math Probl Eng"},{"key":"489_CR95","doi-asserted-by":"publisher","first-page":"9989","DOI":"10.1007\/s10639-023-12058-z","volume":"29","author":"Y Xiong","year":"2024","unstructured":"Xiong Y, Xinya G, Xu J (2024) Cnn-transformer: A deep learning method for automatically identifying learning engagement. Educ Inf Technol 29:9989\u201310008","journal-title":"Educ Inf Technol"},{"key":"489_CR96","doi-asserted-by":"publisher","first-page":"111668","DOI":"10.1016\/j.engappai.2025.111668","volume":"159","author":"Y Xiong","year":"2025","unstructured":"Xiong Y, He C, Chen L, Cai T (2025) Spatio-temporal graph interaction networks for teacher behavior description in classroom scene. Eng Appl Artif Intell 159:111668","journal-title":"Eng Appl Artif Intell"},{"issue":"4","key":"489_CR97","doi-asserted-by":"publisher","first-page":"1297","DOI":"10.1002\/ajae.12041","volume":"102","author":"X Xu","year":"2020","unstructured":"Xu X (2020) Corn cash price forecasting. Am J Agric Econ 102(4):1297\u20131320","journal-title":"Am J Agric Econ"},{"issue":"2","key":"489_CR98","doi-asserted-by":"publisher","first-page":"1044","DOI":"10.1109\/TAFFC.2024.3491106","volume":"16","author":"L Xu","year":"2025","unstructured":"Xu L, Gan Y, Jin Y (2025) Class activation regularization-based facial emotion recognition network and its application in students\u2019 emotional engagement assessment. IEEE Trans Affect Comput 16(2):1044\u20131055","journal-title":"IEEE Trans Affect Comput"},{"key":"489_CR99","unstructured":"Yang F (2023) Scb-dataset: A dataset for detecting student classroom behavior. arXiv:2304.02488"},{"key":"489_CR100","doi-asserted-by":"crossref","unstructured":"Yang J, Chen Z, Kochan O, Fedchyshyn O (2024) Fkd-yolo: a lightweight student classroom behavior recognition algorithm. In: 2024 14th International conference on advanced computer information technologies (ACIT), pp 729\u2013734","DOI":"10.1109\/ACIT62333.2024.10712466"},{"key":"489_CR101","doi-asserted-by":"crossref","unstructured":"Yang W, Some L, Bain M, Kang B (2025) A comprehensive survey on integrating large language models with knowledge-based methods. Knowl-Based Syst 318","DOI":"10.1016\/j.knosys.2025.113503"},{"key":"489_CR102","unstructured":"Yang F, Wang T (2024) SCB-Dataset3: a benchmark for detecting student classroom behavior"},{"key":"489_CR103","doi-asserted-by":"crossref","unstructured":"Yang F, Wang T, Wang X (2023) Student classroom behavior detection based on yolov7+bra and multi-model fusion. In: Image and graphics, pp 41\u201352. Springer, Cham","DOI":"10.1007\/978-3-031-46311-2_4"},{"key":"489_CR104","doi-asserted-by":"publisher","first-page":"845","DOI":"10.18280\/ts.380331","volume":"38","author":"JY Yu","year":"2021","unstructured":"Yu JY, Bai XJ (2021) Analysis of classroom learning behaviors based on internet of things and image processing. Traitement du Signal 38:845\u2013851","journal-title":"Traitement du Signal"},{"key":"489_CR105","doi-asserted-by":"crossref","unstructured":"Yu S, Androsov A, Yan H (2025) Exploring the prospects of multimodal large language models for automated emotion recognition in education: Insights from gemini. Comput Educ 232","DOI":"10.1016\/j.compedu.2025.105307"},{"key":"489_CR106","doi-asserted-by":"crossref","unstructured":"Yun S, Ro Y (2024) Shvit: Single-head vision transformer with memory efficient macro design. In: 2024 IEEE\/CVF conference on computer vision and pattern recognition (CVPR), pp 5756\u20135767","DOI":"10.1109\/CVPR52733.2024.00550"},{"issue":"12","key":"489_CR107","doi-asserted-by":"publisher","first-page":"12399","DOI":"10.1109\/TCSVT.2024.3436029","volume":"34","author":"W-L Zhang","year":"2024","unstructured":"Zhang W-L, Jia R-S, Wang H, Che C-Y, Sun H-M (2024) A self-supervised learning network for student engagement recognition from facial expressions. IEEE Trans Circ Syst Video Technol 34(12):12399\u201312410","journal-title":"IEEE Trans Circ Syst Video Technol"},{"issue":"14","key":"489_CR108","doi-asserted-by":"publisher","first-page":"12325","DOI":"10.1007\/s00371-025-04159-2","volume":"41","author":"H Zhang","year":"2025","unstructured":"Zhang H, Peng Y, Liu Y (2025) Multimodal fusion for real-time classroom engagement assessment using yolov9 and deepface. Vis Comput 41(14):12325\u201312337","journal-title":"Vis Comput"},{"issue":"5","key":"489_CR109","doi-asserted-by":"publisher","first-page":"2097","DOI":"10.26599\/TST.2024.9010097","volume":"30","author":"J Zhang","year":"2025","unstructured":"Zhang J, Xu C, Shen S, Zhu J, Zhang P (2025) Mff-yolo: An improved yolo algorithm based on multi-scale semantic feature fusion. Tsinghua Sci Technol 30(5):2097\u20132113","journal-title":"Tsinghua Sci Technol"},{"key":"489_CR110","doi-asserted-by":"crossref","unstructured":"Zhang Y, Wu Z, Chen X, Dai L, Li Z, Zong X, Liu T (2020) Classroom behavior recognition based on improved yolov3. In: 2020 International conference on artificial intelligence and education (ICAIE), pp 93\u201397","DOI":"10.1109\/ICAIE50891.2020.00029"},{"key":"489_CR111","doi-asserted-by":"crossref","unstructured":"Zhao J, Zhu H (2023) Cbph-net: A small object detector for behavior recognition in classroom scenarios. IEEE Trans Instrum Meas 72:1\u201312","DOI":"10.1109\/TIM.2023.3296124"},{"key":"489_CR112","doi-asserted-by":"crossref","unstructured":"Zhao J, Li J, Jia J (2021) A study on posture-based teacher-student behavioral engagement pattern. Sustain Cities Soc 67:102749","DOI":"10.1016\/j.scs.2021.102749"},{"issue":"8","key":"489_CR113","doi-asserted-by":"publisher","first-page":"101670","DOI":"10.1016\/j.jksuci.2023.101670","volume":"35","author":"J Zhao","year":"2023","unstructured":"Zhao J, Zhu H, Niu L (2023) Bitnet: A lightweight object detection network for real-time classroom behavior recognition with transformer and bi-directional pyramid network. J King Saud Univ Comput Inf Sci 35(8):101670","journal-title":"J King Saud Univ Comput Inf Sci"},{"key":"489_CR114","doi-asserted-by":"crossref","unstructured":"Zhao Q, Liang Z (2023) Research on multimodal based learning evaluation method in smart classroom. Learn Motiv 84","DOI":"10.1016\/j.lmot.2023.101943"},{"key":"489_CR115","doi-asserted-by":"crossref","unstructured":"Zheng R, Jiang F, Shen R (2020) Intelligent student behavior analysis system for real classrooms. In: 2020 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 9244\u20139248","DOI":"10.1109\/ICASSP40776.2020.9053457"},{"key":"489_CR116","doi-asserted-by":"crossref","unstructured":"Zheng R, Jiang F, Shen R (2020) Intelligent student behavior analysis system for real classrooms. In: 2020 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 9244\u20139248","DOI":"10.1109\/ICASSP40776.2020.9053457"},{"issue":"1","key":"489_CR117","doi-asserted-by":"publisher","first-page":"254","DOI":"10.1109\/TETC.2023.3344131","volume":"12","author":"D Zhou","year":"2024","unstructured":"Zhou D, Yu H, Yu J, Zhao S, Xu W, Li Q, Cai F (2024) Mfds-stgcn: Predicting the behaviors of college students with fine-grained spatial-temporal activities data. IEEE Trans Emerging Top Comput 12(1):254\u2013265","journal-title":"IEEE Trans Emerging Top Comput"},{"key":"489_CR118","doi-asserted-by":"crossref","unstructured":"Zhou H, Jiang F, Si J, Xiong L, Lu H (2023) Stuart: Individualized classroom observation of students with automatic behavior recognition and tracking. In: 2023 IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 1\u20135","DOI":"10.1109\/ICASSP49357.2023.10094982"},{"key":"489_CR119","unstructured":"Zhu X, Su W, Lu L, Li B, Wang X, Dai J (2021) Deformable detr: Deformable transformers for end-to-end object detection. In: ICLR 2021 - 9th international conference on learning representations"}],"container-title":["Journal of King Saud University Computer and Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s44443-026-00489-w","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s44443-026-00489-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s44443-026-00489-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T01:03:24Z","timestamp":1777943004000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s44443-026-00489-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,28]]},"references-count":119,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2026,4]]}},"alternative-id":["489"],"URL":"https:\/\/doi.org\/10.1007\/s44443-026-00489-w","relation":{},"ISSN":["1319-1578","2213-1248"],"issn-type":[{"value":"1319-1578","type":"print"},{"value":"2213-1248","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,28]]},"assertion":[{"value":"24 September 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing Interest"}}],"article-number":"99"}}