{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,28]],"date-time":"2026-03-28T16:44:13Z","timestamp":1774716253785,"version":"3.50.1"},"reference-count":53,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2024,7,27]],"date-time":"2024-07-27T00:00:00Z","timestamp":1722038400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,7,27]],"date-time":"2024-07-27T00:00:00Z","timestamp":1722038400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100008871","name":"Yunnan Province Science and Technology Department","doi-asserted-by":"crossref","award":["202305AF150045"],"award-info":[{"award-number":["202305AF150045"]}],"id":[{"id":"10.13039\/501100008871","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Yunnan Development and Reform Commission","award":["YNWR-CYJS-2020-017"],"award-info":[{"award-number":["YNWR-CYJS-2020-017"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Real-Time Image Proc"],"published-print":{"date-parts":[[2024,8]]},"DOI":"10.1007\/s11554-024-01515-8","type":"journal-article","created":{"date-parts":[[2024,7,27]],"date-time":"2024-07-27T03:28:34Z","timestamp":1722050914000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":32,"title":["Csb-yolo: a rapid and efficient real-time algorithm for classroom student behavior 
detection"],"prefix":"10.1007","volume":"21","author":[{"given":"Wenqi","family":"Zhu","sequence":"first","affiliation":[]},{"given":"Zhijun","family":"Yang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,7,27]]},"reference":[{"key":"1515_CR1","doi-asserted-by":"publisher","first-page":"224","DOI":"10.1016\/j.patrec.2019.11.023","volume":"129","author":"B Yang","year":"2020","unstructured":"Yang, B., Yao, Z., Lu, H., Zhou, Y., Xu, J.: In-classroom learning analytics based on student behavior, topic and teaching characteristic mining. Pattern Recogn. Lett. 129, 224\u2013231 (2020)","journal-title":"Pattern Recogn. Lett."},{"issue":"4","key":"1515_CR2","first-page":"361","volume":"20","author":"SK D\u2019Mello","year":"2010","unstructured":"D\u2019Mello, S.K., Lehman, B., Person, N.: Monitoring affect states during effortful problem solving activities. Int. J. Artif. Intell. Educ. 20(4), 361\u2013389 (2010)","journal-title":"Int. J. Artif. Intell. Educ."},{"issue":"5","key":"1515_CR3","doi-asserted-by":"publisher","first-page":"398","DOI":"10.5573\/IEIESPC.2023.12.5.398","volume":"12","author":"X Su","year":"2023","unstructured":"Su, X., Wang, W.: Recognition and identification of college students\u2019 classroom behaviors through deep learning. IEIE Transactions on Smart Processing & Computing 12(5), 398\u2013403 (2023)","journal-title":"IEIE Transactions on Smart Processing & Computing"},{"issue":"10","key":"1515_CR4","doi-asserted-by":"publisher","first-page":"12861","DOI":"10.1007\/s11227-022-04402-w","volume":"78","author":"S Liu","year":"2022","unstructured":"Liu, S., Zhang, J., Su, W.: An improved method of identifying learner\u2019s behaviors based on deep learning. J. Supercomput. 78(10), 12861\u201312872 (2022)","journal-title":"J. 
Supercomput."},{"key":"1515_CR5","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation, in: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 580\u2013587 (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"1515_CR6","doi-asserted-by":"crossref","unstructured":"Girshick, R.: Fast r-cnn, in: Proceedings of the IEEE international conference on computer vision, pp. 1440\u20131448 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"key":"1515_CR7","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster r-cnn: Towards real-time object detection with region proposal networks, Advances in neural information processing systems 28 (2015)"},{"key":"1515_CR8","doi-asserted-by":"crossref","unstructured":"Redmon, J., Divvala, S., Girshick, R., Farhadi, A.: You only look once: Unified, real-time object detection, in: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 779\u2013788 (2016)","DOI":"10.1109\/CVPR.2016.91"},{"key":"1515_CR9","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Goyal, P., Girshick, R., He, K., Doll\u00e1r, P.: Focal loss for dense object detection, in: Proceedings of the IEEE international conference on computer vision, pp. 2980\u20132988 (2017)","DOI":"10.1109\/ICCV.2017.324"},{"key":"1515_CR10","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.-Y., Berg, A.C.: Ssd: Single shot multibox detector, in: Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, Proceedings, Part I 14, Springer, 2016, pp. 
21\u201337 (2016)","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"1515_CR11","doi-asserted-by":"crossref","unstructured":"Sultana, F., Sufian, A., Dutta, P.: A review of object detection models based on convolutional neural network, Intelligent computing: image processing based applications 1\u201316 (2020)","DOI":"10.1007\/978-981-15-4288-6_1"},{"key":"1515_CR12","doi-asserted-by":"crossref","unstructured":"Zhao, J., Zhu, H.: Cbph-net: A small object detector for behavior recognition in classroom scenarios, IEEE Transactions on Instrumentation and Measurement (2023)","DOI":"10.1109\/TIM.2023.3296124"},{"key":"1515_CR13","doi-asserted-by":"crossref","unstructured":"Tan, M., Pang, R., Le, Q.V.: Efficientdet: Scalable and efficient object detection, in: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10781\u201310790 (2020)","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"1515_CR14","doi-asserted-by":"crossref","unstructured":"Liu, J.-J., Hou, Q., Cheng, M.-M., Wang, C., Feng, J.: Improving convolutional networks with self-calibrated convolutions, in: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10096\u201310105 (2020)","DOI":"10.1109\/CVPR42600.2020.01011"},{"key":"1515_CR15","unstructured":"Lee, J., Park, S., Mo, S., Ahn, S., Shin, J.: Layer-adaptive sparsity for the magnitude-based pruning, arXiv preprint (2020) arXiv:2010.07611"},{"key":"1515_CR16","doi-asserted-by":"crossref","unstructured":"Yang, L., Zhou, X., Li, X., Qiao, L., Li, Z., Yang, Z., Wang, G., Li, X.: Bridging cross-task protocol inconsistency for distillation in dense object detection, in: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 
17175\u201317184 (2023)","DOI":"10.1109\/ICCV51070.2023.01575"},{"key":"1515_CR17","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1016\/j.cag.2022.11.009","volume":"110","author":"G Zhang","year":"2023","unstructured":"Zhang, G., Wang, L., Wang, L., Chen, Z.: Hand-raising gesture detection in classroom with spatial context augmentation and dilated convolution. Computers & Graphics 110, 151\u2013161 (2023)","journal-title":"Computers & Graphics"},{"key":"1515_CR18","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection, in: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"1515_CR19","doi-asserted-by":"crossref","unstructured":"Wang, Z., Jiang, F., Shen, R.: An effective yawn behavior detection method in classroom, in: International conference on neural information processing, Springer, pp. 430\u2013441 (2019)","DOI":"10.1007\/978-3-030-36708-4_35"},{"key":"1515_CR20","unstructured":"Dai, J., Li, Y., He, K., Sun, J.: R-fcn: Object detection via region-based fully convolutional networks, Advances in neural information processing systems 29 (2016)"},{"issue":"23","key":"1515_CR21","doi-asserted-by":"publisher","first-page":"3998","DOI":"10.3390\/electronics11233998","volume":"11","author":"H Chen","year":"2022","unstructured":"Chen, H., Guan, J.: Teacher-student behavior recognition in classroom teaching based on improved yolo-v4 and internet of things technology. 
Electronics 11(23), 3998 (2022)","journal-title":"Electronics"},{"key":"1515_CR22","unstructured":"Bochkovskiy, A., Wang, C.-Y., Liao, H.-Y.M.: Yolov4: Optimal speed and accuracy of object detection, arXiv preprint (2020) arXiv:2004.10934"},{"key":"1515_CR23","doi-asserted-by":"crossref","unstructured":"Bao, D., Su, W.: Research on the detection and analysis of students\u2019 classroom behavioral features based on deep cnns, ACM Transactions on Asian and Low-Resource Language Information Processing (2023)","DOI":"10.1145\/3615865"},{"key":"1515_CR24","doi-asserted-by":"crossref","unstructured":"Han, K., Wang, Y., Tian, Q., Guo, J., Xu, C., Xu, C.: Ghostnet: More features from cheap operations, in: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 1580\u20131589 (2020)","DOI":"10.1109\/CVPR42600.2020.00165"},{"issue":"19","key":"1515_CR25","doi-asserted-by":"publisher","first-page":"8190","DOI":"10.3390\/s23198190","volume":"23","author":"Z Wang","year":"2023","unstructured":"Wang, Z., Li, L., Zeng, C., Yao, J.: Student learning behavior recognition incorporating data augmentation with learning feature representation in smart classrooms. Sensors 23(19), 8190 (2023)","journal-title":"Sensors"},{"key":"1515_CR26","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.-Y., Kweon, I.S.: Cbam: Convolutional block attention module, in: Proceedings of the European conference on computer vision (ECCV), pp. 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"1515_CR27","doi-asserted-by":"crossref","unstructured":"Wang, C.-Y., Bochkovskiy, A., Liao, H.-Y.M.: Yolov7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors, in: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 
7464\u20137475 (2023)","DOI":"10.1109\/CVPR52729.2023.00721"},{"issue":"20","key":"1515_CR28","doi-asserted-by":"publisher","first-page":"8385","DOI":"10.3390\/s23208385","volume":"23","author":"H Chen","year":"2023","unstructured":"Chen, H., Zhou, G., Jiang, H.: Student behavior detection in the classroom based on improved yolov8. Sensors 23(20), 8385 (2023)","journal-title":"Sensors"},{"issue":"2","key":"1515_CR29","doi-asserted-by":"publisher","first-page":"652","DOI":"10.1109\/TPAMI.2019.2938758","volume":"43","author":"S-H Gao","year":"2019","unstructured":"Gao, S.-H., Cheng, M.-M., Zhao, K., Zhang, X.-Y., Yang, M.-H., Torr, P.: Res2net: A new multi-scale backbone architecture. IEEE Trans. Pattern Anal. Mach. Intell. 43(2), 652\u2013662 (2019)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1515_CR30","doi-asserted-by":"crossref","unstructured":"Ouyang, D., He, S., Zhang, G., Luo, M., Guo, H., Zhan, J., Huang, Z.: Efficient multi-scale attention module with cross-spatial learning, in: ICASSP 2023-2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), IEEE, pp. 1\u20135 (2023)","DOI":"10.1109\/ICASSP49357.2023.10096516"},{"key":"1515_CR31","doi-asserted-by":"crossref","unstructured":"Liu, Q., Jiang, R., Xu, Q., Wang, D., Sang, Z., Jiang, X., Wu, L.: Yolov8n_bt: Research on classroom learning behavior recognition algorithm based on improved yolov8n, IEEE Access (2024)","DOI":"10.1109\/ACCESS.2024.3373536"},{"issue":"11","key":"1515_CR32","doi-asserted-by":"publisher","first-page":"3609","DOI":"10.3390\/s24113609","volume":"24","author":"G Xiao","year":"2024","unstructured":"Xiao, G., Xu, Q., Wei, Y., Yao, H., Liu, Q.: Occlusion robust cognitive engagement detection in real-world classroom. 
Sensors 24(11), 3609 (2024)","journal-title":"Sensors"},{"key":"1515_CR33","doi-asserted-by":"crossref","unstructured":"Jiang, Y., Zhu, X., Wang, X., Yang, S., Li, W., Wang, H., Fu, P., Luo, Z.: R2cnn: Rotational region cnn for orientation robust scene text detection, arXiv preprint (2017) arXiv:1706.09579","DOI":"10.1109\/ICPR.2018.8545598"},{"key":"1515_CR34","doi-asserted-by":"crossref","unstructured":"Liu, S., Qi, L., Qin, H., Shi, J., Jia, J.: Path aggregation network for instance segmentation, in: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 8759\u20138768 (2018)","DOI":"10.1109\/CVPR.2018.00913"},{"key":"1515_CR35","doi-asserted-by":"crossref","unstructured":"Ding, X., Zhang, X., Han, J., Ding, G.: Diverse branch block: Building a convolution as an inception-like unit, in: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 10886\u201310895 (2021)","DOI":"10.1109\/CVPR46437.2021.01074"},{"key":"1515_CR36","doi-asserted-by":"crossref","unstructured":"Ding, X., Guo, Y., Ding, G., Han, J.: Acnet: Strengthening the kernel skeletons for powerful cnn via asymmetric convolution blocks, in: Proceedings of the IEEE\/CVF international conference on computer vision, pp. 1911\u20131920 (2019)","DOI":"10.1109\/ICCV.2019.00200"},{"key":"1515_CR37","doi-asserted-by":"crossref","unstructured":"Ding, X., Zhang, X., Ma, N., Han, J., Ding, G., Sun, J.: Repvgg: Making vgg-style convnets great again, in: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 13733\u201313742 (2021)","DOI":"10.1109\/CVPR46437.2021.01352"},{"key":"1515_CR38","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: Accelerating deep network training by reducing internal covariate shift, in: International conference on machine learning, pmlr, pp. 
448\u2013456 (2015)"},{"key":"1515_CR39","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Liu, W., Jia, Y., Sermanet, P., Reed, S., Anguelov, D., Erhan, D., Vanhoucke, V., Rabinovich, A.: Going deeper with convolutions, in: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 1\u20139 (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"1515_CR40","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Vanhoucke, V., Ioffe, S., Shlens, J., Wojna, Z.: Rethinking the inception architecture for computer vision, in: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 2818\u20132826 (2016)","DOI":"10.1109\/CVPR.2016.308"},{"key":"1515_CR41","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Ioffe, S., Vanhoucke, V., Alemi, A.: Inception-v4, inception-resnet and the impact of residual connections on learning, in: Proceedings of the AAAI conference on artificial intelligence, Vol. 31, (2017)","DOI":"10.1609\/aaai.v31i1.11231"},{"key":"1515_CR42","unstructured":"Yang, F., Wang, T.: Scb-dataset3: A benchmark for detecting student classroom behavior, arXiv preprint (2023) arXiv:2310.02522"},{"key":"1515_CR43","unstructured":"Zhou, Z., Zhuge, C., Guan, X., Liu, W.: Channel distillation: Channel-wise attention for knowledge distillation, arXiv preprint (2020) arXiv:2006.01683"},{"key":"1515_CR44","doi-asserted-by":"crossref","unstructured":"Yang, Z., Li, Z., Shao, M., Shi, D., Yuan, Z., Yuan, C.: Masked generative distillation, in: European Conference on Computer Vision, Springer, pp. 53\u201369 (2022)","DOI":"10.1007\/978-3-031-20083-0_4"},{"key":"1515_CR45","doi-asserted-by":"crossref","unstructured":"Li, Q., Jin, S., Yan, J.: Mimicking very efficient network for object detection, in: Proceedings of the ieee conference on computer vision and pattern recognition, pp. 
6356\u20136364 (2017)","DOI":"10.1109\/CVPR.2017.776"},{"key":"1515_CR46","unstructured":"Hinton, G., Vinyals, O., Dean, J.: Distilling the knowledge in a neural network, arXiv preprint (2015) arXiv:1503.02531"},{"key":"1515_CR47","unstructured":"Jocher, G., Chaurasia, A., Qiu, J.: YOLOv8, (2023) https:\/\/github.com\/ultralytics\/ultralytics"},{"key":"1515_CR48","unstructured":"Redmon, J., Farhadi, A.: Yolov3: An incremental improvement, arXiv preprint (2018) arXiv:1804.02767"},{"key":"1515_CR49","unstructured":"Jocher, G.: YOLOv5, (2020) https:\/\/github.com\/ultralytics\/yolov5"},{"key":"1515_CR50","unstructured":"Li, C., Li, L., Jiang, H., Weng, K., Geng, Y., Li, L., Ke, Z., Li, Q., Cheng, M., Nie, W., et al.: Yolov6: A single-stage object detection framework for industrial applications, arXiv preprint (2022) arXiv:2209.02976"},{"key":"1515_CR51","unstructured":"Wang, C.-Y., Yeh, I.-H., Liao, H.-Y.M.: Yolov9: Learning what you want to learn using programmable gradient information, arXiv preprint (2024) arXiv:2402.13616"},{"key":"1515_CR52","unstructured":"Zhao, Y., Lv, W., Xu, S., Wei, J., Wang, G., Dang, Q., Liu, Y., Chen, J.: Detrs beat yolos on real-time object detection, arXiv preprint (2023) arXiv:2304.08069"},{"key":"1515_CR53","doi-asserted-by":"crossref","unstructured":"Dai, X., Chen, Y., Xiao, B., Chen, D., Liu, M., Yuan, L., Zhang, L.: Dynamic head: Unifying object detection heads with attentions, in: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 
7373\u20137382 (2021)","DOI":"10.1109\/CVPR46437.2021.00729"}],"container-title":["Journal of Real-Time Image Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-024-01515-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11554-024-01515-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-024-01515-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,27]],"date-time":"2024-08-27T16:34:17Z","timestamp":1724776457000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11554-024-01515-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,27]]},"references-count":53,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2024,8]]}},"alternative-id":["1515"],"URL":"https:\/\/doi.org\/10.1007\/s11554-024-01515-8","relation":{},"ISSN":["1861-8200","1861-8219"],"issn-type":[{"value":"1861-8200","type":"print"},{"value":"1861-8219","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,7,27]]},"assertion":[{"value":"29 April 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 July 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 July 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to 
influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"140"}}