{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T10:40:17Z","timestamp":1737110417883,"version":"3.33.0"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,9]],"date-time":"2024-12-09T00:00:00Z","timestamp":1733702400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,9]],"date-time":"2024-12-09T00:00:00Z","timestamp":1733702400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,9]]},"DOI":"10.1109\/tale62452.2024.10834376","type":"proceedings-article","created":{"date-parts":[[2025,1,15]],"date-time":"2025-01-15T19:36:30Z","timestamp":1736969790000},"page":"1-7","source":"Crossref","is-referenced-by-count":0,"title":["Video-Based Recognition of Online Learning Behaviors Using Attention Mechanisms"],"prefix":"10.1109","author":[{"given":"Bingchao","family":"Huang","sequence":"first","affiliation":[{"name":"Beihang University,Sino-French Engineer School,Beijing,China"}]},{"given":"Chuantao","family":"Yin","sequence":"additional","affiliation":[{"name":"Beihang University,Sino-French Engineer School,Beijing,China"}]},{"given":"Chao","family":"Wang","sequence":"additional","affiliation":[{"name":"EURECOM Sorbonne University,Biot,France"}]},{"given":"Hui","family":"Chen","sequence":"additional","affiliation":[{"name":"Beihang University,Department of Planning and Finance,Beijing,China"}]},{"given":"Yanmei","family":"Chai","sequence":"additional","affiliation":[{"name":"Central University of Finance and Economics,School of Information,Beijing,China"}]},{"given":"Yuanxin","family":"Ouyang","sequence":"additional","affiliation":[{"name":"Beihang University,School of Computer Science and Engineering,Beijing,China"}]}],"member":"263","reference":[{"key":"ref1","first-page":"30","article-title":"Attention is all you need[J]","author":"Vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2017.10.013"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2021.08.098"},{"article-title":"Very deep convolutional networks for large-scale image recognition[C]","volume-title":"3rd International Conference on Learning Representations, ICLR 2015, San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings","author":"Simonyan","key":"ref6"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-33-6757-9_61"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3501409.3501529"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.4324\/9780203978948-13"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2021.675827"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.3390\/s21165314"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18280\/ts.380109"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/s00521-020-05587-y"},{"article-title":"Daisee: Towards user engagement recognition in the wild[J]","year":"2016","author":"Gupta","key":"ref14"},{"article-title":"Blazeface: Sub-millisecond neural face detection on mobile gpus[J]","year":"2019","author":"Bazarevsky","key":"ref15"},{"article-title":"An image is worth 16x16 words: Transformers for image recognition at scale[J]","volume-title":"ICLR","author":"Dosovitskiy","key":"ref16"},{"article-title":"Mediapipe: A framework for building perception pipelines","year":"2019","author":"Lugaresi","key":"ref17"},{"article-title":"How to train your vit? data, augmentation, and regularization in vision transformers[J]","year":"2021","author":"Steiner","key":"ref18"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00140"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52688.2022.01169"},{"article-title":"Vision transformers need registers","year":"2023","author":"Darcet","key":"ref21"},{"article-title":"Multi-scale Transformers with Adaptive Pathways for Time Series Forecasting","volume-title":"The Twelfth International Conference on Learning Representations","author":"Chen","key":"ref22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00292"},{"article-title":"Regionvit: Regional-to-local attention for vision transformers[C]","year":"2021","author":"Chen","key":"ref24"}],"event":{"name":"2024 IEEE International Conference on Teaching, Assessment and Learning for Engineering (TALE)","start":{"date-parts":[[2024,12,9]]},"location":"Bengaluru, India","end":{"date-parts":[[2024,12,12]]}},"container-title":["2024 IEEE International Conference on Teaching, Assessment and Learning for Engineering (TALE)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10834301\/10834287\/10834376.pdf?arnumber=10834376","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T06:09:16Z","timestamp":1737007756000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10834376\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,9]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/tale62452.2024.10834376","relation":{},"subject":[],"published":{"date-parts":[[2024,12,9]]}}}