{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,27]],"date-time":"2026-03-27T19:02:21Z","timestamp":1774638141118,"version":"3.50.1"},"reference-count":8,"publisher":"Wiley","issue":"6","license":[{"start":{"date-parts":[[2025,10,4]],"date-time":"2025-10-04T00:00:00Z","timestamp":1759536000000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/onlinelibrary.wiley.com\/termsAndConditions#vor"}],"content-domain":{"domain":["onlinelibrary.wiley.com"],"crossmark-restriction":true},"short-container-title":["Internet Technology Letters"],"published-print":{"date-parts":[[2025,11]]},"abstract":"<jats:title>ABSTRACT<\/jats:title>\n                  <jats:p>This letter presents a novel framework combining large language models with a sparse attention vision transformer (SA\u2010ViT) to classify English teaching video traffic in wireless networks. Our approach analyzes both visual content frames and extracted English speech transcripts to identify educational content types, difficulty levels, and priority requirements. The proposed model transforms video frames into visual patches while simultaneously processing English linguistic content through pre\u2010trained language models, enabling an understanding of educational multimedia traffic. Through extensive evaluation of real\u2010world English teaching video datasets transmitted over wireless networks, our SA\u2010ViT framework achieves 97.5% classification accuracy, representing an 11.3% improvement over conventional video traffic classification methods. The results demonstrate effective integration of visual understanding, English language comprehension, and wireless network optimization for enhanced educational content delivery.<\/jats:p>","DOI":"10.1002\/itl2.70153","type":"journal-article","created":{"date-parts":[[2025,10,4]],"date-time":"2025-10-04T07:49:20Z","timestamp":1759564160000},"update-policy":"https:\/\/doi.org\/10.1002\/crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Intelligent English Teaching Video Traffic Classification in Wireless Communication Networks via Large Model\u2010Enhanced Sparse Attention Vision Transformer"],"prefix":"10.1002","volume":"8","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-2016-4694","authenticated-orcid":false,"given":"Jinjin","family":"Liu","sequence":"first","affiliation":[{"name":"Huanghe University of Science and Technology  Zhengzhou People's Republic of China"}]}],"member":"311","published-online":{"date-parts":[[2025,10,4]]},"reference":[{"key":"e_1_2_6_2_1","doi-asserted-by":"publisher","DOI":"10.17223\/19996195\/58\/13"},{"key":"e_1_2_6_3_1","doi-asserted-by":"publisher","DOI":"10.1155\/2021\/7404712"},{"issue":"30","key":"e_1_2_6_4_1","first-page":"123","article-title":"Synchronous Computer\u2010Mediated Communication in English Pronunciation Teaching: A Case Study of Rovira i Virgili University","volume":"15","author":"Vazquez L. Q.","year":"2023","journal-title":"Journal of Learning Styles"},{"key":"e_1_2_6_5_1","doi-asserted-by":"publisher","DOI":"10.32604\/cmc.2022.021780"},{"key":"e_1_2_6_6_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-98355-0_35"},{"key":"e_1_2_6_7_1","first-page":"1965","volume-title":"TRANSTL: Spatial\u2010Temporal Localization Transformer for Multi\u2010Label Video Classification","author":"Wu H. J.","year":"2023"},{"key":"e_1_2_6_8_1","first-page":"502","article-title":"HaViT: Hybrid\u2010Attention Based Vision Transformer for Video Classification","volume":"13844","author":"Li L.","year":"2023","journal-title":"Computer VISION"},{"key":"e_1_2_6_9_1","article-title":"HaViT: Hybrid\u2010Attention Based Vision Transformer for Video Classification","volume":"178","author":"Hammou B. A.","year":"2023","journal-title":"International Journal of Medical Informatics"}],"container-title":["Internet Technology Letters"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/onlinelibrary.wiley.com\/doi\/pdf\/10.1002\/itl2.70153","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,10]],"date-time":"2025-11-10T12:20:28Z","timestamp":1762777228000},"score":1,"resource":{"primary":{"URL":"https:\/\/onlinelibrary.wiley.com\/doi\/10.1002\/itl2.70153"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,4]]},"references-count":8,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2025,11]]}},"alternative-id":["10.1002\/itl2.70153"],"URL":"https:\/\/doi.org\/10.1002\/itl2.70153","archive":["Portico"],"relation":{"has-review":[{"id-type":"doi","id":"10.1002\/ITL2.70153\/v2\/review1","asserted-by":"object"},{"id-type":"doi","id":"10.1002\/ITL2.70153\/v2\/decision1","asserted-by":"object"},{"id-type":"doi","id":"10.1002\/ITL2.70153\/v2\/response1","asserted-by":"object"},{"id-type":"doi","id":"10.1002\/ITL2.70153\/v1\/review2","asserted-by":"object"},{"id-type":"doi","id":"10.1002\/ITL2.70153\/v2\/review2","asserted-by":"object"},{"id-type":"doi","id":"10.1002\/ITL2.70153\/v1\/review1","asserted-by":"object"},{"id-type":"doi","id":"10.1002\/ITL2.70153\/v1\/decision1","asserted-by":"object"}]},"ISSN":["2476-1508","2476-1508"],"issn-type":[{"value":"2476-1508","type":"print"},{"value":"2476-1508","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,10,4]]},"assertion":[{"value":"2025-06-20","order":0,"name":"received","label":"Received","group":{"name":"publication_history","label":"Publication History"}},{"value":"2025-09-16","order":2,"name":"accepted","label":"Accepted","group":{"name":"publication_history","label":"Publication History"}},{"value":"2025-10-04","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}],"article-number":"e70153"}}