{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,17]],"date-time":"2026-03-17T09:00:46Z","timestamp":1773738046450,"version":"3.50.1"},"reference-count":239,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T00:00:00Z","timestamp":1768867200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T00:00:00Z","timestamp":1768867200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100004739","name":"Youth Innovation Promotion Association of the Chinese Academy of Sciences","doi-asserted-by":"publisher","award":["E1290301"],"award-info":[{"award-number":["E1290301"]}],"id":[{"id":"10.13039\/501100004739","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1007\/s11263-025-02672-4","type":"journal-article","created":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T08:35:47Z","timestamp":1768898147000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["A Decade of Action Quality Assessment: Largest Systematic Survey of Trends, Challenges, and Future Directions"],"prefix":"10.1007","volume":"134","author":[{"ORCID":"https:\/\/orcid.org\/0009-0001-0943-3502","authenticated-orcid":false,"given":"Hao","family":"Yin","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0002-9894-9523","authenticated-orcid":false,"given":"Paritosh","family":"Parmar","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0007-9942-3204","authenticated-orcid":false,"given":"Daoliang","family":"Xu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2615-3585","authenticated-orcid":false,"given":"Yang","family":"Zhang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2310-2988","authenticated-orcid":false,"given":"Tianyou","family":"Zheng","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7192-3118","authenticated-orcid":false,"given":"Weiwei","family":"Fu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,1,20]]},"reference":[{"key":"2672_CR1","doi-asserted-by":"crossref","unstructured":"Abedi, A., & Khan, S. S. (2021). Improving state-of-the-art in detecting student engagement with resnet and tcn hybrid network. In Conference on robots and vision, pp. 151\u2013157. IEEE.","DOI":"10.1109\/CRV52889.2021.00028"},{"key":"2672_CR2","doi-asserted-by":"crossref","unstructured":"An, Q., Qi, M., & Ma, H. (2024). Multi-stage contrastive regression for action quality assessment. In IEEE international conference on acoustics, speech and signal processing, pp. 4110\u20134114. IEEE.","DOI":"10.1109\/ICASSP48485.2024.10447069"},{"issue":"3","key":"2672_CR3","doi-asserted-by":"crossref","first-page":"1755","DOI":"10.1109\/LRA.2023.3242466","volume":"8","author":"D Anastasiou","year":"2023","unstructured":"Anastasiou, D., Jin, Y., Stoyanov, D., & Mazomenos, E. (2023). Keep your eye on the best: Contrastive regression transformer for skill assessment in robotic surgery. IEEE Robotics and Automation Letters,8(3), 1755\u20131762.","journal-title":"IEEE Robotics and Automation Letters"},{"issue":"2","key":"2672_CR4","doi-asserted-by":"crossref","first-page":"103","DOI":"10.1080\/02701367.1988.10605486","volume":"59","author":"CJ Ansorge","year":"1988","unstructured":"Ansorge, C. J., & Scheer, J. K. (1988). International bias detected in judging gymnastic competition at the 1984 olympic games. Research Quarterly for Exercise and Sport,59(2), 103\u2013107.","journal-title":"Research Quarterly for Exercise and Sport"},{"key":"2672_CR5","doi-asserted-by":"crossref","unstructured":"Ashutosh, K., Nagarajan, T., Pavlakos, G., Kitani, K., & Grauman, K. (2025). Expertaf: Expert actionable feedback from video. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 13582\u201313594.","DOI":"10.1109\/CVPR52734.2025.01268"},{"key":"2672_CR6","unstructured":"Authors, G. (2024). Genesis: A universal and generative physics engine for robotics and beyond."},{"key":"2672_CR7","unstructured":"Bai, Y. (2023). Towards interaction-level video action understanding. Thesis."},{"key":"2672_CR8","doi-asserted-by":"crossref","unstructured":"Bai, Y., Zhou, D., Zhang, S., Wang, J., Ding, E., Guan, Y., Long, Y., & Wang, J. (2022). Action quality assessment with temporal parsing transformer. In European conference on computer vision, pp. 422\u2013438. Springer.","DOI":"10.1007\/978-3-031-19772-7_25"},{"key":"2672_CR9","doi-asserted-by":"crossref","unstructured":"Bertasius, G., Soo Park, H., Yu, S. X., & Shi, J. (2017). Am i a baller? basketball performance assessment from first-person videos. In Proceedings of the IEEE international conference on computer vision, pp. 2177\u20132185.","DOI":"10.1109\/ICCV.2017.239"},{"key":"2672_CR10","unstructured":"Bruce, X. B., Liu, Y., Chan, K. C. C., & Chen, C. W. (2024). Egcn++: A new fusion strategy for ensemble learning in skeleton-based rehabilitation exercise assessment. IEEE transactions on pattern analysis and machine intelligence."},{"key":"2672_CR11","unstructured":"Burgess, J., Wang, X., Zhang, Y., Rau, A., Lozano, A., Dunlap, L., Darrell, T., & Yeung-Levy, S. (2025). Video action differencing. arXiv preprint arXiv:2503.07860."},{"issue":"7","key":"2672_CR12","doi-asserted-by":"crossref","first-page":"1436","DOI":"10.1109\/TNSRE.2019.2923060","volume":"27","author":"M Capecci","year":"2019","unstructured":"Capecci, M., Ceravolo, M. G., Ferracuti, F., Iarlori, S., Monteriu, A., Romeo, L., & Verdini, F. (2019). The kimore dataset: Kinematic assessment of movement and clinical scores for remote monitoring of physical rehabilitation. IEEE Transactions on Neural Systems and Rehabilitation Engineering,27(7), 1436\u20131448.","journal-title":"IEEE Transactions on Neural Systems and Rehabilitation Engineering"},{"key":"2672_CR13","doi-asserted-by":"crossref","unstructured":"Carreira, J., & Zisserman, A. (2017). Quo vadis, action recognition? a new model and the kinetics dataset. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 6299\u20136308.","DOI":"10.1109\/CVPR.2017.502"},{"key":"2672_CR14","unstructured":"Carreira, J., Noland, E., Banki-Horvath, A., Hillier, C., & Zisserman, A. (2018). A short note about kinetics-600. arXiv preprint arXiv:1808.01340."},{"issue":"1","key":"2672_CR15","doi-asserted-by":"crossref","first-page":"3673","DOI":"10.1038\/s41467-020-17478-w","volume":"11","author":"DC Castro","year":"2020","unstructured":"Castro, D. C., Walker, I., & Glocker, B. (2020). Causality matters in medical imaging. Nature Communications,11(1), 3673.","journal-title":"Nature Communications"},{"issue":"6","key":"2672_CR16","doi-asserted-by":"crossref","first-page":"2566","DOI":"10.1016\/j.ridd.2011.07.002","volume":"32","author":"Y-J Chang","year":"2011","unstructured":"Chang, Y.-J., Chen, S.-F., & Huang, J.-D. (2011). A kinect-based system for physical rehabilitation: A pilot study for young adults with motor disabilities. Research in Developmental Disabilities,32(6), 2566\u20132570.","journal-title":"Research in Developmental Disabilities"},{"key":"2672_CR17","doi-asserted-by":"crossref","unstructured":"Chen, D., Graham, S., Depp, C., & Nguyen, T. (2021). Assessing physical rehabilitation exercises using graph convolutional network with self-supervised regularization. In Annual international conference of the IEEE engineering in medicine & biology society, pp. 281\u2013285. IEEE.","DOI":"10.1109\/EMBC46164.2021.9629569"},{"key":"2672_CR18","doi-asserted-by":"crossref","unstructured":"Chen, Z., Sun, W., Tian, Y., Jia, J., Zhang, Z., Wang, J., Huang, R., Min, X., Zhai, G., & Zhang, W. (2024). Gaia: Rethinking action quality assessment for ai-generated videos. In Advances in neural information processing systems.","DOI":"10.52202\/079017-1267"},{"key":"2672_CR19","doi-asserted-by":"crossref","unstructured":"Chen, L., Zhang, J., Wu, W., Han, C., & Gao, H. (2024). Long video scoring method fusing high-precision pose and spatio-temporal attention modules. Asia-pacific web and web-age information management joint international conference on web and big data (pp. 466\u2013475). Springer.","DOI":"10.1007\/978-981-97-7232-2_31"},{"key":"2672_CR20","unstructured":"Chen, R., Zheng, G., Yang, X., Chen, Z., Shu, J., Yang, W., Zhu, K., & Feng, C. (2024). Unlabeled action quality assessment based on multi-dimensional adaptive constrained dynamic time warping. arXiv preprint arXiv:2410.14161."},{"key":"2672_CR21","doi-asserted-by":"crossref","first-page":"2846","DOI":"10.1007\/s11263-021-01486-4","volume":"129","author":"X Chen","year":"2021","unstructured":"Chen, X., Pang, A., Yang, W., Ma, Y., Xu, L., & Sportscap, J. Y. (2021). Monocular 3d human motion capture and fine-grained understanding in challenging sports videos. International Journal of Computer Vision,129, 2846\u20132864.","journal-title":"International Journal of Computer Vision"},{"key":"2672_CR22","doi-asserted-by":"crossref","unstructured":"Cui, W.-B., Song, W.-A., Pei, Z.-T., Lei, Y., Wang, Q., Chen, Y.-J., & Yang, J.-J. (2023). Study on assessment methods of developmental coordination disorder in children. In IEEE annual computers, software, and applications conference, pp. 1507\u20131512. IEEE.","DOI":"10.1109\/COMPSAC57700.2023.00232"},{"key":"2672_CR23","unstructured":"Dadashzadeh, A. (2024). Learning strategies for parkinson\u2019s disease severity assessment. Thesis."},{"key":"2672_CR24","doi-asserted-by":"crossref","unstructured":"Dadashzadeh, A., Duan, S., Whone, A., & Mirmehdi, M. (2024). Pecop: Parameter efficient continual pretraining for action quality assessment. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp. 42\u201352.","DOI":"10.1109\/WACV57701.2024.00012"},{"key":"2672_CR25","unstructured":"De la Torre Frade, F., Hodgins, J. K., Bargteil, A. W., Artal, X. M., Macey, J. C., Castells, A. C. I., & Beltran, J. (2008). Guide to the carnegie mellon university multimodal activity (cmu-mmac) database. Technical Report CMU-RI-TR-08-22, Pittsburgh, PA."},{"key":"2672_CR26","doi-asserted-by":"crossref","unstructured":"Ding, X., Xiaowei, X., & Li, X. (2023). Sedskill: Surgical events driven method for skill assessment from thoracoscopic surgical videos. In International conference on medical image computing and computer-assisted intervention, pp. 35\u201345. Springer.","DOI":"10.1007\/978-3-031-43996-4_4"},{"key":"2672_CR27","doi-asserted-by":"crossref","unstructured":"Ding, Y., Zhang, S., Shenglan, L., Zhang, J., Chen, W., Haifei, D., Dong, B., & Sun, T. (2024). 2m-af: A strong multi-modality framework for human action quality assessment with self-supervised representation learning. In Proceedings of the acm international conference on multimedia, pp. 1564\u20131572.","DOI":"10.1145\/3664647.3681084"},{"key":"2672_CR28","unstructured":"Dong, X., Liu, X., Li, W., Adeyemi-Ejeye, A., & Gilbert, A. (2024). Interpretable long-term action quality assessment. arXiv preprint arXiv:2408.11687."},{"key":"2672_CR29","doi-asserted-by":"crossref","unstructured":"Dong, L., Wang, W., Qiao, Y., & Sun, X. (2024). Lucidaction: A hierarchical and multi-model dataset for comprehensive action quality assessment. In Advances in neural information processing systems.","DOI":"10.52202\/079017-3058"},{"key":"2672_CR30","volume":"229","author":"L-J Dong","year":"2021","unstructured":"Dong, L.-J., Zhang, H.-B., Shi, Q., Lei, Q., Du, J.-X., & Gao, S. (2021). Learning and fusing multiple hidden substages for action quality assessment. Knowledge-Based Systems,229, Article 107388.","journal-title":"Knowledge-Based Systems"},{"key":"2672_CR31","unstructured":"Doughty, H. R. (2021). Skill determination from long videos. Thesis."},{"key":"2672_CR32","doi-asserted-by":"crossref","unstructured":"Doughty, H., Damen, D., & Mayol-Cuevas, W. (2018). Who\u2019s better? who\u2019s best? pairwise deep ranking for skill determination. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 6057\u20136066.","DOI":"10.1109\/CVPR.2018.00634"},{"key":"2672_CR33","doi-asserted-by":"crossref","unstructured":"Doughty, H., Mayol-Cuevas, W., & Damen, D. (2019). The pros and cons: Rank-aware temporal attention for skill determination in long videos. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 7862\u20137871.","DOI":"10.1109\/CVPR.2019.00805"},{"key":"2672_CR34","doi-asserted-by":"crossref","unstructured":"Du, Z., He, D., Wang, X., & Wang, Q. (2023). Learning semantics-guided representations for scoring figure skating. IEEE transactions on multimedia.","DOI":"10.1109\/TMM.2023.3328180"},{"issue":"2","key":"2672_CR35","doi-asserted-by":"crossref","first-page":"124","DOI":"10.1198\/tast.2009.0026","volume":"63","author":"JW Emerson","year":"2009","unstructured":"Emerson, J. W., Seltzer, M., & Lin, D. (2009). Assessing judging bias: An example from the 2000 olympic games. The American Statistician,63(2), 124\u2013131.","journal-title":"The American Statistician"},{"key":"2672_CR36","doi-asserted-by":"crossref","unstructured":"Epstein, D., & Vondrick, C. (2021). Learning goals from failure. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 11194\u201311204.","DOI":"10.1109\/CVPR46437.2021.01104"},{"key":"2672_CR37","doi-asserted-by":"crossref","unstructured":"Fan, S., Wei, Y., Xia, J., & Zheng, F. (2022). Hightlight video detection in figure skating. In Chinese conference on pattern recognition and computer vision, pp. 651\u2013664. Springer.","DOI":"10.1007\/978-3-031-18913-5_50"},{"key":"2672_CR38","doi-asserted-by":"crossref","unstructured":"Fang, M., Du, X., Liu, Q., Zhou, Y., Liang, Q., & Liu, S. (2024). Which is the better teacher action? a new ranking model and dataset. In IEEE international conference on acoustics, speech and signal processing, pp. 7695\u20137699. IEEE.","DOI":"10.1109\/ICASSP48485.2024.10448158"},{"key":"2672_CR39","doi-asserted-by":"crossref","unstructured":"Fang, H., Zhou, W., & Li, H. (2023). End-to-end action quality assessment with action parsing transformer. In IEEE international conference on visual communications and image processing, pp. 1\u20135. IEEE.","DOI":"10.1109\/VCIP59821.2023.10402700"},{"key":"2672_CR40","doi-asserted-by":"crossref","unstructured":"Farabi, S., Himel, Gazzali, H. F., Hasan, M.\u00a0B., Kabir, M.\u00a0H., & Farazi, M. (2022). Improving action quality assessment using weighted aggregation. In Iberian conference on pattern recognition and image analysis, pp. 576\u2013587. Springer.","DOI":"10.1007\/978-3-031-04881-4_46"},{"key":"2672_CR41","doi-asserted-by":"crossref","unstructured":"Farha, Y.\u00a0A. & Gall, J. (2019). Ms-tcn: Multi-stage temporal convolutional network for action segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3575\u20133584.","DOI":"10.1109\/CVPR.2019.00369"},{"key":"2672_CR42","doi-asserted-by":"crossref","unstructured":"Freire-Obreg\u00f3n, D., Lorenzo-Navarro, J., Santana, O. J., Hern\u00e1ndez-Sosa, D., & Castrill\u00f3n-Santana, M. (2022). Towards cumulative race time regression in sports: I3d convnet transfer learning in ultra-distance running events. In International conference on pattern recognition, pp. 805\u2013811. IEEE.","DOI":"10.1109\/ICPR56361.2022.9956174"},{"key":"2672_CR43","doi-asserted-by":"crossref","unstructured":"Freire-Obreg\u00f3n, D., Lorenzo-Navarro, J., Santana, O. J., Hern\u00e1ndez-Sosa, D., & Castrill\u00f3n-Santana, M. (2023). An x3d neural network analysis for runner\u2019s performance assessment in a wild sporting environment. In International conference on machine vision and applications, pp. 1\u20135. IEEE.","DOI":"10.23919\/MVA57639.2023.10215918"},{"key":"2672_CR44","doi-asserted-by":"crossref","unstructured":"Gallardo, U., Caro, F., Hern\u00e1ndez, E., Espinosa, R., & Ochoa-Ruiz, G. (2024). Gymetricpose: A light-weight angle-based graph adaptation for action quality assessment. In IEEE international symposium on computer-based medical systems, pp. 43\u201350. IEEE.","DOI":"10.1109\/CBMS61543.2024.00016"},{"key":"2672_CR45","doi-asserted-by":"crossref","unstructured":"Gan, Z., Jin, L., Cheng, Y., Cheng, Y., Teng, Y., Li, Z., Li, Y., Yang, W., Zhu, Z., & Xing, J. (2024). Skatingverse: A large-scale benchmark for comprehensive evaluation on human action understanding. IET computer vision.","DOI":"10.1049\/cvi2.12287"},{"key":"2672_CR46","doi-asserted-by":"crossref","unstructured":"Ganesh, Y., Sri\u00a0Teja, A., Munnangi, S.\u00a0K., & Rama\u00a0Murthy, G. (2019). A novel framework for fine grained action recognition in soccer. In Advances in computational intelligence, pp. 137\u2013150. Springer.","DOI":"10.1007\/978-3-030-20518-8_12"},{"key":"2672_CR47","doi-asserted-by":"crossref","unstructured":"Gao,H., Yu, S., Iqbal, M., & Guizani, M. (2024). Resfnn: Residual structure-based feedforward neural network for action quality assessment in sports consumer electronics. IEEE transactions on consumer electronics.","DOI":"10.1109\/TCE.2024.3482560"},{"key":"2672_CR48","doi-asserted-by":"crossref","unstructured":"Gao, J., Zheng, W.-S., Pan, J.-H., Gao, C., Wang, Y., Zeng, W., & Lai, J. (2020). An asymmetric modeling for action assessment. In European conference on computer vision, pp. 222\u2013238. Springer.","DOI":"10.1007\/978-3-030-58577-8_14"},{"issue":"3","key":"2672_CR49","doi-asserted-by":"crossref","first-page":"659","DOI":"10.1007\/s11263-022-01695-5","volume":"131","author":"J Gao","year":"2023","unstructured":"Gao, J., Pan, J.-H., Zhang, S.-J., & Zheng, W.-S. (2023). Automatic modelling for interactive action assessment. International Journal of Computer Vision,131(3), 659\u2013679.","journal-title":"International Journal of Computer Vision"},{"key":"2672_CR50","first-page":"3","volume":"3","author":"Y Gao","year":"2014","unstructured":"Gao, Y., Vedula, S. S., Reiley, C. E., Ahmidi, N., Varadarajan, B., Lin, H. C., Tao, L., Zappella, L., B\u00e9jar, B., & Yuh, D. D. (2014). Jhu-isi gesture and skill assessment working set (jigsaws): A surgical activity dataset for human motion modeling. In Medical Image Computing and Computer Assisted Intervention Workshop,3, 3.","journal-title":"In Medical Image Computing and Computer Assisted Intervention Workshop"},{"key":"2672_CR51","doi-asserted-by":"crossref","unstructured":"Gedamu, Kumie, Ji, Yanli, Yang, Yang, Shao, Jie, & Shen, Heng Tao. (2024). Self-supervised subaction parsing network for semi-supervised action quality assessment. IEEE transactions on image processing.","DOI":"10.1109\/TIP.2024.3468870"},{"key":"2672_CR52","doi-asserted-by":"crossref","unstructured":"Gedamu, K., Ji, Y., Yang, Y., Shao, J., & Shen, H.\u00a0T. (2024). Visual-semantic alignment temporal parsing for action quality assessment. IEEE transactions on circuits and systems for video technology.","DOI":"10.1109\/TCSVT.2024.3487242"},{"key":"2672_CR53","doi-asserted-by":"crossref","first-page":"6386","DOI":"10.1109\/TIP.2023.3331212","volume":"32","author":"K Gedamu","year":"2023","unstructured":"Gedamu, K., Ji, Y., Yang, Y., Shao, J., & Shen, H. T. (2023). Fine-grained spatio-temporal parsing network for action quality assessment. IEEE Transactions on Image Processing,32, 6386\u20136400.","journal-title":"IEEE Transactions on Image Processing"},{"issue":"2","key":"2672_CR54","doi-asserted-by":"crossref","first-page":"185","DOI":"10.1001\/jamasurg.2023.6262","volume":"159","author":"ED Goodman","year":"2024","unstructured":"Goodman, E. D., Patel, K. K., Zhang, Y., Locke, W., Kennedy, C. J., Mehrotra, R., Ren, S., Guan, M., Zohar, O., Downing, M., et al. (2024). Analyzing surgical technique in diverse open surgical videos with multitask machine learning. JAMA surgery,159(2), 185\u2013192.","journal-title":"JAMA surgery"},{"key":"2672_CR55","first-page":"541","volume":"2","author":"AS Gordon","year":"1995","unstructured":"Gordon, A. S. (1995). Automated video assessment of human performance. Proceedings of AI-ED,2, 541\u2013546.","journal-title":"Proceedings of AI-ED"},{"key":"2672_CR56","doi-asserted-by":"crossref","unstructured":"Grauman, K., Westbury, A., Torresani, L., Kitani, K., Malik, J., Afouras, T., Ashutosh, K., Baiyya, V., Bansal, S., & Boote, B. (2024). Ego-exo4d: Understanding skilled human activity from first-and third-person perspectives. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 19383\u201319400.","DOI":"10.1109\/CVPR52733.2024.01834"},{"issue":"4","key":"2672_CR57","first-page":"1","volume":"53","author":"R Guo","year":"2020","unstructured":"Guo, R., Cheng, L., Li, J., Hahn, P. R., & Liu, H. (2020). A survey of learning causality with data: Problems and methods. ACM Computing Surveys,53(4), 1\u201337.","journal-title":"ACM Computing Surveys"},{"key":"2672_CR58","doi-asserted-by":"crossref","unstructured":"Han, R., Zhou, K., Atapour-Abarghouei, A., Liang, X., & Shum, H. P. H. (2025). Finecausal: A causal-based framework for interpretable fine-grained action quality assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 6018\u20136027.","DOI":"10.1109\/CVPRW67362.2025.00599"},{"issue":"1","key":"2672_CR59","doi-asserted-by":"crossref","first-page":"21","DOI":"10.3390\/systems11010021","volume":"11","author":"C Han","year":"2023","unstructured":"Han, C., Shen, F., Chen, L., Lian, X., Gou, H., & Gao, H. (2023). Mla-lstm: A local and global location attention lstm learning model for scoring figure skating. Systems,11(1), 21.","journal-title":"Systems"},{"key":"2672_CR60","doi-asserted-by":"crossref","unstructured":"Hao, N., Ruan, S., Song, Y., Chen, J., & Tian, L. (2023). The establishment of a precise intelligent evaluation system for sports events: Diving. Heliyon,9(11).","DOI":"10.1016\/j.heliyon.2023.e21361"},{"key":"2672_CR61","doi-asserted-by":"crossref","unstructured":"He, T., Chen, Y., Wang, L., & Cheng, H. (2024). An expert-knowledge-based graph convolutional network for skeleton-based physical rehabilitation exercises assessment. IEEE transactions on neural systems and rehabilitation engineering.","DOI":"10.1109\/TNSRE.2024.3400790"},{"key":"2672_CR62","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 770\u2013778.","DOI":"10.1109\/CVPR.2016.90"},{"issue":"1","key":"2672_CR63","doi-asserted-by":"crossref","first-page":"96","DOI":"10.26555\/ijain.v9i1.919","volume":"9","author":"I Hipiny","year":"2023","unstructured":"Hipiny, I., Ujir, H., Alias, A. A., Shanat, M., & Ishak, M. K. (2023). Who danced better? ranked tiktok dance video dataset and pairwise action quality assessment method. International Journal of Advances in Intelligent Informatics,9(1), 96\u2013107.","journal-title":"International Journal of Advances in Intelligent Informatics"},{"key":"2672_CR64","unstructured":"Hirosawa, S. (2024). Computer vision-based action quality assessment incorporating human expert\u2019s knowledge: Focusing on the figure skating jump. Thesis."},{"key":"2672_CR65","doi-asserted-by":"crossref","unstructured":"Hirosawa, S., Yamashita, T., & Aoki, Y. (2023). Expert\u2019s gaze-based prediction model for assessing the quality of figure skating jumps. In International symposium on computer science in sport, pp. 42\u201352. Springer.","DOI":"10.1007\/978-981-97-2898-5_5"},{"issue":"22","key":"2672_CR66","doi-asserted-by":"crossref","first-page":"9282","DOI":"10.3390\/s23229282","volume":"23","author":"S Hirosawa","year":"2023","unstructured":"Hirosawa, S., Kato, T., Yamashita, T., & Aoki, Y. (2023). Action quality assessment model using specialists\u2019 gaze location and kinematics data-focusing on evaluating figure skating jumps. Sensors,23(22), 9282.","journal-title":"Sensors"},{"issue":"4","key":"2672_CR67","doi-asserted-by":"crossref","first-page":"470","DOI":"10.1080\/02640414.2021.1997407","volume":"40","author":"S Hirosawa","year":"2022","unstructured":"Hirosawa, S., Watanabe, M., & Aoki, Y. (2022). Determinant analysis and developing evaluation indicators of grade of execution score of double axel jump in figure skating. Journal of Sports Sciences,40(4), 470\u2013481.","journal-title":"Journal of Sports Sciences"},{"issue":"8","key":"2672_CR68","doi-asserted-by":"crossref","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., & Schmidhuber, J. (1997). Long short-term memory. Neural Comput.,9(8), 1735\u20131780.","journal-title":"Neural Comput."},{"key":"2672_CR69","doi-asserted-by":"crossref","unstructured":"Huang, Y., Chen, G., Xu, J., Zhang, M., Yang, L., Pei, B., Zhang, H., Dong, L., Wang, Y., & Wang, L. (2024). Egoexolearn: A dataset for bridging asynchronous ego-and exo-centric view of procedural activities in real world. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 22072\u201322086.","DOI":"10.1109\/CVPR52733.2024.02084"},{"key":"2672_CR70","doi-asserted-by":"crossref","unstructured":"Huang, Y., Yuan, Y., Zeng, X., Xie, L., Fu, Y., Yue, G., & Zhao, B. (2024). Full-reference motion quality assessment based on efficient monocular parametric 3d human body reconstruction. In IEEE international conference on multimedia and expo, pp. 1\u20136. IEEE.","DOI":"10.1109\/ICME57554.2024.10687714"},{"key":"2672_CR71","doi-asserted-by":"crossref","first-page":"8869","DOI":"10.1609\/aaai.v39i8.32959","volume":"39","author":"X Huangbiao","year":"2025","unstructured":"Huangbiao, X., Ke, X., Huanqi, W., Rui, X., Li, Y., Peirong, X., & Guo, W. (2025). Dancefix: An exploration in group dance neatness assessment through fixing abnormal challenges of human pose. In Proceedings of the AAAI Conference on Artificial Intelligence,39, 8869\u20138877.","journal-title":"In Proceedings of the AAAI Conference on Artificial Intelligence"},{"issue":"4","key":"2672_CR72","doi-asserted-by":"crossref","first-page":"3245","DOI":"10.1007\/s10489-024-05349-6","volume":"54","author":"F Huang","year":"2024","unstructured":"Huang, F., & Li, J. (2024). Assessing action quality with semantic-sequence performance regression and densely distributed sample weighting. Applied Intelligence,54(4), 3245\u20133259.","journal-title":"Applied Intelligence"},{"key":"2672_CR73","volume":"614","author":"K Huang","year":"2025","unstructured":"Huang, K., Tian, Y., Chen, Yu., & Huang, Y. (2025). Dual-referenced assistive network for action quality assessment. Neurocomputing,614, Article 128786.","journal-title":"Neurocomputing"},{"issue":"7","key":"2672_CR74","doi-asserted-by":"crossref","first-page":"1325","DOI":"10.1109\/TPAMI.2013.248","volume":"36","author":"C Ionescu","year":"2013","unstructured":"Ionescu, C., Papava, D., Olaru, V., & Sminchisescu, C. (2013). Human3. 6m: Large scale datasets and predictive methods for 3d human sensing in natural environments. IEEE Transactions on Pattern Analysis and Machine Intelligence,36(7), 1325\u20131339.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2672_CR75","unstructured":"Iyer, A., Alali, M., Bodala, H., & Vaidya, S. (2022). Action quality assessment using transformers. arXiv preprint arXiv:2207.12318."},{"key":"2672_CR76","unstructured":"Jain, H. (2020). Assessment of human actions in videos. Thesis."},{"key":"2672_CR77","doi-asserted-by":"crossref","unstructured":"Jain, H., & Harit, G. (2019). An unsupervised sequence-to-sequence autoencoder based human action scoring model. In IEEE global conference on signal and information processing, pp. 1\u20135. IEEE.","DOI":"10.1109\/GlobalSIP45357.2019.8969424"},{"issue":"6","key":"2672_CR78","doi-asserted-by":"crossref","first-page":"2260","DOI":"10.1109\/TCSVT.2020.3017727","volume":"31","author":"H Jain","year":"2021","unstructured":"Jain, H., Harit, G., & Sharma, A. (2021). Action quality assessment using siamese network-based deep metric learning. IEEE Transactions on Circuits and Systems for Video Technology,31(6), 2260\u20132273.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"key":"2672_CR79","doi-asserted-by":"crossref","unstructured":"Ji, Y., Ye, L., Huang, H., Mao, L., Zhou, Y., & Gao, L. (2023). Localization-assisted uncertainty score disentanglement network for action quality assessment. In Proceedings of the ACM international conference on multimedia, pp. 8590\u20138597.","DOI":"10.1145\/3581783.3613795"},{"key":"2672_CR80","unstructured":"Jinglin, X., Yin, S., & Peng, Y. (2025). Human-centric fine-grained action quality assessment. IEEE transactions on pattern analysis and machine intelligence."},{"key":"2672_CR81","doi-asserted-by":"crossref","unstructured":"Joung, C.-I., Byun, S., & Baek, S. (2023). Contrastive learning for action assessment using graph convolutional networks with augmented virtual joints. IEEE Access.","DOI":"10.2139\/ssrn.4236091"},{"key":"2672_CR82","doi-asserted-by":"crossref","unstructured":"Jug, M., Per\u0161, J., De\u017eman, B., & Kova\u010di\u010d, S. (2003). Trajectory based assessment of coordinated human activity. In International conference on computer vision systems, pp. 534\u2013543. Springer.","DOI":"10.1007\/3-540-36592-3_51"},{"key":"2672_CR83","doi-asserted-by":"crossref","unstructured":"Karunaratne, A., Jayasooriya, C., Deegalla, S., & Navarathna, R. (2021). Objectively measure player performance on olympic weightlifting. In International conference on information and automation for sustainability, pp. 410\u2013415. IEEE.","DOI":"10.1109\/ICIAfS52090.2021.9605963"},{"key":"2672_CR84","unstructured":"Kay, W., Carreira, J., Simonyan, K., Zhang, B., Hillier, C., Vijayanarasimhan, S., Viola, F., Green, T., Back, T., Natsev, P. et\u00a0al. (2017). The kinetics human action video dataset. arXiv preprint arXiv:1705.06950."},{"key":"2672_CR85","volume":"664","author":"X Ke","year":"2024","unstructured":"Ke, X., Xu, H., Lin, X., & Guo, W. (2024). Two-path target-aware contrastive regression for action quality assessment. Information Sciences,664, Article 120347.","journal-title":"Information Sciences"},{"key":"2672_CR86","doi-asserted-by":"crossref","unstructured":"Kim, D., Kim, TT., Lee, I., & Lee, S. (2024). Kinematic diversity and rhythmic alignment in choreographic quality transformers for dance quality assessment. IEEE transactions on circuits and systems for video technology.","DOI":"10.1109\/TCSVT.2024.3360452"},{"key":"2672_CR87","unstructured":"Kondo, S. (2024). Zeal: Surgical skill assessment with zero-shot tool inference using unified foundation model. arXiv preprint arXiv:2407.02738."},{"issue":"5","key":"2672_CR88","doi-asserted-by":"crossref","first-page":"1366","DOI":"10.1007\/s11263-022-01594-9","volume":"130","author":"Y Kong","year":"2022","unstructured":"Kong, Y., & Fu, Y. (2022). Human action recognition and prediction: A survey. International Journal of Computer Vision,130(5), 1366\u20131401.","journal-title":"International Journal of Computer Vision"},{"key":"2672_CR89","doi-asserted-by":"crossref","unstructured":"Lea, C., Flynn, M. D., Vidal, R., Reiter, A., & Hager, G. D. (2017). Temporal convolutional networks for action segmentation and detection. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 156\u2013165.","DOI":"10.1109\/CVPR.2017.113"},{"issue":"10","key":"2672_CR90","doi-asserted-by":"crossref","first-page":"7160","DOI":"10.1109\/TCSVT.2022.3178430","volume":"32","author":"K Lee","year":"2022","unstructured":"Lee, K., Park, Y., Huh, J., Kang, J., & Lee, S. (2022). Self-updatable database system based on human motion assessment framework. IEEE Transactions on Circuits and Systems for Video Technology,32(10), 7160\u20137176.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"issue":"19","key":"2672_CR91","doi-asserted-by":"crossref","first-page":"4129","DOI":"10.3390\/s19194129","volume":"19","author":"Q Lei","year":"2019","unstructured":"Lei, Q., Du, J.-X., Zhang, H.-B., Ye, S., & Chen, D.-S. (2019). A survey of vision-based human action evaluation methods. Sensors,19(19), 4129.","journal-title":"Sensors"},{"issue":"19","key":"2672_CR92","doi-asserted-by":"crossref","first-page":"21692","DOI":"10.1007\/s10489-023-04613-5","volume":"53","author":"Q Lei","year":"2023","unstructured":"Lei, Q., Li, H., Zhang, H., Jixiang, D., & Gao, S. (2023). Multi-skeleton structures graph convolutional network for action quality assessment in long videos. Applied Intelligence,53(19), 21692\u201321705.","journal-title":"Applied Intelligence"},{"issue":"7","key":"2672_CR93","doi-asserted-by":"crossref","first-page":"1575","DOI":"10.1007\/s11760-021-01890-w","volume":"15","author":"Q Lei","year":"2021","unstructured":"Lei, Q., Zhang, H., & Du, J. (2021). Temporal attention learning for action quality assessment in sports video. Signal, Image and Video Processing,15(7), 1575\u20131583.","journal-title":"Signal, Image and Video Processing"},{"issue":"4","key":"2672_CR94","doi-asserted-by":"crossref","first-page":"568","DOI":"10.3390\/electronics9040568","volume":"9","author":"Q Lei","year":"2020","unstructured":"Lei, Q., Zhang, H.-B., Ji-Xiang, D., Hsiao, T.-C., & Chen, C.-C. (2020). Learning effective skeletal representations on rgb video for fine-grained human action quality assessment. Electronics,9(4), 568.","journal-title":"Electronics"},{"key":"2672_CR95","unstructured":"Lemos\u00a0Baptista, R.\u00a0M. (2021). Human motion analysis using 3D skeleton representation in the context of real-world applications: From home-based rehabilitation to sensing in the wild. Thesis."},{"key":"2672_CR96","doi-asserted-by":"crossref","unstructured":"Li, J., Bhat, A., & Barmaki, R. (2021). Improving the movement synchrony estimation with action quality assessment in children play therapy. In Proceedings of the international conference on multimodal interaction, pp. 397\u2013406.","DOI":"10.1145\/3462244.3479891"},{"key":"2672_CR97","doi-asserted-by":"crossref","unstructured":"Li, Y., Chai, X., & Chen, X. (2018). End-to-end learning for action quality assessment. In Pacific rim conference on multimedia, pp. 125\u2013134. Springer.","DOI":"10.1007\/978-3-030-00767-6_12"},{"key":"2672_CR98","doi-asserted-by":"crossref","unstructured":"Li, Y., Chai, X., & Chen, X. (2018). Scoringnet: Learning key fragment for action quality assessment with ranking loss in skilled sports. In Asian conference on computer vision, pp. 149\u2013164. Springer.","DOI":"10.1007\/978-3-030-20876-9_10"},{"key":"2672_CR99","doi-asserted-by":"crossref","unstructured":"Li, Z., Chen, H., Cai, J, & Xue, Y. (2024). Segmentation and quality assessment of continuous fitness movements based on vision. In International conference on intelligent computing, pp. 96\u2013107. Springer.","DOI":"10.1007\/978-981-97-5612-4_9"},{"key":"2672_CR100","doi-asserted-by":"crossref","unstructured":"Li, Q., Cui, Z., Kitahara, I., & Sagawa, R. (2022). Precise gymnastic scoring from tv playback. In IEEE global conference on consumer electronics, pp. 412\u2013415. IEEE.","DOI":"10.1109\/GCCE56475.2022.10014208"},{"key":"2672_CR101","doi-asserted-by":"crossref","unstructured":"Li, J., Hu, H., Xing, Q., Wang, X., Li, J., & Shen, Y. (2022). Tai chi action quality assessment and visual analysis with a consumer rgb-d camera. In IEEE international workshop on multimedia signal processing, pp. 1\u20136. IEEE.","DOI":"10.1109\/MMSP55362.2022.9949464"},{"key":"2672_CR102","doi-asserted-by":"crossref","unstructured":"Li, Z., Huang, Y., Cai, M., & Sato, Y. (2019). Manipulation-skill assessment from videos with spatial attention network. In Proceedings of the IEEE\/CVF international conference on computer vision workshops, pp. 0\u20130.","DOI":"10.1109\/ICCVW.2019.00539"},{"key":"2672_CR103","doi-asserted-by":"crossref","unstructured":"Li, Y.-M., Huang, W.-J., Wang, A.-L., Zeng, L.-A., Meng, J.-K., & Zheng, W.-S. (2024). Egoexo-fitness: Towards egocentric and exocentric full-body action understanding. In European conference on computer vision.","DOI":"10.1007\/978-3-031-72661-3_21"},{"key":"2672_CR104","doi-asserted-by":"crossref","unstructured":"Li, H.-Y., Lei, Q., Zhang, H.-B., & Du, J.-X. (2021). Skeleton based action quality assessment of figure skating videos. In International conference on information technology in medicine and education, pp. 196\u2013200. IEEE.","DOI":"10.1109\/ITME53901.2021.00048"},{"key":"2672_CR105","unstructured":"Li, Y.-M., Wang, A.-L., Lin, K.-Y., Tang, Y.-M., Zeng, L.-A., Hu, J.-F., & Zheng, W.-S. (2024). Techcoach: Towards technical keypoint-aware descriptive action coaching. arXiv preprint arXiv:2411.17130."},{"key":"2672_CR106","doi-asserted-by":"crossref","unstructured":"Li, J., Xue, J., Cao, R., Du, X., Mo, S., Ran, K., & Zhang, Z. (2024). Finerehab: A multi-modality and multi-task dataset for rehabilitation analysis. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3184\u20133193.","DOI":"10.1109\/CVPRW63382.2024.00324"},{"key":"2672_CR107","doi-asserted-by":"crossref","unstructured":"Li, Y.-M., Zeng, L.-A., Meng, J.-K, & Zheng, W.-S. (2024). Continual action assessment via task-consistent score-discriminative feature distribution modeling. IEEE transactions on circuits and systems for video technology.","DOI":"10.1109\/TCSVT.2024.3396692"},{"key":"2672_CR108","doi-asserted-by":"crossref","unstructured":"Li, M., Zhang, H.-B., Lei, Q., Fan, Z., Liu, J., & Du, J.-X. (2022). Pairwise contrastive learning network for action quality assessment. In European conference on computer vision, pp. 457\u2013473. Springer.","DOI":"10.1007\/978-3-031-19772-7_27"},{"key":"2672_CR109","unstructured":"Li, C., Zhu, Q., Liu, T., Tang, J., & Su, Y. (2022). Hand hygiene assessment via joint step segmentation and key action scorer. arXiv preprint arXiv:2209.12221."},{"issue":"24","key":"2672_CR110","doi-asserted-by":"crossref","first-page":"30443","DOI":"10.1007\/s10489-023-05166-3","volume":"53","author":"P-X Lian","year":"2023","unstructured":"Lian, P.-X., & Shao, Z.-G. (2023). Improving action quality assessment with across-staged temporal reasoning on imbalanced data. Applied Intelligence,53(24), 30443\u201330454.","journal-title":"Applied Intelligence"},{"key":"2672_CR111","volume":"89","author":"H Li","year":"2022","unstructured":"Li, H., Lei, Q., Zhang, H., Jixiang, D., & Gao, S. (2022). Skeleton-based deep pose feature learning for action quality assessment on figure skating videos. Journal of Visual Communication and Image Representation,89, Article 103625.","journal-title":"Journal of Visual Communication and Image Representation"},{"issue":"10","key":"2672_CR112","doi-asserted-by":"crossref","first-page":"1813","DOI":"10.3390\/electronics13101813","volume":"13","author":"X Lin","year":"2024","unstructured":"Lin, X., Liu, Y., Feng, C., Chen, Z., Yang, X., & Cui, H. (2024). Automatic evaluation method for functional movement screening based on multi-scale lightweight 3d convolution and an encoder\u2013decoder. Electronics,13(10), 1813.","journal-title":"Electronics"},{"key":"2672_CR113","volume":"80","author":"J Li","year":"2021","unstructured":"Li, J., Qingrui, H., Guo, T., Wang, S., & Shen, Y. (2021). What and how well you exercised? an efficient analysis framework for fitness actions. Journal of Visual Communication and Image Representation,80, Article 103304.","journal-title":"Journal of Visual Communication and Image Representation"},{"key":"2672_CR114","unstructured":"Liu, H.-C., & King, C.-T. (2019). A low-cost virtual coach for diagnosis and guidance in baseball\/softball batting training. In International conference on systems."},{"key":"2672_CR115","doi-asserted-by":"crossref","unstructured":"Liu, Y., Cheng, X., & Ikenaga, T. (2023). A figure skating jumping dataset for replay-guided action quality assessment. In Proceedings of the ACM international conference on multimedia, pp. 2437\u20132445.","DOI":"10.1145\/3581783.3613774"},{"key":"2672_CR116","doi-asserted-by":"crossref","unstructured":"Liu, Y., Cheng, X., & Ikenaga, T. (2024). A hierarchical joint training based replay-guided contrastive transformer for action quality assessment of figure skating. IEICE Transactions on Fundamentals of Electronics, Communications and Computer Sciences.","DOI":"10.1587\/transfun.2024SMP0003"},{"key":"2672_CR117","unstructured":"Liu, S.-L., Ding, Y.-N., Zhang, S.-F., Chen, W.-Y., Zhou, N., Liu, H., & Lao, G.-H. (2023). Fine-grained action analysis: A multi-modality and multi-task dataset of figure skating. arXiv preprint arXiv:2307.02730."},{"key":"2672_CR118","doi-asserted-by":"crossref","unstructured":"Liu, D., Li, Q., Jiang, T., Wang, Y., Miao, R., Shan, F., & Li, Z. (2021). Towards unified surgical skill assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 9522\u20139531.","DOI":"10.1109\/CVPR46437.2021.00940"},{"key":"2672_CR119","doi-asserted-by":"crossref","unstructured":"Liu, Z., Ning, J., Cao, Y., Wei, Y., Zhang, Z., Lin, S., & Hu, H. (2022). Video swin transformer. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3202\u20133211.","DOI":"10.1109\/CVPR52688.2022.00320"},{"key":"2672_CR120","doi-asserted-by":"crossref","unstructured":"Liu, J., Wang, H., Stawarz, K., Li, S., Fu, Y., & Liu, H. (2024). Vision-based human action quality assessment: A systematic review. Expert Systems with applications, pp. 125642.","DOI":"10.1016\/j.eswa.2024.125642"},{"key":"2672_CR121","doi-asserted-by":"crossref","unstructured":"Liu, J., Wang, H., Zhou, W., Stawarz, K., Corcoran, P., Chen, Y., & Liu, H. (2025). Adaptive spatiotemporal graph transformer network for action quality assessment. IEEE transactions on circuits and systems for video technology.","DOI":"10.1109\/TCSVT.2025.3541456"},{"key":"2672_CR122","doi-asserted-by":"crossref","unstructured":"Liu, L., Zhai, P., Zheng, D., & Fang, Y. (2023). Multi-stage action quality assessment method. In Proceedings of the international conference on control, robotics and intelligent system, pp. 116\u2013122.","DOI":"10.1145\/3622896.3622916"},{"key":"2672_CR123","doi-asserted-by":"crossref","first-page":"360","DOI":"10.1016\/j.neucom.2020.06.108","volume":"413","author":"S Liu","year":"2020","unstructured":"Liu, S., Liu, X., Huang, G., Qiao, H., Hu, L., Jiang, D., Zhang, A., Liu, Y., & Guo, G. (2020). Fsd-10: A fine-grained classification dataset for figure skating. Neurocomputing,413, 360\u2013367.","journal-title":"Neurocomputing"},{"issue":"2","key":"2672_CR124","doi-asserted-by":"crossref","first-page":"1963","DOI":"10.1007\/s40747-022-00892-6","volume":"9","author":"M-Z Li","year":"2023","unstructured":"Li, M.-Z., Zhang, H.-B., Dong, L.-J., Lei, Q., & Ji-Xiang, D. (2023). Gaussian guided frame sequence encoder network for action quality assessment. Complex & Intelligent Systems,9(2), 1963\u20131974.","journal-title":"Complex & Intelligent Systems"},{"key":"2672_CR125","unstructured":"Louis, N. (2024). Improving articulated pose tracking and contact force estimation for qualitative assessment of human actions. Thesis."},{"key":"2672_CR126","doi-asserted-by":"crossref","unstructured":"Luo, Z., Xiao, Y., Yang, F., Zhou, J. T., & Fang, Z. (2024). Rhythmer: Ranking-based skill assessment with rhythm-aware transformer. IEEE Transactions on Circuits and Systems for Video Technology.","DOI":"10.1109\/TCSVT.2024.3459938"},{"key":"2672_CR127","doi-asserted-by":"crossref","unstructured":"Majeedi, A., Gajjala, V.\u00a0R., GNVV, S. S. S.\u00a0N., & Li, Y. (2024). Rica2: Rubric-informed, calibrated assessment of actions. arXiv preprint arXiv:2408.02138.","DOI":"10.1007\/978-3-031-73036-8_9"},{"key":"2672_CR128","doi-asserted-by":"crossref","unstructured":"Matsuyama, H., Kawaguchi, N., & Lim, B.\u00a0Y. (2023). Iris: Interpretable rubric-informed segmentation for action quality assessment. In Proceedings of the international conference on intelligent user interfaces, pp. 368\u2013378.","DOI":"10.1145\/3581641.3584048"},{"key":"2672_CR129","doi-asserted-by":"crossref","unstructured":"Millan, M., & Achard, C. (2020). Fine-tuning siamese networks to assess sport gestures quality. In International joint conference on computer vision, imaging and computer graphics theory and applications, pp. 57\u201365.","DOI":"10.5220\/0008924600570065"},{"key":"2672_CR130","doi-asserted-by":"crossref","unstructured":"Moodley, T., & van der Haar, D. (2022). Casa: Cricket action similarity assessment in video footage using deep metric learning. In Southern African conference for artificial intelligence research, pp. 139\u2013153. Springer.","DOI":"10.1007\/978-3-031-22321-1_10"},{"key":"2672_CR131","doi-asserted-by":"crossref","unstructured":"Moodley, T., & Van Der Haar, D. (2025). I3d-ae-lstm: A 2-stream autoencoder for action quality assessment using a newly created cricket batsman video dataset. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp. 5470\u20135478. IEEE.","DOI":"10.1109\/WACV61041.2025.00534"},{"issue":"3","key":"2672_CR132","doi-asserted-by":"crossref","first-page":"1014","DOI":"10.1111\/ecin.12074","volume":"52","author":"HN Morgan","year":"2014","unstructured":"Morgan, H. N., & Rotthoff, K. W. (2014). The harder the task, the higher the score: Findings of a difficulty bias. Economic Inquiry,52(3), 1014\u20131026.","journal-title":"Economic Inquiry"},{"key":"2672_CR133","doi-asserted-by":"crossref","DOI":"10.1016\/j.compbiomed.2023.107420","volume":"165","author":"Y Mourchid","year":"2023","unstructured":"Mourchid, Y., & Slama, R. (2023). D-stgcnt: A dense spatio-temporal graph conv-gru network based on transformer for assessment of patient physical rehabilitation. Computers in Biology and Medicine,165, Article 107420.","journal-title":"Computers in Biology and Medicine"},{"key":"2672_CR134","doi-asserted-by":"crossref","first-page":"37749","DOI":"10.1109\/ACCESS.2023.3265595","volume":"11","author":"P Murthy","year":"2023","unstructured":"Murthy, P., Taetz, B., Lekhra, A., & Stricker, D. (2023). Divenet: Dive action localization and physical pose parameter extraction for high performance training. IEEE Access,11, 37749\u201337767.","journal-title":"IEEE Access"},{"key":"2672_CR135","doi-asserted-by":"crossref","unstructured":"Nagai, T., Takeda, S., Matsumura, M., Shimizu, S., & Yamamoto, S. (2021). Action quality assessment with ignoring scene context. In IEEE international conference on image processing, pp. 1189\u20131193. IEEE.","DOI":"10.1109\/ICIP42928.2021.9506257"},{"key":"2672_CR136","doi-asserted-by":"crossref","unstructured":"Nagai, T., Takeda, S., Suzuki, S., & Seshimo, H. (2024). Mmw-aqa: Multimodal in-the-wild dataset for action quality assessment. IEEE Access.","DOI":"10.1109\/ACCESS.2024.3423462"},{"key":"2672_CR137","unstructured":"Nekoui, M. (2022). Intelligent video-based quality assessment of human activities. Thesis."},{"key":"2672_CR138","doi-asserted-by":"crossref","unstructured":"Nekoui, M., Cruz, F. O. T., & Cheng, L. (2020). Falcons: Fast learner-grader for contorted poses in sports. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition workshops, pp. 900\u2013901.","DOI":"10.1109\/CVPRW50498.2020.00458"},{"key":"2672_CR139","doi-asserted-by":"crossref","unstructured":"Nekoui, M., Cruz, F. O. T., & Cheng, L. (2021). Eagle-eye: Extreme-pose action grader using detail bird\u2019s-eye view. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp. 394\u2013402.","DOI":"10.1109\/WACV48630.2021.00044"},{"key":"2672_CR140","doi-asserted-by":"crossref","unstructured":"Ogata, R., Simo-Serra, E., Iizuka, S., & Ishikawa, H. (2019). Temporal distance matrices for squat classification. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition workshops, pp. 0\u20130.","DOI":"10.1109\/CVPRW.2019.00309"},{"key":"2672_CR141","doi-asserted-by":"crossref","unstructured":"Okamoto, L., & Parmar, P. (2024). Hierarchical neurosymbolic approach for comprehensive and explainable action quality assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3204\u20133213.","DOI":"10.1109\/CVPRW63382.2024.00326"},{"key":"2672_CR142","doi-asserted-by":"crossref","unstructured":"Page, M. J., McKenzie, J. E., Bossuyt, P. M., Boutron, I., Hoffmann, T. C., Mulrow, C. D., Shamseer, L., Tetzlaff, J. M., Akl, E. A., Brennan, S. E., et\u00a0al. (2021). The prisma 2020 statement: An updated guideline for reporting systematic reviews. BMJ, 372.","DOI":"10.1136\/bmj.n71"},{"key":"2672_CR143","doi-asserted-by":"crossref","unstructured":"Pan, J.-H., Gao, J., & Zheng, W.-S. (2019). Action assessment by joint relation graphs. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 6331\u20136340.","DOI":"10.1109\/ICCV.2019.00643"},{"key":"2672_CR144","doi-asserted-by":"crossref","unstructured":"Pan, Y., Zhang, C., & Bertasius, G. (2025). Basket: A large-scale video dataset for fine-grained skill estimation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 28952\u201328962.","DOI":"10.1109\/CVPR52734.2025.02696"},{"issue":"12","key":"2672_CR145","doi-asserted-by":"crossref","first-page":"8779","DOI":"10.1109\/TPAMI.2021.3126534","volume":"44","author":"J-H Pan","year":"2022","unstructured":"Pan, J.-H., Gao, J., & Zheng, W.-S. (2022). Adaptive action assessment. IEEE Transactions on Pattern Analysis and Machine Intelligence,44(12), 8779\u20138795.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2672_CR146","doi-asserted-by":"crossref","unstructured":"Parmar, P. (2019). On action quality assessment. Thesis.","DOI":"10.1109\/WACV.2019.00161"},{"key":"2672_CR147","doi-asserted-by":"crossref","unstructured":"Parmar, P., & Morris, B. T. (2016). Measuring the quality of exercises. In International conference of the IEEE engineering in medicine and biology society, pp. 2241\u20132244. IEEE.","DOI":"10.1109\/EMBC.2016.7591175"},{"key":"2672_CR148","doi-asserted-by":"crossref","unstructured":"Parmar, P., & Morris, B. (2019). Action quality assessment across multiple actions. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp. 1468\u20131476. IEEE.","DOI":"10.1109\/WACV.2019.00161"},{"key":"2672_CR149","doi-asserted-by":"crossref","unstructured":"Parmar, P., & Morris, B. T. (2019). What and how well you performed? a multitask learning approach to action quality assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 304\u2013313.","DOI":"10.1109\/CVPR.2019.00039"},{"key":"2672_CR150","doi-asserted-by":"crossref","unstructured":"Parmar, P., & Morris, B. (2022). Win-fail action recognition. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp. 161\u2013171.","DOI":"10.1109\/WACVW54805.2022.00022"},{"key":"2672_CR151","doi-asserted-by":"crossref","unstructured":"Parmar, P., & Tran Morris, B. (2017). Learning to score olympic events. In Proceedings of the IEEE conference on computer vision and pattern recognition workshops, pp. 20\u201328.","DOI":"10.1109\/CVPRW.2017.16"},{"key":"2672_CR152","doi-asserted-by":"crossref","unstructured":"Parmar, P., Gharat, A., & Rhodin, H. (2022). Domain knowledge-informed self-supervised representations for workout form assessment. In European conference on computer vision, pp. 105\u2013123. Springer.","DOI":"10.1007\/978-3-031-19839-7_7"},{"key":"2672_CR153","doi-asserted-by":"crossref","unstructured":"Parmar, P., Peh, E., & Fernando, B. (2024). Learning to visually connect actions and their effects. arXiv preprint arXiv:2401.10805.","DOI":"10.1109\/WACV61041.2025.00151"},{"key":"2672_CR154","doi-asserted-by":"crossref","unstructured":"Parmar, P., Reddy, J., & Morris, B. (2021). Piano skills assessment. In IEEE international workshop on multimedia signal processing, pp. 1\u20135. IEEE.","DOI":"10.1109\/MMSP53017.2021.9733638"},{"issue":"3","key":"2672_CR155","doi-asserted-by":"crossref","first-page":"604","DOI":"10.3390\/signals2030037","volume":"2","author":"P Parmar","year":"2021","unstructured":"Parmar, P., & Morris, B. (2021). Hallucinet-ing spatiotemporal representations using a 2d-cnn. Signals,2(3), 604\u2013618.","journal-title":"Signals"},{"key":"2672_CR156","unstructured":"Parsa, B. (2020). Deep learning methods for video-based human activity recognition in industrial settings. Thesis."},{"key":"2672_CR157","doi-asserted-by":"crossref","unstructured":"Parsa, B., & Banerjee, A. G. (2021). A multi-task learning approach for human activity segmentation and ergonomics risk assessment. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp. 2352\u20132362.","DOI":"10.1109\/WACV48630.2021.00240"},{"key":"2672_CR158","doi-asserted-by":"crossref","unstructured":"Pirsiavash, H., Vondrick, C., & Torralba, A. (2014). Assessing the quality of actions. In European conference on computer vision, pp. 556\u2013571. Springer.","DOI":"10.1007\/978-3-319-10599-4_36"},{"key":"2672_CR159","doi-asserted-by":"crossref","unstructured":"Qiu, Z., Yao, T., & Mei, T. (2017). Learning spatio-temporal representation with pseudo-3d residual networks. In Proceedings of the IEEE international conference on computer vision, pp. 5533\u20135541.","DOI":"10.1109\/ICCV.2017.590"},{"key":"2672_CR160","volume":"72","author":"Y Qiu","year":"2022","unstructured":"Qiu, Y., Wang, J., Jin, Z., Chen, H., Zhang, M., & Guo, L. (2022). Pose-guided matching based on deep learning for assessing quality of action on rehabilitation training. Biomedical Signal Processing and Control,72, Article 103323.","journal-title":"Biomedical Signal Processing and Control"},{"key":"2672_CR161","doi-asserted-by":"crossref","unstructured":"Roditakis, K., Makris, A., & Argyros, A. (2021). Towards improved and interpretable action quality assessment with self-supervised alignment. In Proceedings of the PErvasive technologies related to assistive environments conference, pp. 507\u2013513.","DOI":"10.1145\/3453892.3461624"},{"key":"2672_CR162","doi-asserted-by":"crossref","unstructured":"Sardari, F., Paiement, A., & Mirmehdi, M. (2019). View-invariant pose analysis for human movement assessment from rgb data. In Image analysis and processing, pp. 237\u2013248. Springer.","DOI":"10.1007\/978-3-030-30645-8_22"},{"issue":"18","key":"2672_CR163","doi-asserted-by":"crossref","first-page":"5258","DOI":"10.3390\/s20185258","volume":"20","author":"F Sardari","year":"2020","unstructured":"Sardari, F., Paiement, A., Hannuna, S., & Mirmehdi, M. (2020). Vi-net-view-invariant quality of human movement assessment. Sensors,20(18), 5258.","journal-title":"Sensors"},{"key":"2672_CR164","doi-asserted-by":"crossref","unstructured":"Sener, F., Chatterjee, D., Shelepov, D., He, K., Singhania, D., Wang, R., & Yao, A. (2022). Assembly101: A large-scale multi-view video dataset for understanding procedural activities. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 21096\u201321106.","DOI":"10.1109\/CVPR52688.2022.02042"},{"key":"2672_CR165","doi-asserted-by":"crossref","unstructured":"Seo, C., Sabanai, M., Goto, Y., Tagami, K., Ogata, H., Kanosue, K., & Ohya, J. (2021). Extracting and interpreting unknown factors with classifier for foot strike types in running. In International conference on pattern recognition, pp. 3217\u20133224. IEEE.","DOI":"10.1109\/ICPR48806.2021.9413118"},{"key":"2672_CR166","doi-asserted-by":"crossref","unstructured":"Shen, Y.-Y., Xing, Q.-J., & Shen, Y.-F. (2024). Markerless vision-based functional movement screening movements evaluation with deep neural networks. Iscience, 27(1).","DOI":"10.1016\/j.isci.2023.108705"},{"key":"2672_CR167","doi-asserted-by":"crossref","unstructured":"Siow, C. Z., Chin, W. H., & Kubota, N. (2023). Evaluating simple exercises with a fuzzy system based on human skeleton poses. In IEEE international conference on fuzzy systems, pp. 1\u20136. IEEE.","DOI":"10.1109\/FUZZ52849.2023.10309722"},{"key":"2672_CR168","doi-asserted-by":"crossref","unstructured":"Soman, K., Rose, P.\u00a0W., Morris, J.\u00a0H., Akbas, R.\u00a0E., Smith, B., Peetoom, B., Villouta-Reyes, C., Cerono, G., Shi, Y., Rizk-Jackson, A., et\u00a0al. (2023). Biomedical knowledge graph-enhanced prompt generation for large language models. arXiv preprint arXiv:2311.17330.","DOI":"10.1093\/bioinformatics\/btae560"},{"key":"2672_CR169","doi-asserted-by":"crossref","unstructured":"Sun, W., Hu, Y., Zhang, B., Chen, X., Hao, C., & Gao, Y. (2023). A novel blind action quality assessment based on multi-headed gru network and attention mechanism. In International conference on artificial intelligence, automation, and high-performance computing, vol. 12717, pp. 835\u2013843. SPIE.","DOI":"10.1117\/12.2685368"},{"key":"2672_CR170","doi-asserted-by":"crossref","unstructured":"Tang, Y., Liu, J., Liu, A., Yang, B., Dai, W., Rao, Y., Lu, J., Zhou, J., & Li, X. (2023). Flag3d: A 3d fitness activity dataset with language instruction. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 22106\u201322117.","DOI":"10.1109\/CVPR52729.2023.02117"},{"key":"2672_CR171","doi-asserted-by":"crossref","unstructured":"Tang, Y., Ni, Z., Zhou, J., Zhang, D., Lu, J., Wu, Y., & Zhou, J. (2020). Uncertainty-aware score distribution learning for action quality assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 9839\u20139848.","DOI":"10.1109\/CVPR42600.2020.00986"},{"issue":"9","key":"2672_CR172","doi-asserted-by":"crossref","first-page":"3138","DOI":"10.1109\/TPAMI.2020.2980824","volume":"43","author":"Y Tang","year":"2020","unstructured":"Tang, Y., Lu, J., & Zhou, J. (2020). Comprehensive instructional video analysis: The coin dataset and performance evaluation. IEEE Transactions on Pattern Analysis and Machine Intelligence,43(9), 3138\u20133153.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2672_CR173","doi-asserted-by":"crossref","unstructured":"Tao, L., Elhamifar, E., Khudanpur, S., Hager, G. D., & Vidal, R. (2012). Sparse hidden markov models for surgical gesture classification and skill evaluation. In Information processing in computer-assisted interventions, pp. 167\u2013177. Springer.","DOI":"10.1007\/978-3-642-30618-1_17"},{"key":"2672_CR174","doi-asserted-by":"crossref","unstructured":"Tran, D., Bourdev, L., Fergus, R., Torresani, L., & Paluri, M. (2015). Learning spatiotemporal features with 3d convolutional networks. In Proceedings of the IEEE international conference on computer vision, pp. 4489\u20134497.","DOI":"10.1109\/ICCV.2015.510"},{"issue":"1","key":"2672_CR175","doi-asserted-by":"crossref","first-page":"2","DOI":"10.3390\/data3010002","volume":"3","author":"A Vakanski","year":"2018","unstructured":"Vakanski, A., Jun, H.-P., Paul, D., & Baker, R. (2018). A data set of human body movements for physical rehabilitation exercises. Data,3(1), 2.","journal-title":"Data"},{"key":"2672_CR176","unstructured":"Vaswani, A. (2017). Attention is all you need. Advances in Neural Information Processing Systems."},{"key":"2672_CR177","first-page":"1","volume":"67","author":"V Venkataraman","year":"2015","unstructured":"Venkataraman, V., Vlachos, I., & Turaga, P. K. (2015). Dynamical regularity for action analysis. BMVC,67, 1\u201312.","journal-title":"BMVC"},{"key":"2672_CR178","doi-asserted-by":"crossref","unstructured":"Wang, J., Du, Z., Li, A., & Wang, Y. (2020). Assessing action quality via attentive spatio-temporal convolutional networks. In Chinese conference on pattern recognition and computer vision, pp. 3\u201316. Springer.","DOI":"10.1007\/978-3-030-60639-8_1"},{"key":"2672_CR179","doi-asserted-by":"crossref","unstructured":"Wang, X., Li, J., & Hu, H. (2022). Skeleton-based action quality assessment via partially connected lstm with triplet losses. In Chinese conference on pattern recognition and computer vision, pp. 220\u2013232. Springer.","DOI":"10.1007\/978-3-031-18913-5_17"},{"key":"2672_CR180","doi-asserted-by":"crossref","unstructured":"Wang, Y., Wang, J. W., & Bai, X. (2023). Three-stream fusion networks for student engagement recognition based on timesformer. In International conference on artificial intelligence and computer engineering, vol. 12610, pp. 758\u2013764. SPIE.","DOI":"10.1117\/12.2671122"},{"key":"2672_CR181","doi-asserted-by":"crossref","unstructured":"Wang, F., Wang, Q., & Chen, D. (2025). From beats to scores: A multi-modal framework for comprehensive figure skating assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 5905\u20135914.","DOI":"10.1109\/CVPRW67362.2025.00588"},{"key":"2672_CR182","doi-asserted-by":"crossref","unstructured":"Wang, T., Wang, Y., & Li, M. (2020). Towards accurate and interpretable surgical skill assessment: A video-based method incorporating recognized surgical gestures and skill levels. In Medical image computing and computer assisted intervention, pp. 668\u2013678. Springer.","DOI":"10.1007\/978-3-030-59716-0_64"},{"key":"2672_CR183","doi-asserted-by":"crossref","unstructured":"Wang, W., Wang, H., Hao, Y., & Wang, Q. (2024). Action quality assessment with multi-scale temporal attention mechanism. In International conference on advanced algorithms and control engineering, pp. 247\u2013251. IEEE.","DOI":"10.1109\/ICAACE61206.2024.10548995"},{"key":"2672_CR184","doi-asserted-by":"crossref","unstructured":"Wang, S., Wang, S., Yang, D., Li, M., Kuang, H., Zhao, X., Su, L., Zhai, P., & Zhang, L. (2024). Cpr-coach: Recognizing composite error actions based on single-class training. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 18782\u201318792.","DOI":"10.1109\/CVPR52733.2024.01777"},{"key":"2672_CR185","doi-asserted-by":"crossref","unstructured":"Wang, W., Yang, Y., & Fei, W. (2024). Towards data-and knowledge-driven ai: A survey on neuro-symbolic computing. IEEE Transactions on Pattern Analysis and Machine Intelligence.","DOI":"10.1109\/TPAMI.2024.3483273"},{"key":"2672_CR186","doi-asserted-by":"crossref","unstructured":"Wang, S., Yang, D., Zhai, P., Chen, C., & Zhang, L. (2021). Tsa-net: Tube self-attention network for action quality assessment. In Proceedings of the ACM international conference on multimedia, pp. 4902\u20134910.","DOI":"10.1145\/3474085.3475438"},{"key":"2672_CR187","doi-asserted-by":"crossref","unstructured":"Wang, S., Yang, D., Zhai, P., Yu, Q., Suo, T., Sun, Z., Li, K., & Zhang, L. (2021). A survey of video-based action quality assessment. In International conference on networking systems of AI, pp. 1\u20139. IEEE.","DOI":"10.1109\/INSAI54028.2021.00029"},{"issue":"9","key":"2672_CR188","doi-asserted-by":"crossref","first-page":"1595","DOI":"10.1007\/s11548-021-02448-4","volume":"16","author":"T Wang","year":"2021","unstructured":"Wang, T., Jin, M., & Li, M. (2021). Towards accurate and interpretable surgical skill assessment: A video-based method for skill score prediction and guiding feedback generation. International Journal of Computer Assisted Radiology and Surgery,16(9), 1595\u20131605.","journal-title":"International Journal of Computer Assisted Radiology and Surgery"},{"issue":"2","key":"2672_CR189","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3477533","volume":"18","author":"J Wang","year":"2022","unstructured":"Wang, J., Wang, Y., Weng, N., Chai, T., Li, A., Zhang, F., & Sansi, Yu. (2022). Will you ever become popular? learning to predict virality of dance clips. ACM Transactions on Multimedia Computing, Communications, and Applications,18(2), 1\u201324.","journal-title":"ACM Transactions on Multimedia Computing, Communications, and Applications"},{"key":"2672_CR190","doi-asserted-by":"crossref","unstructured":"Wen, H., & Xu, Y. (2024). Learning to score sign language with two-stage method. arXiv preprint arXiv:2404.10383.","DOI":"10.1007\/978-981-97-9674-8_3"},{"key":"2672_CR191","doi-asserted-by":"crossref","unstructured":"Wnuk, K., & Soatto, S. (2010). Analyzing diving: A dataset for judging action quality. In Asian conference on computer vision, pp. 266\u2013276. Springer.","DOI":"10.1007\/978-3-642-22822-3_27"},{"key":"2672_CR192","doi-asserted-by":"crossref","unstructured":"Wu, G., Li, T., Zhou, Y., Guo, J., Zhu, J., Chen, N., Song, W., Xing, Y., Meng, X., & Lin, Y. (2024). Research on worker action recognition and evaluation in intelligent manufacturing training based on industrial metaverse. In Asia simulation conference, pp. 365\u2013380. Springer.","DOI":"10.1007\/978-981-97-7225-4_28"},{"key":"2672_CR193","doi-asserted-by":"crossref","unstructured":"Xiang, X., Tian, Y., Reiter, A., Hager, G. D., & Tran, T. D. (2018). S3d: Stacking segmental p3d for action quality assessment. In IEEE international conference on image processing, pp. 928\u2013932. IEEE.","DOI":"10.1109\/ICIP.2018.8451364"},{"key":"2672_CR194","doi-asserted-by":"crossref","first-page":"2901","DOI":"10.1609\/aaai.v37i3.25392","volume":"37","author":"J Xia","year":"2023","unstructured":"Xia, J., Zhuge, M., Geng, T., Fan, S., Wei, Y., He, Z., & Zheng, F. (2023). Skating-mixer: Long-term sport audio-visual modeling with mlps. In Proceedings of the AAAI Conference on Artificial Intelligence,37, 2901\u20132909.","journal-title":"In Proceedings of the AAAI Conference on Artificial Intelligence"},{"issue":"1","key":"2672_CR195","doi-asserted-by":"crossref","first-page":"104","DOI":"10.1038\/s41597-022-01188-7","volume":"9","author":"Q-J Xing","year":"2022","unstructured":"Xing, Q.-J., Shen, Y.-Y., Cao, R., Zong, S.-X., Zhao, S.-X., & Shen, Y.-F. (2022). Functional movement screen dataset collected with two azure kinect depth sensors. Scientific Data,9(1), 104.","journal-title":"Scientific Data"},{"issue":"3","key":"2672_CR196","volume":"20","author":"Q Xing","year":"2025","unstructured":"Xing, Q., Xing, X., Guo, P., Tang, Z., & Shen, Y. (2025). Llm-fms: A fine-grained dataset for functional movement screen action quality assessment. PloS one,20(3), Article e0313707.","journal-title":"PloS one"},{"key":"2672_CR197","doi-asserted-by":"crossref","unstructured":"Xu, S., Chen, P., Liu, Y., Wang, M., Wang, S., & Kwong, S. (2024). Reveal fluidity behind frames: A multi-modality framework for action quality assessment. In IEEE international workshop on multimedia signal processing, pp. 1\u20136. IEEE.","DOI":"10.1109\/MMSP61759.2024.10743311"},{"key":"2672_CR198","doi-asserted-by":"crossref","unstructured":"Xu, H., Ke, X., Li, Y., Xu, R., Wu, H., Lin, X., & Guo, W. (2024). Vision-language action knowledge learning for semantic-aware action quality assessment. In European conference on computer vision, pp. 423\u2013440. Springer.","DOI":"10.1007\/978-3-031-72946-1_24"},{"key":"2672_CR199","doi-asserted-by":"crossref","unstructured":"Xu, H., Ke, X., Wu, H., Xu, R., Li, Y., & Guo, W. (2025). Language-guided audio-visual learning for long-term sports assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 23967\u201323977.","DOI":"10.1109\/CVPR52734.2025.02232"},{"key":"2672_CR200","doi-asserted-by":"crossref","unstructured":"Xu, J., Rao, Y., Yu, X., Chen, G., Zhou, J., & Lu, J. (2022). Finediving: A fine-grained dataset for procedure-aware action quality assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2949\u20132958.","DOI":"10.1109\/CVPR52688.2022.00296"},{"key":"2672_CR201","doi-asserted-by":"crossref","unstructured":"Xu, J., Rao, Y., Zhou, J., & Lu, J. (2024). Procedure-aware action quality assessment: Datasets and performance evaluation. International journal of computer vision, pp. 1\u201322.","DOI":"10.1007\/s11263-024-02146-z"},{"key":"2672_CR202","doi-asserted-by":"crossref","unstructured":"Xu, J., Yin, S., Zhao, G., Wang, Z., & Peng, Y. (2024). Fineparser: A fine-grained spatio-temporal action parser for human-centric action quality assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 14628\u201314637.","DOI":"10.1109\/CVPR52733.2024.01386"},{"key":"2672_CR203","doi-asserted-by":"crossref","unstructured":"Xu, A., Zeng, L.-A., & Zheng, W.-S. (2022). Likert scoring with grade decoupling for long-term action assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3232\u20133241.","DOI":"10.1109\/CVPR52688.2022.00323"},{"issue":"12","key":"2672_CR204","doi-asserted-by":"crossref","first-page":"4578","DOI":"10.1109\/TCSVT.2019.2927118","volume":"30","author":"C Xu","year":"2019","unstructured":"Xu, C., Fu, Y., Zhang, B., Chen, Z., Jiang, Y.-G., & Xue, X. (2019). Learning to score figure skating sport videos. IEEE Transactions on Circuits and Systems for Video Technology,30(12), 4578\u20134590.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"key":"2672_CR205","doi-asserted-by":"crossref","unstructured":"Yao, L., Lei, Q., Zhang, H, Du, J., & Gao, S. (2023). A contrastive learning network for performance metric and assessment of physical rehabilitation exercises. IEEE Transactions on Neural Systems and Rehabilitation Engineering.","DOI":"10.1109\/TNSRE.2023.3317411"},{"key":"2672_CR206","unstructured":"Yin, H., Gu, L., Parmar, P., Xu, L., Guo, T., Fu, W., Zhang, Y., & Zheng, T. (2025). Flex: A large-scale multi-modal multi-action dataset for fitness action quality assessment. arXiv preprint arXiv:2506.03198."},{"key":"2672_CR207","doi-asserted-by":"crossref","unstructured":"Yu, X., Rao, Y., Zhao, W., Lu, J., & Zhou, J. (2021). Group-aware contrastive regression for action quality assessment. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 7919\u20137928.","DOI":"10.1109\/ICCV48922.2021.00782"},{"key":"2672_CR208","doi-asserted-by":"crossref","unstructured":"Yun, W., Qi, M., Peng, F., & Ma, H. (2024). Semi-supervised teacher-reference-student architecture for action quality assessment. In European conference on computer vision, pp. 161\u2013178. Springer, Cham.","DOI":"10.1007\/978-3-031-72904-1_10"},{"key":"2672_CR209","unstructured":"Zahan, S. (2024). Human motion analysis. Thesis."},{"key":"2672_CR210","doi-asserted-by":"crossref","unstructured":"Zahan, S., Hassan, G. M., & Mian, A. (2024). Learning sparse temporal video mapping for action quality assessment in floor gymnastics. IEEE Transactions on Instrumentation and Measurement.","DOI":"10.1109\/TIM.2024.3398072"},{"key":"2672_CR211","doi-asserted-by":"crossref","unstructured":"Zeng, L.-A., & Zheng, W.-S. (2024). Multimodal action quality assessment. IEEE Transactions on Image Processing.","DOI":"10.1109\/TIP.2024.3362135"},{"key":"2672_CR212","doi-asserted-by":"crossref","unstructured":"Zeng, L.-A., Hong, F.-T., Zheng, W.-S., Yu, Q.-Z., Zeng, W., Wang, Y.-W., & Lai, J.-H. (2020). Hybrid dynamic-static context-aware attention network for action assessment in long videos. In Proceedings of the ACM international conference on multimedia, pp. 2526\u20132534.","DOI":"10.1145\/3394171.3413560"},{"key":"2672_CR213","unstructured":"Zhang, D. (2023). Hand-eye behaviour analytics for children with autism spectrum disorder. Thesis."},{"key":"2672_CR214","doi-asserted-by":"crossref","unstructured":"Zhang, S., Bai, S., Chen, G., Chen, L., Lu, J., Wang, J., & Tang, Y. (2024). Narrative action evaluation with prompt-guided multimodal interaction. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 18430\u201318439.","DOI":"10.1109\/CVPR52733.2024.01744"},{"key":"2672_CR215","doi-asserted-by":"crossref","unstructured":"Zhang, S., Dai, W., Wang, S., Shen, X., Lu, J., Zhou, J., & Tang, Y. (2023). Logo: A long-form video dataset for group action quality assessment. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2405\u20132414.","DOI":"10.1109\/CVPR52729.2023.00238"},{"key":"2672_CR216","doi-asserted-by":"crossref","unstructured":"Zhang, X., Hongzhi Feng, M., Hossain, S., Chen, Y., Wang, H., & Yin, Y. (2024). Scaled background swap: Video augmentation for action quality assessment with background debiasing. ACM Transactions on Multimedia Computing, Communications and Applications.","DOI":"10.1145\/3737461"},{"key":"2672_CR217","doi-asserted-by":"crossref","unstructured":"Zhang, S.-J., Pan, J.-H., Gao, J., & Zheng, W.-S. (2023). Adaptive stage-aware assessment skill transfer for skill determination. IEEE Transactions on Multimedia.","DOI":"10.1109\/TMM.2023.3294800"},{"key":"2672_CR218","doi-asserted-by":"crossref","unstructured":"Zhang, D., Zhou, D., & Liu, H. (2023). Action quality assessment for asd behaviour evaluation. In International conference on machine learning and cybernetics, pp. 483\u2013488. IEEE.","DOI":"10.1109\/ICMLC58545.2023.10327994"},{"issue":"2","key":"2672_CR219","doi-asserted-by":"crossref","first-page":"929","DOI":"10.1007\/s00521-023-09068-w","volume":"36","author":"B Zhang","year":"2024","unstructured":"Zhang, B., Chen, J., Xu, Y., Zhang, H., Yang, X., & Geng, X. (2024). Auto-encoding score distribution regression for action quality assessment. Neural Computing and Applications,36(2), 929\u2013942.","journal-title":"Neural Computing and Applications"},{"issue":"9","key":"2672_CR220","doi-asserted-by":"crossref","first-page":"10053","DOI":"10.1007\/s10489-022-03984-5","volume":"53","author":"H-B Zhang","year":"2023","unstructured":"Zhang, H.-B., Dong, L.-J., Lei, Q., Yang, L.-J., & Du, J.-X. (2023). Label-reconstruction-based pseudo-subscore learning for action quality assessment in sporting events. Applied Intelligence,53(9), 10053\u201310067.","journal-title":"Applied Intelligence"},{"issue":"9","key":"2672_CR221","doi-asserted-by":"crossref","first-page":"6017","DOI":"10.1109\/TCSVT.2022.3143549","volume":"32","author":"S-J Zhang","year":"2022","unstructured":"Zhang, S.-J., Pan, J.-H., Gao, J., & Zheng, W.-S. (2022). Semi-supervised action quality assessment with self-supervised segment feature recovery. IEEE Transactions on Circuits and Systems for Video Technology,32(9), 6017\u20136028.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"issue":"1","key":"2672_CR222","doi-asserted-by":"crossref","first-page":"757","DOI":"10.1007\/s10489-022-03411-9","volume":"53","author":"Z Zhang","year":"2023","unstructured":"Zhang, Z., Wang, Z., Zhuang, S., & Wang, J. (2023). Toward action recognition and assessment using sfagcn and combinative regression model of spatiotemporal features. Applied Intelligence,53(1), 757\u2013768.","journal-title":"Applied Intelligence"},{"key":"2672_CR223","doi-asserted-by":"crossref","first-page":"104","DOI":"10.1016\/j.patrec.2022.04.015","volume":"158","author":"Y Zhang","year":"2022","unstructured":"Zhang, Y., Xiong, W., & Mi, S. (2022). Learning time-aware features for action quality assessment. Pattern Recognition Letters,158, 104\u2013110.","journal-title":"Pattern Recognition Letters"},{"key":"2672_CR224","volume":"78","author":"W Zhao","year":"2023","unstructured":"Zhao, W., Wang, S., Zhao, Y., Wei, J., & Li, T. (2023). Knowledge and data co-driven intelligent assessment of Chinese zither fingerings. Displays,78, Article 102442.","journal-title":"Displays"},{"key":"2672_CR225","doi-asserted-by":"crossref","first-page":"2612","DOI":"10.1109\/TNSRE.2023.3282675","volume":"31","author":"K Zheng","year":"2023","unstructured":"Zheng, K., Ji, W., Zhang, J., & Guo, C. (2023). A skeleton-based rehabilitation exercise assessment system with rotation invariance. IEEE Transactions on Neural Systems and Rehabilitation Engineering,31, 2612\u20132621.","journal-title":"IEEE Transactions on Neural Systems and Rehabilitation Engineering"},{"key":"2672_CR226","doi-asserted-by":"crossref","unstructured":"Zhong, Y., & Demiris, Y. (2024). Dancemvp: Self-supervised learning for multi-task primitive-based dance performance assessment via transformer text prompting. In Proceedings of the AAAI conference on artificial intelligence, vol.\u00a038, pp. 10270\u201310278.","DOI":"10.1609\/aaai.v38i9.28893"},{"key":"2672_CR227","doi-asserted-by":"crossref","unstructured":"Zhong, Y., Zhang, F., & Demiris, Y. (2023). Contrastive self-supervised learning for automated multi-modal dance performance assessment. In IEEE international conference on acoustics, speech and signal processing, pp. 1\u20135. IEEE.","DOI":"10.1109\/ICASSP49357.2023.10096824"},{"key":"2672_CR228","unstructured":"Zhou, K., Cai, R., Wang, L., Shum, H. P. H., & Liang, X. (2024). A comprehensive survey of action quality assessment: Method and benchmark. arXiv preprint arXiv:2412.11149."},{"key":"2672_CR229","doi-asserted-by":"crossref","unstructured":"Zhou, H., Hou, T., & Li, J. (2023). Prior knowledge-guided hierarchical action quality assessment with 3d convolution and attention mechanism. In Journal of physics: Conference series, vol. 2632, pp. 012027. IOP Publishing.","DOI":"10.1088\/1742-6596\/2632\/1\/012027"},{"key":"2672_CR230","unstructured":"Zhou, C., Huang, Y., & Ling, H. (2022). Uncertainty-driven action quality assessment. arXiv preprint arXiv:2207.14513."},{"key":"2672_CR231","unstructured":"Zhou, K., Li, J., Cai, R., Wang, L., Zhang, X., & Liang, X. (2024). Cofinal: Enhancing action quality assessment with coarse-to-fine instruction alignment. In International joint conference on artificial intelligence."},{"key":"2672_CR232","doi-asserted-by":"crossref","unstructured":"Zhou, K., Shum, H.\u00a0P., Li, F.\u00a0W., Zhang, X., & Liang, X. (2025). Phi: Bridging domain shift in long-term action quality assessment via progressive hierarchical instruction. IEEE transactions on image processing.","DOI":"10.1109\/TIP.2025.3574938"},{"key":"2672_CR233","doi-asserted-by":"crossref","unstructured":"Zhou, K., Wang, L., Zhang, X., Shum, H. P. H., Li, F. W. B., Li, J., & Liang, X. (2024). Magr: Manifold-aligned graph regularization for continual action quality assessment. European conference on computer vision (pp. 375\u2013392). Cham: Springer.","DOI":"10.1007\/978-3-031-73247-8_22"},{"issue":"5","key":"2672_CR234","doi-asserted-by":"crossref","first-page":"2456","DOI":"10.1109\/TVCG.2023.3247092","volume":"29","author":"K Zhou","year":"2023","unstructured":"Zhou, K., Cai, R., Ma, Y., Tan, Q., Wang, X., Li, J., Shum, H. P., Li, F. W., Jin, S., & Liang, X. (2023). A video-based augmented reality system for human-in-the-loop muscle strength assessment of juvenile dermatomyositis. IEEE Transactions on Visualization and Computer Graphics,29(5), 2456\u20132466.","journal-title":"IEEE Transactions on Visualization and Computer Graphics"},{"issue":"12","key":"2672_CR235","doi-asserted-by":"crossref","first-page":"7749","DOI":"10.1109\/TCSVT.2023.3281413","volume":"33","author":"K Zhou","year":"2023","unstructured":"Zhou, K., Ma, Y., Shum, H. P., & Liang, X. (2023). Hierarchical graph convolutional networks for action quality assessment. IEEE Transactions on Circuits and Systems for Video Technology,33(12), 7749\u20137763.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"key":"2672_CR236","doi-asserted-by":"crossref","DOI":"10.1016\/j.engappai.2023.107780","volume":"131","author":"C Zhou","year":"2024","unstructured":"Zhou, C., Zeng, J., Qiu, L., Wang, S., Liu, P., & Pan, J. (2024). An attention-based adaptive spatial\u2013temporal graph convolutional network for long-video ergonomic risk assessment. Engineering Applications of Artificial Intelligence,131, Article 107780.","journal-title":"Engineering Applications of Artificial Intelligence"},{"key":"2672_CR237","doi-asserted-by":"crossref","unstructured":"Zhu, Y., Liang, S., Li, P., & Wu, X. (2022). Robust human pose quality assessment using optimal sub-pattern assignment. In International conference on control, automation and information sciences, pp. 419\u2013423. IEEE.","DOI":"10.1109\/ICCAIS56082.2022.9990031"},{"key":"2672_CR238","unstructured":"Zia, A., Berniker, M., Nespolo, R., Perreault, C., Wang, Z., Mueller, B., Schmidt, R., Bhattacharyya, K., Liu, X., & Jarc, A. (2025). Surgical visual understanding (surgvu) dataset. arXiv preprint arXiv:2501.09209."},{"key":"2672_CR239","unstructured":"Zia, A., Bhattacharyya, K., Liu, X., Wang, Z., Berniker, M., Kondo, S., Colleoni, E., Psychogyios, D., Jin, Y., & Zhou, J. (2022). Objective surgical skills assessment and tool localization: Results from the miccai 2021 simsurgskill challenge. arXiv preprint arXiv:2212.04448"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02672-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02672-4","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02672-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T15:22:01Z","timestamp":1771341721000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02672-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,20]]},"references-count":239,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,2]]}},"alternative-id":["2672"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02672-4","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,20]]},"assertion":[{"value":"6 January 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 September 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"73"}}