{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T16:50:22Z","timestamp":1777654222687,"version":"3.51.4"},"reference-count":153,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2023,2,1]],"date-time":"2023-02-01T00:00:00Z","timestamp":1675209600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,2,1]],"date-time":"2023-02-01T00:00:00Z","timestamp":1675209600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,2,1]],"date-time":"2023-02-01T00:00:00Z","timestamp":1675209600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61773197"],"award-info":[{"award-number":["61773197"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100017607","name":"Shenzhen Fundamental Research Program","doi-asserted-by":"publisher","award":["JCYJ20200109141622964"],"award-info":[{"award-number":["JCYJ20200109141622964"]}],"id":[{"id":"10.13039\/501100017607","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Intel ICRI-IACV Research Fund","award":["CG#52514373"],"award-info":[{"award-number":["CG#52514373"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Human-Mach. Syst."],"published-print":{"date-parts":[[2023,2]]},"DOI":"10.1109\/thms.2022.3219242","type":"journal-article","created":{"date-parts":[[2022,11,18]],"date-time":"2022-11-18T20:45:54Z","timestamp":1668804354000},"page":"253-268","source":"Crossref","is-referenced-by-count":76,"title":["Vision-Based Human Pose Estimation via Deep Learning: A Survey"],"prefix":"10.1109","volume":"53","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2020-8186","authenticated-orcid":false,"given":"Gongjin","family":"Lan","sequence":"first","affiliation":[{"name":"Department of Computer Science and Engineering, Southern University of Science and Technology, Shenzhen, China"}]},{"given":"Yu","family":"Wu","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Engineering, Southern University of Science and Technology, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4346-9477","authenticated-orcid":false,"given":"Fei","family":"Hu","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, University of Alabama, Tuscaloosa, AL, USA"}]},{"given":"Qi","family":"Hao","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Engineering, Southern University of Science and Technology, Shenzhen, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00022"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995316"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/AVSS.2010.80"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3343031.3350910"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2017.19"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00535"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/1189762.1189763"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3377325.3377505"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.214"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00584"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/0262-8856(83)90003-3"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1006\/cviu.2000.0897"},{"key":"ref13","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","volume":"25","author":"Krizhevsky","year":"2012","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICARCV.2018.8581288"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/SSCI44817.2019.9002863"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00542"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3118207"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.26599\/TST.2018.9010100"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2009.11.014"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2019.102897"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3524497"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.3390\/s16121966"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107561"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CCUBE53681.2021.9702726"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2021.103225"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.5244\/C.24.12"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.471"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.396"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.280"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.471"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01112"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.248"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2782743"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01249-6_37"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2017.00064"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01225-0_27"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.256"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.143"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46484-8_29"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00742"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01231-1_29"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00546"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00706"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107410"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6867"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00354"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475219"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00236"},{"key":"ref51","first-page":"1799","article-title":"Joint training of a convolutional network and a graphical model for human pose estimation","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Tompson","year":"2014"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.511"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.601"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.144"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/FG47880.2020.00014"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.5244\/C.30.109"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-16808-1_21"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00712"},{"key":"ref59","article-title":"TFPose: Direct human pose estimation with transformers","author":"Mao","year":"2021"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00198"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01159"},{"key":"ref62","article-title":"ViTPose: Simple vision transformer baselines for human pose estimation","author":"Xu","year":"2022"},{"key":"ref63","first-page":"2277","article-title":"Associative embedding: End-to-end learning for joint detection and grouping","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Newell","year":"2017"},{"key":"ref64","article-title":"Blazepose: On-device real-time body pose tracking","author":"Bazarevsky","year":"2020"},{"key":"ref65","article-title":"Mediapipe: A framework for building perception pipelines","author":"Lugaresi","year":"2019"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref67","article-title":"Rethinking on multi-stage networks for human pose estimation","author":"Li","year":"2019"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46466-4_3"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00705"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58571-6_42"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01252-6_26"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00543"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.395"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00704"},{"key":"ref75","first-page":"3027","article-title":"Learning temporal pose estimation from sparsely-labeled videos","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Bertasius","year":"2019"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01168"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00098"},{"key":"ref78","first-page":"29","article-title":"On the robustness of human pose estimation","volume-title":"Proc. IEEE\/CVF Conf. Comput. Vis. Pattern Recognit. Workshops","author":"Jain","year":"2019"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-011-0498-z"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-009-0209-1"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-16808-1_23"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.610"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.288"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2018.00024"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00621"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00847"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00781"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-020-01398-9"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00780"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00444"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01096"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.5244\/C.31.14"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-018-1118-y"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00227"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2017.00058"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093526"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00214"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01249-6_46"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00539"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.139"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2019.00162"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00723"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01145"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00794"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2892985"},{"key":"ref106","first-page":"8410","article-title":"Deep network for the integrated 3D sensing of multiple people in natural images","volume":"31","author":"Zanfir","year":"2018","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.1017\/cbo9780511811685"},{"key":"ref108","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00798"},{"key":"ref109","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00334"},{"key":"ref110","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58604-1_29"},{"key":"ref111","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR48806.2021.9412652"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00768"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2018.07.010"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2019.00014"},{"key":"ref115","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00606"},{"key":"ref116","doi-asserted-by":"publisher","DOI":"10.1109\/FSKD.2018.8686917"},{"key":"ref117","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN48605.2020.9207296"},{"key":"ref118","article-title":"Using deep learning-based pose estimation algorithms for markerless gait analysis in rehabilitation medicine","author":"Rabbito","year":"2021"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1049\/iet-cvi.2017.0062"},{"key":"ref120","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2947518"},{"key":"ref121","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2021.03.028"},{"key":"ref122","doi-asserted-by":"publisher","DOI":"10.1007\/s12652-019-01301-6"},{"key":"ref123","doi-asserted-by":"publisher","DOI":"10.1080\/10447318.2018.1543081"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC.2016.7591458"},{"key":"ref125","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC.2012.6346149"},{"key":"ref126","article-title":"A survey on 3D skeleton-based action recognition using learning method","author":"Ren","year":"2020"},{"key":"ref127","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2916873"},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1109\/ICMEW.2017.8026283"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00298"},{"key":"ref130","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58545-7_5"},{"key":"ref131","doi-asserted-by":"publisher","DOI":"10.1061\/(ASCE)CO.1943-7862.0001497"},{"key":"ref132","doi-asserted-by":"publisher","DOI":"10.1109\/CompComm.2016.7924850"},{"key":"ref133","doi-asserted-by":"publisher","DOI":"10.1109\/AITC.2019.8920892"},{"key":"ref134","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-015-2611-8"},{"key":"ref135","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2019.00304"},{"key":"ref136","doi-asserted-by":"publisher","DOI":"10.1109\/IWAIT.2018.8369762"},{"key":"ref137","doi-asserted-by":"publisher","DOI":"10.1145\/3334480.3382853"},{"key":"ref138","doi-asserted-by":"publisher","DOI":"10.1016\/j.joi.2018.09.002"},{"key":"ref139","doi-asserted-by":"publisher","DOI":"10.1016\/j.softx.2019.100263"},{"key":"ref140","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01581"},{"key":"ref141","first-page":"12949","article-title":"Sim2real transfer learning for 3D human pose estimation: Motion to the rescue","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Doersch","year":"2019"},{"key":"ref142","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01084"},{"key":"ref143","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00574"},{"key":"ref144","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01030"},{"key":"ref145","doi-asserted-by":"publisher","DOI":"10.5220\/0007555407440748"},{"key":"ref146","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00059"},{"key":"ref147","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58555-6_33"},{"key":"ref148","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58574-7_23"},{"key":"ref149","doi-asserted-by":"publisher","DOI":"10.1145\/3072959.3073596"},{"key":"ref150","article-title":"Synthetic occlusion augmentation with volumetric heatmaps for the 2018 ECCV posetrack challenge on 3D human pose estimation","author":"Srndi","year":"2018"},{"key":"ref151","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01231-1_33"},{"key":"ref152","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00756"},{"key":"ref153","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01101"}],"container-title":["IEEE Transactions on Human-Machine Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6221037\/10016745\/09955393.pdf?arnumber=9955393","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,1]],"date-time":"2024-02-01T03:13:21Z","timestamp":1706757201000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9955393\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,2]]},"references-count":153,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/thms.2022.3219242","relation":{},"ISSN":["2168-2291","2168-2305"],"issn-type":[{"value":"2168-2291","type":"print"},{"value":"2168-2305","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,2]]}}}