{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,10]],"date-time":"2026-01-10T19:38:38Z","timestamp":1768073918118,"version":"3.49.0"},"reference-count":72,"publisher":"Springer Science and Business Media LLC","issue":"31","license":[{"start":{"date-parts":[[2025,2,22]],"date-time":"2025-02-22T00:00:00Z","timestamp":1740182400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,2,22]],"date-time":"2025-02-22T00:00:00Z","timestamp":1740182400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-025-20704-6","type":"journal-article","created":{"date-parts":[[2025,2,22]],"date-time":"2025-02-22T04:58:17Z","timestamp":1740200297000},"page":"38121-38158","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Deep learning based on hand pose estimation methods: a systematic literature review"],"prefix":"10.1007","volume":"84","author":[{"given":"Bekiri","family":"Roumaissa","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Babahenini","family":"Mohamed Chaouki","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,2,22]]},"reference":[{"key":"20704_CR1","doi-asserted-by":"crossref","unstructured":"Piumsomboon T, Clark A, Billinghurst M, Cockburn A (2013) User-defined gestures for augmented reality. In: IFIP Conference on Human-Computer Interaction, pp. 282\u2013299. Springer","DOI":"10.1007\/978-3-642-40480-1_18"},{"key":"20704_CR2","doi-asserted-by":"crossref","unstructured":"Yin F, Chai X, Chen X (2016) Iterative reference driven metric learning for signer independent isolated sign language recognition. In: European Conference on Computer Vision, pp. 434\u2013450. Springer","DOI":"10.1007\/978-3-319-46478-7_27"},{"key":"20704_CR3","doi-asserted-by":"crossref","unstructured":"Markussen A, Jakobsen MR, Hornb\u00e6k K (2014) Vulture: a mid-air word-gesture keyboard. In: Proceedings of the SIGCHI Conference on Human Factors in Computing Systems, pp. 1073\u20131082","DOI":"10.1145\/2556288.2556964"},{"issue":"4","key":"20704_CR4","doi-asserted-by":"publisher","first-page":"501","DOI":"10.1109\/TVCG.2015.2391860","volume":"21","author":"Y Jang","year":"2015","unstructured":"Jang Y, Noh S-T, Chang HJ, Kim T-K, Woo W (2015) 3d finger cape: Clicking action and position estimation under self-occlusions in egocentric viewpoint. IEEE Trans Visual Comput Graphics 21(4):501\u2013510","journal-title":"IEEE Trans Visual Comput Graphics"},{"key":"20704_CR5","doi-asserted-by":"crossref","unstructured":"Liu Y, Jiang J, Sun J (2021) Hand pose estimation from rgb images based on deep learning: A survey. In: 2021 IEEE 7th International Conference on Virtual Reality (ICVR), pp. 82\u201389. IEEE","DOI":"10.1109\/ICVR51878.2021.9483815"},{"key":"20704_CR6","doi-asserted-by":"crossref","unstructured":"Zhang J, Jiao J, Chen M, Qu L, Xu X, Yang Q (2017) A hand pose tracking benchmark from stereo matching. In: 2017 IEEE International Conference on Image Processing (ICIP), pp. 982\u2013986. IEEE","DOI":"10.1109\/ICIP.2017.8296428"},{"key":"20704_CR7","doi-asserted-by":"crossref","unstructured":"Kazakos E, Nikou C, Kakadiaris IA (2018) On the fusion of rgb and depth information for hand pose estimation. In: 2018 25th IEEE International Conference on Image Processing (ICIP), pp. 868\u2013872. IEEE","DOI":"10.1109\/ICIP.2018.8451022"},{"key":"20704_CR8","doi-asserted-by":"crossref","unstructured":"Lim GM, Jatesiktat P, Ang WT (2020) Mobilehand: Real-time 3d hand shape and pose estimation from color image. In: International Conference on Neural Information Processing, pp. 450\u2013459. Springer","DOI":"10.1007\/978-3-030-63820-7_52"},{"issue":"19","key":"20704_CR9","doi-asserted-by":"publisher","first-page":"6850","DOI":"10.3390\/app10196850","volume":"10","author":"T Chatzis","year":"2020","unstructured":"Chatzis T, Stergioulas A, Konstantinidis D, Dimitropoulos K, Daras P (2020) A comprehensive study on deep learning-based 3d hand pose estimation methods. Appl Sci 10(19):6850","journal-title":"Appl Sci"},{"issue":"3","key":"20704_CR10","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1016\/j.vrih.2021.05.002","volume":"3","author":"L Huang","year":"2021","unstructured":"Huang L, Zhang B, Guo Z, Xiao Y, Cao Z, Yuan J (2021) Survey on depth and rgb image-based 3d hand shape and pose estimation. Virtual Reality & Intelligent Hardware. 3(3):207\u2013234","journal-title":"Virtual Reality & Intelligent Hardware."},{"key":"20704_CR11","unstructured":"Doosti B (2019) Hand pose estimation: A survey. arXiv:1903.01013"},{"key":"20704_CR12","doi-asserted-by":"publisher","first-page":"474","DOI":"10.1016\/j.cag.2023.09.013","volume":"116","author":"T Woo","year":"2023","unstructured":"Woo T, Park W, Jeong W, Park J (2023) A survey of deep learning methods and datasets for hand pose estimation from hand-object interaction images. Computers & Graphics. 116:474\u2013490","journal-title":"Computers & Graphics."},{"key":"20704_CR13","doi-asserted-by":"publisher","first-page":"144","DOI":"10.25046\/aj050418","volume":"5","author":"V-H Le","year":"2020","unstructured":"Le V-H, Nguyen H-C (2020) A survey on 3d hand skeleton and pose estimation by convolutional neu-ral network. Adv Sci Technol Eng Syst J. 5:144\u2013159","journal-title":"Adv Sci Technol Eng Syst J."},{"issue":"5","key":"20704_CR14","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2629500","volume":"33","author":"J Tompson","year":"2014","unstructured":"Tompson J, Stein M, Lecun Y, Perlin K (2014) Real-time continuous pose recovery of human hands using convolutional networks. ACM Transactions on Graphics (ToG). 33(5):1\u201310","journal-title":"ACM Transactions on Graphics (ToG)."},{"key":"20704_CR15","unstructured":"Oberweger M, Wohlhart P, Lepetit V (2015) Hands deep in deep learning for hand pose estimation. arXiv:1502.06807"},{"key":"20704_CR16","doi-asserted-by":"crossref","unstructured":"Oberweger M, Lepetit V (2017) Deepprior++: Improving fast and accurate 3d hand pose estimation. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp. 585\u2013594","DOI":"10.1109\/ICCVW.2017.75"},{"key":"20704_CR17","doi-asserted-by":"crossref","unstructured":"Zhou Y, Lu J, Du K, Lin X, Sun Y, Ma X (2018) Hbe: Hand branch ensemble network for real-time 3d hand pose estimation. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 501\u2013516","DOI":"10.1007\/978-3-030-01264-9_31"},{"key":"20704_CR18","doi-asserted-by":"crossref","unstructured":"Du K, Lin X, Sun Y, Ma X (2019) Crossinfonet: Multi-task information sharing based hand pose estimation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9896\u20139905","DOI":"10.1109\/CVPR.2019.01013"},{"key":"20704_CR19","doi-asserted-by":"crossref","unstructured":"Sinha A, Choi C, Ramani K (2016) Deephand: Robust hand pose estimation by completing a matrix imputed with deep features. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4150\u20134158","DOI":"10.1109\/CVPR.2016.450"},{"key":"20704_CR20","doi-asserted-by":"crossref","unstructured":"Wan C, Probst T, Van\u00a0Gool L, Yao A (2017) Crossing nets: Combining gans and vaes with a shared latent space for hand pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 680\u2013689","DOI":"10.1109\/CVPR.2017.132"},{"key":"20704_CR21","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.119922","volume":"223","author":"M Rezaei","year":"2023","unstructured":"Rezaei M, Rastgoo R, Athitsos V (2023) Trihorn-net: a model for accurate depth-based 3d hand pose estimation. Expert Syst Appl 223:119922","journal-title":"Expert Syst Appl"},{"key":"20704_CR22","doi-asserted-by":"crossref","unstructured":"Meng H, Jin S, Liu W, Qian C, Lin M, Ouyang W, Luo P (2022) 3d interacting hand pose estimation by hand de-occlusion and removal. In: European Conference on Computer Vision, pp. 380\u2013397. Springer","DOI":"10.1007\/978-3-031-20068-7_22"},{"key":"20704_CR23","doi-asserted-by":"crossref","unstructured":"Ge L, Ren Z, Yuan J (2018) Point-to-point regression pointnet for 3d hand pose estimation. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 475\u2013491","DOI":"10.1007\/978-3-030-01261-8_29"},{"key":"20704_CR24","unstructured":"Qi CR, Yi L, Su H, Guibas LJ (2017) Pointnet++: Deep hierarchical feature learning on point sets in a metric space. Advances in neural information processing systems 30"},{"key":"20704_CR25","doi-asserted-by":"crossref","unstructured":"Ge L, Liang H, Yuan J, Thalmann D (2017) 3d convolutional neural networks for efficient and robust hand pose estimation from single depth images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1991\u20132000","DOI":"10.1109\/CVPR.2017.602"},{"key":"20704_CR26","doi-asserted-by":"crossref","unstructured":"Moon G, Chang JY, Lee KM (2018) V2v-posenet: Voxel-to-voxel prediction network for accurate 3d hand and human pose estimation from a single depth map. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5079\u20135088","DOI":"10.1109\/CVPR.2018.00533"},{"key":"20704_CR27","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"20704_CR28","unstructured":"Huang F, Zeng A, Liu M, Qin J, Xu Q (2018) Structure-aware 3d hourglass network for hand pose estimation from single depth image. arXiv:1812.10320"},{"key":"20704_CR29","doi-asserted-by":"publisher","first-page":"2163","DOI":"10.1609\/aaai.v37i2.25310","volume":"37","author":"P Ren","year":"2023","unstructured":"Ren P, Chen Y, Hao J, Sun H, Qi Q, Wang J, Liao J (2023) Two heads are better than one: image-point cloud network for depth-based 3d hand pose estimation. Proceedings of the AAAI Conference on Artificial Intelligence 37:2163\u20132171","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"20704_CR30","doi-asserted-by":"publisher","first-page":"419","DOI":"10.1609\/aaai.v36i1.19919","volume":"36","author":"J Cheng","year":"2022","unstructured":"Cheng J, Wan Y, Zuo D, Ma C, Gu J, Tan P, Wang H, Deng X, Zhang Y (2022) Efficient virtual view selection for 3d hand pose estimation. Proceedings of the AAAI Conference on Artificial Intelligence 36:419\u2013426","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"20704_CR31","doi-asserted-by":"crossref","unstructured":"Ge L, Liang H, Yuan J, Thalmann D (2016) Robust 3d hand pose estimation in single depth images: from single-view cnn to multi-view cnns. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3593\u20133601","DOI":"10.1109\/CVPR.2016.391"},{"key":"20704_CR32","doi-asserted-by":"crossref","unstructured":"Zimmermann C, Brox T (2017) Learning to estimate 3d hand pose from single rgb images. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 4903\u20134911","DOI":"10.1109\/ICCV.2017.525"},{"key":"20704_CR33","doi-asserted-by":"crossref","unstructured":"Wei SE, Ramakrishna V, Kanade T, Sheikh Y (2016) Convolutional pose machines. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4724\u20134732","DOI":"10.1109\/CVPR.2016.511"},{"key":"20704_CR34","doi-asserted-by":"crossref","unstructured":"Cao Z, Simon T, Wei SE, Sheikh Y (2017) Realtime multi-person 2d pose estimation using part affinity fields. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7291\u20137299","DOI":"10.1109\/CVPR.2017.143"},{"key":"20704_CR35","doi-asserted-by":"crossref","unstructured":"Spurr A, Song J, Park S, Hilliges O (2018) Cross-modal deep variational hand pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 89\u201398","DOI":"10.1109\/CVPR.2018.00017"},{"key":"20704_CR36","doi-asserted-by":"crossref","unstructured":"Theodoridis T, Chatzis T, Solachidis V, Dimitropoulos K, Daras P (2020) Cross-modal variational alignment of latent spaces. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, pp. 960\u2013961","DOI":"10.1109\/CVPRW50498.2020.00488"},{"key":"20704_CR37","doi-asserted-by":"crossref","unstructured":"Iqbal U, Molchanov P, Gall TBJ, Kautz J (2018) Hand pose estimation via latent 2.5 d heatmap regression. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 118\u2013134","DOI":"10.1007\/978-3-030-01252-6_8"},{"key":"20704_CR38","doi-asserted-by":"crossref","unstructured":"Spurr A, Iqbal U, Molchanov P, Hilliges O, Kautz J (2020) Weakly supervised 3d hand pose estimation via biomechanical constraints. In: European Conference on Computer Vision, pp. 211\u2013228. Springer","DOI":"10.1007\/978-3-030-58520-4_13"},{"issue":"1","key":"20704_CR39","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1007\/s41095-023-0346-4","volume":"10","author":"F Zhang","year":"2024","unstructured":"Zhang F, Zhao L, Li S, Su W, Liu L, Tao W (2024) 3d hand pose and shape estimation from monocular rgb via efficient 2d cues. Computational Visual Media. 10(1):79\u201396","journal-title":"Computational Visual Media."},{"key":"20704_CR40","doi-asserted-by":"crossref","unstructured":"Ivashechkin M, Mendez O, Bowden R (2023) Denoising diffusion for 3d hand pose estimation from images. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3136\u20133145","DOI":"10.1109\/ICCVW60793.2023.00338"},{"key":"20704_CR41","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2022.109217","volume":"136","author":"K Mahdikhanlou","year":"2023","unstructured":"Mahdikhanlou K, Ebrahimnezhad H (2023) 3d hand pose estimation from a single rgb image by weighting the occlusion and classification. Pattern Recogn 136:109217","journal-title":"Pattern Recogn"},{"key":"20704_CR42","doi-asserted-by":"crossref","unstructured":"Mueller F, Bernard F, Sotnychenko O, Mehta D, Sridhar S, Casas D, Theobalt C (2018) Ganerated hands for real-time 3d hand tracking from monocular rgb. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 49\u201359","DOI":"10.1109\/CVPR.2018.00013"},{"key":"20704_CR43","doi-asserted-by":"crossref","unstructured":"Lim GM, Jatesiktat P, Ang WT (2020) Mobilehand: Real-time 3d hand shape and pose estimation from color image. In: International Conference on Neural Information Processing, pp. 450\u2013459. Springer","DOI":"10.1007\/978-3-030-63820-7_52"},{"key":"20704_CR44","doi-asserted-by":"crossref","unstructured":"Ge L, Ren Z, Li Y, Xue Z, Wang Y, Cai J, Yuan J (2019) 3d hand shape and pose estimation from a single rgb image. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10833\u201310842","DOI":"10.1109\/CVPR.2019.01109"},{"key":"20704_CR45","doi-asserted-by":"crossref","unstructured":"Taheri O, Ghorbani N, Black MJ, Tzionas D (2020) Grab: A dataset of whole-body human grasping of objects. In: European Conference on Computer Vision, pp. 581\u2013600. Springer","DOI":"10.1007\/978-3-030-58548-8_34"},{"key":"20704_CR46","doi-asserted-by":"crossref","unstructured":"Boukhayma A, Bem Rd, Torr PH (2019) 3d hand shape and pose from images in the wild. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10843\u201310852","DOI":"10.1109\/CVPR.2019.01110"},{"key":"20704_CR47","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2022.108762","volume":"129","author":"D Avola","year":"2022","unstructured":"Avola D, Cinque L, Fagioli A, Foresti GL, Fragomeni A, Pannone D (2022) 3d hand pose and shape estimation from rgb images for keypoint-based hand gesture recognition. Pattern Recogn 129:108762","journal-title":"Pattern Recogn"},{"key":"20704_CR48","doi-asserted-by":"crossref","unstructured":"Xie P, Xu W, Tang T, Yu Z, Lu C (2024) Ms-mano: Enabling hand pose tracking with biomechanical constraints. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2382\u20132392","DOI":"10.1109\/CVPR52733.2024.00231"},{"key":"20704_CR49","doi-asserted-by":"crossref","unstructured":"Hasson Y, Varol G, Tzionas D, Kalevatykh I, Black MJ, Laptev I, Schmid C (2019) Learning joint reconstruction of hands and manipulated objects. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11807\u201311816","DOI":"10.1109\/CVPR.2019.01208"},{"key":"20704_CR50","unstructured":"Romero J, Tzionas D, Black MJ (2022) Embodied hands: Modeling and capturing hands and bodies together. arXiv:2201.02610"},{"key":"20704_CR51","doi-asserted-by":"crossref","unstructured":"Groueix T, Fisher M, Kim VG, Russell BC, Aubry M (2018) A papier-m\u00e2ch\u00e9 approach to learning 3d surface generation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 216\u2013224","DOI":"10.1109\/CVPR.2018.00030"},{"key":"20704_CR52","doi-asserted-by":"crossref","unstructured":"Dibra E, Melchior S, Balkis A, Wolf T, Oztireli C, Gross M (2018) Monocular rgb hand pose inference from unsupervised refinable nets. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, pp. 1075\u20131085","DOI":"10.1109\/CVPRW.2018.00155"},{"key":"20704_CR53","doi-asserted-by":"crossref","unstructured":"Mueller F, Mehta D, Sotnychenko O, Sridhar S, Casas D, Theobalt C (2017) Real-time hand tracking under occlusion from an egocentric rgb-d sensor. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1154\u20131163","DOI":"10.1109\/ICCV.2017.131"},{"key":"20704_CR54","doi-asserted-by":"crossref","unstructured":"Mofarreh-Bonab M, Seyedarabi H, Mozaffari\u00a0Tazehkand B, Kasaei S (2021) 3d hand pose estimation using rgbd images and hybrid deep learning networks. The Visual Computer 1\u201310","DOI":"10.1007\/s00371-021-02263-7"},{"key":"20704_CR55","doi-asserted-by":"crossref","unstructured":"Choi C, Sinha A, Choi JH, Jang S, Ramani K (2015) A collaborative filtering approach to real-time hand pose estimation. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2336\u20132344","DOI":"10.1109\/ICCV.2015.269"},{"issue":"1","key":"20704_CR56","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1007\/s12652-022-03874-1","volume":"15","author":"Y Wang","year":"2024","unstructured":"Wang Y, Jiang X, Fujita H, Fang Z, Qiu X, Chen J (2024) Efn6d: an efficient rgb-d fusion network for 6d pose estimation. J Ambient Intell Humaniz Comput 15(1):75\u201388","journal-title":"J Ambient Intell Humaniz Comput"},{"key":"20704_CR57","doi-asserted-by":"publisher","first-page":"3756","DOI":"10.1609\/aaai.v38i4.28166","volume":"38","author":"X Liu","year":"2024","unstructured":"Liu X, Ren P, Gao Y, Wang J, Sun H, Qi Q, Zhuang Z, Liao J (2024) Keypoint fusion for rgb-d based 3d hand pose estimation. Proceedings of the AAAI Conference on Artificial Intelligence 38:3756\u20133764","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"issue":"18","key":"20704_CR58","doi-asserted-by":"publisher","first-page":"6095","DOI":"10.3390\/s21186095","volume":"21","author":"X Sun","year":"2021","unstructured":"Sun X, Wang B, Huang L, Zhang Q, Zhu S, Ma Y (2021) Crossfunet: Rgb and depth cross-fusion network for hand pose estimation. Sensors. 21(18):6095","journal-title":"Sensors."},{"key":"20704_CR59","doi-asserted-by":"crossref","unstructured":"Mueller F, Bernard F, Sotnychenko O, Mehta D, Sridhar S, Casas D, Theobalt C (2018) Ganerated hands for real-time 3d hand tracking from monocular rgb. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 49\u201359","DOI":"10.1109\/CVPR.2018.00013"},{"key":"20704_CR60","doi-asserted-by":"crossref","unstructured":"Tang D, Jin\u00a0Chang H, Tejani A, Kim TK (2014) Latent regression forest: Structured estimation of 3d articulated hand posture. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3786\u20133793","DOI":"10.1109\/CVPR.2014.490"},{"key":"20704_CR61","doi-asserted-by":"crossref","unstructured":"Yuan S, Ye Q, Stenger B, Jain S, Kim TK (2017) Bighand2. 2m benchmark: Hand pose dataset and state of the art analysis. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4866\u20134874","DOI":"10.1109\/CVPR.2017.279"},{"key":"20704_CR62","doi-asserted-by":"crossref","unstructured":"Sun X, Wei Y, Liang S, Tang X, Sun J (2015) Cascaded hand pose regression. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 824\u2013832","DOI":"10.1109\/CVPR.2015.7298683"},{"key":"20704_CR63","unstructured":"Yuan S, Ye Q, Garcia-Hernando G, Kim TK (2017) The 2017 hands in the million challenge on 3d hand pose estimation. arXiv:1707.02237"},{"key":"20704_CR64","doi-asserted-by":"crossref","unstructured":"Chao YW, Yang W, Xiang Y, Molchanov P, Handa A, Tremblay J, Narang YS, Van\u00a0Wyk K, Iqbal U, Birchfield S et\u00a0al. (2021) Dexycb: A benchmark for capturing hand grasping of objects. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9044\u20139053","DOI":"10.1109\/CVPR46437.2021.00893"},{"key":"20704_CR65","doi-asserted-by":"crossref","unstructured":"Moon G, Yu SI, Wen H, Shiratori T, Lee KM (2020) Interhand2. 6m: A dataset and baseline for 3d interacting hand pose estimation from a single rgb image. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XX 16, pp. 548\u2013564. Springer","DOI":"10.1007\/978-3-030-58565-5_33"},{"key":"20704_CR66","doi-asserted-by":"crossref","unstructured":"Lin F, Wilhelm C, Martinez T (2021) Two-hand global 3d pose estimation using monocular rgb. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 2373\u20132381","DOI":"10.1109\/WACV48630.2021.00242"},{"key":"20704_CR67","doi-asserted-by":"crossref","unstructured":"Wetzler A, Slossberg R, Kimmel R (2015) Rule of thumb: Deep derotation for improved fingertip detection. arXiv:1507.05726","DOI":"10.5244\/C.29.33"},{"issue":"12","key":"20704_CR68","doi-asserted-by":"publisher","first-page":"2878","DOI":"10.1109\/TPAMI.2012.261","volume":"35","author":"Y Yang","year":"2012","unstructured":"Yang Y, Ramanan D (2012) Articulated human detection with flexible mixtures of parts. IEEE Trans Pattern Anal Mach Intell 35(12):2878\u20132890","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"20704_CR69","doi-asserted-by":"crossref","unstructured":"Ahuja K, Streli P, Holz C (2021) Touchpose: Hand pose prediction, depth estimation, and touch classification from capacitive images. In: The 34th Annual ACM Symposium on User Interface Software and Technology, pp. 997\u20131009","DOI":"10.1145\/3472749.3474801"},{"key":"20704_CR70","doi-asserted-by":"crossref","unstructured":"Yuan S, Ye Q, Stenger B, Jain S, Kim TK (2017) Bighand2. 2m benchmark: Hand pose dataset and state of the art analysis. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4866\u20134874","DOI":"10.1109\/CVPR.2017.279"},{"key":"20704_CR71","doi-asserted-by":"crossref","unstructured":"Sridhar S, Oulasvirta A, Theobalt C (2013) Interactive markerless articulated hand motion tracking using rgb and depth data. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2456\u20132463","DOI":"10.1109\/ICCV.2013.305"},{"key":"20704_CR72","unstructured":"Deng X, Yang S, Zhang Y, Tan P, Chang L, Wang H (2017) Hand3d: Hand pose estimation using 3d neural network. arXiv:1704.02224"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-025-20704-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-025-20704-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-025-20704-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,17]],"date-time":"2025-09-17T09:45:03Z","timestamp":1758102303000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-025-20704-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,2,22]]},"references-count":72,"journal-issue":{"issue":"31","published-online":{"date-parts":[[2025,9]]}},"alternative-id":["20704"],"URL":"https:\/\/doi.org\/10.1007\/s11042-025-20704-6","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,2,22]]},"assertion":[{"value":"28 January 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 January 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 February 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 February 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no Conflict of interest to declare relevant to this article\u2019s content.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"This article does not contain any studies with human participants or animals performed by authors.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics Approval"}},{"value":"All authors have agreed to participate in this submitted article.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent to Participate"}},{"value":"All the authors involved in this manuscript give full consent for publication of this submitted article.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for Publication"}}]}}