{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,17]],"date-time":"2026-03-17T07:59:52Z","timestamp":1773734392324,"version":"3.50.1"},"reference-count":48,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2023,8,1]],"date-time":"2023-08-01T00:00:00Z","timestamp":1690848000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,8,1]],"date-time":"2023-08-01T00:00:00Z","timestamp":1690848000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-023-16384-9","type":"journal-article","created":{"date-parts":[[2023,8,1]],"date-time":"2023-08-01T09:02:33Z","timestamp":1690880553000},"page":"21497-21523","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Hand pose estimation based on regression method from monocular RGB cameras for handling occlusion"],"prefix":"10.1007","volume":"83","author":[{"given":"Bekiri","family":"Roumaissa","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Babahenini","family":"Mohamed Chaouki","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,8,1]]},"reference":[{"key":"16384_CR1","unstructured":"Athitsos, V., Sclaroff, S.: Estimating 3d hand pose from a cluttered image. In: 2003 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, 2003. Proceedings., vol. 2, p. 432 (2003). IEEE"},{"key":"16384_CR2","doi-asserted-by":"crossref","unstructured":"Baek, S., Kim, K.I., Kim, T.-K.: Pushing the envelope for rgb-based dense 3d hand pose estimation via neural rendering. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1067\u20131076 (2019)","DOI":"10.1109\/CVPR.2019.00116"},{"key":"16384_CR3","doi-asserted-by":"crossref","unstructured":"Boukhayma, A., Bem, R.d., Torr, P.H.: 3d hand shape and pose from images in the wild. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10843\u201310852 (2019)","DOI":"10.1109\/CVPR.2019.01110"},{"key":"16384_CR4","doi-asserted-by":"crossref","unstructured":"Cai, Y., Ge, L., Cai, J., Yuan, J.: Weakly-supervised 3d hand pose estimation from monocular rgb images. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 666\u2013682 (2018)","DOI":"10.1007\/978-3-030-01231-1_41"},{"key":"16384_CR5","unstructured":"Chen, L., Lin, S.-Y., Xie, Y., Tang, H., Xue, Y., Xie, X., Lin, Y.-Y., Fan, W.: Generating realistic training images based on tonality-alignment generative adversarial networks for hand pose estimation. arXiv preprint arXiv:1811.09916 (2018)"},{"key":"16384_CR6","doi-asserted-by":"crossref","unstructured":"Dibra, E., Melchior, S., Balkis, A., Wolf, T., Oztireli, C., Gross, M.: Monocular rgb hand pose inference from unsupervised refinable nets. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, pp. 1075\u20131085 (2018)","DOI":"10.1109\/CVPRW.2018.00155"},{"key":"16384_CR7","doi-asserted-by":"crossref","unstructured":"Feng Q, Shum HP, Morishima S (2020) Resolving hand-object occlusion for mixed reality with joint deep learning and model optimization. Computer Animation and Virtual Worlds 31(4\u20135):1956","DOI":"10.1002\/cav.1956"},{"key":"16384_CR8","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1016\/j.neucom.2021.12.013","volume":"474","author":"C Gao","year":"2022","unstructured":"Gao C, Yang Y, Li W (2022) 3d interacting hand pose and shape estimation from a single rgb image. Neurocomputing 474:25\u201336","journal-title":"Neurocomputing"},{"key":"16384_CR9","doi-asserted-by":"crossref","unstructured":"Ge, L., Liang, H., Yuan, J., Thalmann, D.: 3d convolutional neural networks for efficient and robust hand pose estimation from single depth images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1991\u20132000 (2017)","DOI":"10.1109\/CVPR.2017.602"},{"key":"16384_CR10","doi-asserted-by":"crossref","unstructured":"Ge, L., Liang, H., Yuan, J., Thalmann, D.: Robust 3d hand pose estimation in single depth images: from single-view cnn to multi-view cnns. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3593\u20133601 (2016)","DOI":"10.1109\/CVPR.2016.391"},{"key":"16384_CR11","doi-asserted-by":"crossref","unstructured":"Ge, L., Ren, Z., Li, Y., Xue, Z., Wang, Y., Cai, J., Yuan, J.: 3d hand shape and pose estimation from a single rgb image. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10833\u201310842 (2019)","DOI":"10.1109\/CVPR.2019.01109"},{"issue":"11","key":"16384_CR12","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1145\/3422622","volume":"63","author":"I Goodfellow","year":"2020","unstructured":"Goodfellow I, Pouget-Abadie J, Mirza M, Xu B, Warde-Farley D, Ozair S, Courville A, Bengio Y (2020) Generative adversarial networks. Communications of the ACM 63(11):139\u2013144","journal-title":"Communications of the ACM"},{"key":"16384_CR13","doi-asserted-by":"crossref","unstructured":"Hasson, Y., Varol, G., Tzionas, D., Kalevatykh, I., Black, M.J., Laptev, I., Schmid, C.: Learning joint reconstruction of hands and manipulated objects. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11807\u201311816 (2019)","DOI":"10.1109\/CVPR.2019.01208"},{"key":"16384_CR14","unstructured":"He, Y., Hu, W., Yang, S., Qu, X., Wan, P., Guo, Z.: 3d hand pose estimation in the wild via graph refinement under adversarial learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (2020)"},{"key":"16384_CR15","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"16384_CR16","doi-asserted-by":"crossref","unstructured":"Iqbal, U., Molchanov, P., Gall, T.B.J., Kautz, J.: Hand pose estimation via latent 2.5 d heatmap regression. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 118\u2013134 (2018)","DOI":"10.1007\/978-3-030-01252-6_8"},{"key":"16384_CR17","doi-asserted-by":"crossref","unstructured":"Kourbane, I., Genc, Y.: A graph-based approach for absolute 3d hand pose estimation using a single rgb image. Applied Intelligence, 1\u201316 (2022)","DOI":"10.1007\/s10489-022-03390-x"},{"key":"16384_CR18","unstructured":"Kulon, D., Wang, H., G\u00fcler, R.A., Bronstein, M., Zafeiriou, S.: Single image 3d hand reconstruction with mesh convolutions. arXiv preprint arXiv:1905.01326 (2019)"},{"key":"16384_CR19","doi-asserted-by":"crossref","unstructured":"Le, V.-H., Nguyen, T.-T., Tran, N.-A., Pham, T.-C.: Openpose\u2019s evaluation in the video traditional martial arts presentation. In: 2019 19th International Symposium on Communications and Information Technologies (ISCIT), pp. 76\u201381 (2019). IEEE","DOI":"10.1109\/ISCIT.2019.8905243"},{"key":"16384_CR20","doi-asserted-by":"crossref","unstructured":"Li, S., Wang, H., Lee, D.: Hand pose estimation for hand-object interaction cases using augmented autoencoder. In: 2020 IEEE International Conference on Robotics and Automation (ICRA), pp. 993\u2013999 (2020). IEEE","DOI":"10.1109\/ICRA40945.2020.9197299"},{"issue":"12","key":"16384_CR21","doi-asserted-by":"publisher","first-page":"4883","DOI":"10.1109\/TCSVT.2021.3055862","volume":"31","author":"M Li","year":"2021","unstructured":"Li M, Wang J, Sang N (2021) Latent distribution-based 3d hand pose estimation from monocular rgb images. IEEE Transactions on Circuits and Systems for Video Technology 31(12):4883\u20134894","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"issue":"6","key":"16384_CR22","doi-asserted-by":"publisher","first-page":"2023","DOI":"10.1007\/s00371-021-02263-7","volume":"38","author":"M Mofarreh-Bonab","year":"2022","unstructured":"Mofarreh-Bonab M, Seyedarabi H, Mozaffari Tazehkand B, Kasaei S (2022) 3d hand pose estimation using rgbd images and hybrid deep learning networks. The Visual Computer 38(6):2023\u20132032","journal-title":"The Visual Computer"},{"key":"16384_CR23","doi-asserted-by":"crossref","unstructured":"Moon, G., Chang, J.Y., Lee, K.M.: V2v-posenet: Voxel-to-voxel prediction network for accurate 3d hand and human pose estimation from a single depth map. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5079\u20135088 (2018)","DOI":"10.1109\/CVPR.2018.00533"},{"key":"16384_CR24","doi-asserted-by":"crossref","unstructured":"Mueller, F., Bernard, F., Sotnychenko, O., Mehta, D., Sridhar, S., Casas, D., Theobalt, C.: Ganerated hands for real-time 3d hand tracking from monocular rgb. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 49\u201359 (2018)","DOI":"10.1109\/CVPR.2018.00013"},{"key":"16384_CR25","doi-asserted-by":"crossref","unstructured":"Mueller, F., Bernard, F., Sotnychenko, O., Mehta, D., Sridhar, S., Casas, D., Theobalt, C.: Ganerated hands for real-time 3d hand tracking from monocular rgb. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 49\u201359 (2018)","DOI":"10.1109\/CVPR.2018.00013"},{"key":"16384_CR26","doi-asserted-by":"crossref","unstructured":"Mueller, F., Mehta, D., Sotnychenko, O., Sridhar, S., Casas, D., Theobalt, C.: Real-time hand tracking under occlusion from an egocentric rgb-d sensor. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1154\u20131163 (2017)","DOI":"10.1109\/ICCVW.2017.82"},{"issue":"8","key":"16384_CR27","doi-asserted-by":"publisher","first-page":"1898","DOI":"10.1109\/TPAMI.2019.2907951","volume":"42","author":"M Oberweger","year":"2019","unstructured":"Oberweger M, Wohlhart P, Lepetit V (2019) Generalized feedback loop for joint hand-object pose estimation. IEEE transactions on pattern analysis and machine intelligence 42(8):1898\u20131912","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"16384_CR28","unstructured":"Paszke, A., Gross, S., Chintala, S., Chanan, G., Yang, E., DeVito, Z., Lin, Z., Desmaison, A., Antiga, L., Lerer, A.: Automatic differentiation in pytorch (2017)"},{"key":"16384_CR29","doi-asserted-by":"crossref","unstructured":"Qian, C., Sun, X., Wei, Y., Tang, X., Sun, J.: Realtime and robust hand tracking from depth. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1106\u20131113 (2014)","DOI":"10.1109\/CVPR.2014.145"},{"key":"16384_CR30","doi-asserted-by":"crossref","unstructured":"Redmon, J., Farhadi, A.: Yolo9000: better, faster, stronger. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7263\u20137271 (2017)","DOI":"10.1109\/CVPR.2017.690"},{"key":"16384_CR31","doi-asserted-by":"crossref","unstructured":"Romero, J., Kjellstr\u00f6m, H., Kragic, D.: Hands in action: real-time 3d reconstruction of hands in interaction with objects. In: 2010 IEEE International Conference on Robotics and Automation, pp. 458\u2013463 (2010). IEEE","DOI":"10.1109\/ROBOT.2010.5509753"},{"key":"16384_CR32","unstructured":"Romero, J., Tzionas, D., Black, M.J.: Embodied hands: Modeling and capturing hands and bodies together. arXiv preprint arXiv:2201.02610 (2022)"},{"key":"16384_CR33","doi-asserted-by":"crossref","unstructured":"Spurr, A., Song, J., Park, S., Hilliges, O.: Cross-modal deep variational hand pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 89\u201398 (2018)","DOI":"10.1109\/CVPR.2018.00017"},{"key":"16384_CR34","doi-asserted-by":"crossref","unstructured":"Sridhar, S., Oulasvirta, A., Theobalt, C.: Interactive markerless articulated hand motion tracking using rgb and depth data. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2456\u20132463 (2013)","DOI":"10.1109\/ICCV.2013.305"},{"key":"16384_CR35","doi-asserted-by":"crossref","unstructured":"Su, Y., Rambach, J., Minaskan, N., Lesur, P., Pagani, A., Stricker, D.: Deep multi-state object pose estimation for augmented reality assembly. In: 2019 IEEE International Symposium on Mixed and Augmented Reality Adjunct (ISMAR-Adjunct), pp. 222\u2013227 (2019). IEEE","DOI":"10.1109\/ISMAR-Adjunct.2019.00-42"},{"key":"16384_CR36","doi-asserted-by":"crossref","unstructured":"Tekin, B., Bogo, F., Pollefeys, M.: H+ o: Unified egocentric recognition of 3d hand-object poses and interactions. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4511\u20134520 (2019)","DOI":"10.1109\/CVPR.2019.00464"},{"key":"16384_CR37","doi-asserted-by":"crossref","unstructured":"Tekin, B., Bogo, F., Pollefeys, M.: H+ o: Unified egocentric recognition of 3d hand-object poses and interactions. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4511\u20134520 (2019)","DOI":"10.1109\/CVPR.2019.00464"},{"key":"16384_CR38","doi-asserted-by":"crossref","unstructured":"Wan, C., Yao, A., Gool, L.V.: Hand pose estimation from local surface normals. In: European Conference on Computer Vision, pp. 554\u2013569 (2016). Springer","DOI":"10.1007\/978-3-319-46487-9_34"},{"key":"16384_CR39","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2020.102802","volume":"70","author":"M-Y Wu","year":"2020","unstructured":"Wu M-Y, Ting P-W, Tang Y-H, Chou E-T, Fu L-C (2020) Hand pose estimation in object-interaction based on deep learning for virtual reality applications. Journal of Visual Communication and Image Representation 70:102802","journal-title":"Journal of Visual Communication and Image Representation"},{"key":"16384_CR40","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2020.102802","volume":"70","author":"M-Y Wu","year":"2020","unstructured":"Wu M-Y, Ting P-W, Tang Y-H, Chou E-T, Fu L-C (2020) Hand pose estimation in object-interaction based on deep learning for virtual reality applications. Journal of Visual Communication and Image Representation 70:102802","journal-title":"Journal of Visual Communication and Image Representation"},{"key":"16384_CR41","doi-asserted-by":"crossref","unstructured":"Xiang, D., Joo, H., Sheikh, Y.: Monocular total capture: Posing face, body, and hands in the wild. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10965\u201310974 (2019)","DOI":"10.1109\/CVPR.2019.01122"},{"key":"16384_CR42","doi-asserted-by":"crossref","unstructured":"Ye, Q., Kim, T.-K.: Occlusion-aware hand pose estimation using hierarchical mixture density network. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 801\u2013817 (2018)","DOI":"10.1007\/978-3-030-01249-6_49"},{"issue":"8","key":"16384_CR43","doi-asserted-by":"publisher","first-page":"2687","DOI":"10.1007\/s11042-013-1501-1","volume":"74","author":"H-S Yeo","year":"2015","unstructured":"Yeo H-S, Lee B-G, Lim H (2015) Hand tracking and gesture recognition system for human-computer interaction using low-cost hardware. Multimedia Tools and Applications 74(8):2687\u20132715","journal-title":"Multimedia Tools and Applications"},{"key":"16384_CR44","doi-asserted-by":"crossref","unstructured":"Yuan, S., Stenger, B., Kim, T.-K.: Rgb-based 3d hand pose estimation via privileged learning with depth images. arXiv preprint arXiv:1811.07376 (2018)","DOI":"10.1109\/ICCVW.2019.00348"},{"key":"16384_CR45","doi-asserted-by":"crossref","unstructured":"Zhang, X., Li, Q., Mo, H., Zhang, W., Zheng, W.: End-to-end hand mesh recovery from a monocular rgb image. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 2354\u20132364 (2019)","DOI":"10.1109\/ICCV.2019.00244"},{"key":"16384_CR46","unstructured":"Zhang, Y., Xu, C., Cheng, L.: Learning to search on manifolds for 3d pose estimation of articulated objects. arXiv preprint arXiv:1612.00596 (2016)"},{"key":"16384_CR47","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Lu, J., Du, K., Lin, X., Sun, Y., Ma, X.: Hbe: Hand branch ensemble network for real-time 3d hand pose estimation. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 501\u2013516 (2018)","DOI":"10.1007\/978-3-030-01264-9_31"},{"key":"16384_CR48","doi-asserted-by":"crossref","unstructured":"Zimmermann, C., Brox, T.: Learning to estimate 3d hand pose from single rgb images. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 4903\u20134911 (2017)","DOI":"10.1109\/ICCV.2017.525"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-16384-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-023-16384-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-16384-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,15]],"date-time":"2024-02-15T10:37:29Z","timestamp":1707993449000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-023-16384-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,8,1]]},"references-count":48,"journal-issue":{"issue":"7","published-online":{"date-parts":[[2024,2]]}},"alternative-id":["16384"],"URL":"https:\/\/doi.org\/10.1007\/s11042-023-16384-9","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,8,1]]},"assertion":[{"value":"22 January 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"5 April 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 July 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 August 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"This article does not contain any studies with human participants or animals performed by any of the authors.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}},{"value":"All the authors involved have agreed to participate in this submitted article.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent to participate"}},{"value":"All the authors involved in this manuscript give full consent for publication of this submitted article.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent to publish"}},{"value":"The authors have no conflicts of interest to declare relevant to this article\u2019s content.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}