{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T16:12:57Z","timestamp":1760890377826},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2021,7,24]],"date-time":"2021-07-24T00:00:00Z","timestamp":1627084800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,7,24]],"date-time":"2021-07-24T00:00:00Z","timestamp":1627084800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2022,6]]},"DOI":"10.1007\/s00371-021-02263-7","type":"journal-article","created":{"date-parts":[[2021,7,24]],"date-time":"2021-07-24T12:02:31Z","timestamp":1627128151000},"page":"2023-2032","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["3D hand pose estimation using RGBD images and hybrid deep learning networks"],"prefix":"10.1007","volume":"38","author":[{"given":"Mohammad","family":"Mofarreh-Bonab","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hadi","family":"Seyedarabi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Behzad","family":"Mozaffari\u00a0Tazehkand","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shohreh","family":"Kasaei","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,7,24]]},"reference":[{"issue":"1\u20132","key":"2263_CR1","doi-asserted-by":"publisher","first-page":"52","DOI":"10.1016\/j.cviu.2006.10.012","volume":"108","author":"A Erol","year":"2007","unstructured":"Erol, A., Bebis, G., Nicolescu, M., Boyle, R.D., Twombly, X.: Vision-based hand pose estimation: a review. Comput. Vis. Image Underst. 108(1\u20132), 52\u201373 (2007)","journal-title":"Comput. Vis. Image Underst."},{"key":"2263_CR2","unstructured":"Doosti, B.: Hand pose estimation: a survey. arXiv preprint arXiv:1903.01013 (2019)"},{"issue":"3","key":"2263_CR3","doi-asserted-by":"publisher","first-page":"1106","DOI":"10.1016\/j.patcog.2006.06.010","volume":"40","author":"P Kakumanu","year":"2007","unstructured":"Kakumanu, P., Makrogiannis, S., Bourbakis, N.: A survey of skin-color modeling and detection methods. Pattern Recogn. 40(3), 1106\u20131122 (2007)","journal-title":"Pattern Recogn."},{"key":"2263_CR4","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1016\/j.cviu.2015.05.010","volume":"139","author":"C Zhang","year":"2015","unstructured":"Zhang, C., Tian, Y.: Histogram of 3d facets: a depth descriptor for human action and hand gesture recognition. Comput. Vis. Image Underst. 139, 29\u201339 (2015)","journal-title":"Comput. Vis. Image Underst."},{"issue":"5","key":"2263_CR5","doi-asserted-by":"publisher","first-page":"1110","DOI":"10.1109\/TMM.2013.2246148","volume":"15","author":"Z Ren","year":"2013","unstructured":"Ren, Z., Yuan, J., Meng, J., Zhang, Z.: Robust part-based hand gesture recognition using kinect sensor. IEEE Trans. Multimedia 15(5), 1110\u20131120 (2013)","journal-title":"IEEE Trans. Multimedia"},{"issue":"10","key":"2263_CR6","doi-asserted-by":"publisher","first-page":"1107","DOI":"10.1007\/s00371-014-0921-x","volume":"30","author":"F Pedersoli","year":"2014","unstructured":"Pedersoli, F., Benini, S., Adami, N., Leonardi, R.: Xkin: an open source framework for hand pose and gesture recognition using kinect. Vis. Comput. 30(10), 1107\u20131122 (2014)","journal-title":"Vis. Comput."},{"issue":"9","key":"2263_CR7","doi-asserted-by":"publisher","first-page":"1797","DOI":"10.1007\/s00371-019-01774-8","volume":"36","author":"S Zhang","year":"2020","unstructured":"Zhang, S., He, F.: DRCDN: learning deep residual convolutional dehazing networks. Vis. Comput. 36(9), 1797\u20131808 (2020)","journal-title":"Vis. Comput."},{"key":"2263_CR8","doi-asserted-by":"publisher","first-page":"106335","DOI":"10.1016\/j.asoc.2020.106335","volume":"93","author":"Y Chen","year":"2020","unstructured":"Chen, Y., He, F., Li, H., Zhang, D., Wu, Y.: A full migration bbo algorithm with enhanced population quality bounds for multimodal biomedical image registration. Appl. Soft Comput. 93, 106335 (2020)","journal-title":"Appl. Soft Comput."},{"issue":"9","key":"2263_CR9","doi-asserted-by":"publisher","first-page":"5743","DOI":"10.1007\/s11042-019-08493-1","volume":"79","author":"H Yu","year":"2020","unstructured":"Yu, H., He, F., Pan, Y.: A scalable region-based level set method using adaptive bilateral filter for noisy image segmentation. Multimed. Tools Appl. 79(9), 5743\u20135765 (2020)","journal-title":"Multimed. Tools Appl."},{"issue":"9","key":"2263_CR10","doi-asserted-by":"publisher","first-page":"11173","DOI":"10.1007\/s11042-018-6690-1","volume":"78","author":"X Chen","year":"2019","unstructured":"Chen, X., He, F., Yu, H.: A matting method based on full feature coverage. Multimed. Tools Appl. 78(9), 11173\u201311201 (2019)","journal-title":"Multimed. Tools Appl."},{"issue":"3","key":"2263_CR11","first-page":"1","volume":"28","author":"RY Wang","year":"2009","unstructured":"Wang, R.Y., Popovic, J.: Real-time hand-tracking with a color glove. ACM Trans. Graph. (TOG) 28(3), 1\u20138 (2009)","journal-title":"ACM Trans. Graph. (TOG)"},{"issue":"8","key":"2263_CR12","doi-asserted-by":"publisher","first-page":"1533","DOI":"10.1109\/TPAMI.2016.2522398","volume":"38","author":"T Von Marcard","year":"2016","unstructured":"Von Marcard, T., Pons-Moll, G., Rosenhahn, B.: Human pose estimation from video and imus. IEEE Trans. Pattern Anal. Mach. Intell. 38(8), 1533\u20131547 (2016)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2263_CR13","doi-asserted-by":"crossref","unstructured":"Jung, H.Y., Suh, Y., Moon, G., Lee, K.M.: A sequential approach to 3d human pose estimation: Separation of localization and identification of body joints. In: European Conference on Computer Vision, pp. 747\u2013761. Springer (2016)","DOI":"10.1007\/978-3-319-46454-1_45"},{"issue":"4","key":"2263_CR14","doi-asserted-by":"publisher","first-page":"381","DOI":"10.1007\/s11263-018-1118-y","volume":"127","author":"A Gilbert","year":"2019","unstructured":"Gilbert, A., Trumble, M., Malleson, C., Hilton, A., Collomosse, J.: Fusing visual and inertial sensors with semantics for 3d human pose estimation. Int. J. Comput. Vis. 127(4), 381\u2013397 (2019)","journal-title":"Int. J. Comput. Vis."},{"issue":"5","key":"2263_CR15","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2629500","volume":"33","author":"J Tompson","year":"2014","unstructured":"Tompson, J., Stein, M., Lecun, Y., Perlin, K.: Real-time continuous pose recovery of human hands using convolutional networks. ACM Trans. Graph. (ToG) 33(5), 1\u201310 (2014)","journal-title":"ACM Trans. Graph. (ToG)"},{"key":"2263_CR16","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"2263_CR17","doi-asserted-by":"crossref","unstructured":"Nalepa, J., Grzejszczak, T., Kawulok, M.: Wrist localization in color images for hand gesture recognition. In: Man\u2013Machine Interactions 3, pp. 79\u201386. Springer (2014)","DOI":"10.1007\/978-3-319-02309-0_8"},{"issue":"6","key":"2263_CR18","doi-asserted-by":"publisher","first-page":"837","DOI":"10.1007\/s00371-013-0822-4","volume":"29","author":"H Liang","year":"2013","unstructured":"Liang, H., Yuan, J., Thalmann, D., Zhang, Z.: Model-based hand pose estimation via spatial\u2013temporal hand parsing and 3d fingertip localization. Vis. Comput. 29(6), 837\u2013848 (2013)","journal-title":"Vis. Comput."},{"key":"2263_CR19","doi-asserted-by":"crossref","unstructured":"Breuer, P., Eckes, C., Muller, S.: Hand gesture recognition with a novel ir time-of-flight range camera-a pilot study. In: International Conference on Computer Vision\/Computer Graphics Collaboration Techniques and Applications, pp. 247\u2013260. Springer (2007)","DOI":"10.1007\/978-3-540-71457-6_23"},{"issue":"2","key":"2263_CR20","first-page":"150","volume":"2","author":"A Rasim","year":"2013","unstructured":"Rasim, A., Alexander, T.: Hand detection based on skin color segmentation and classification of image local features. Tem J. 2(2), 150\u2013155 (2013)","journal-title":"Tem J."},{"key":"2263_CR21","doi-asserted-by":"crossref","unstructured":"Vinh, T.Q., Tri, N.T.: Hand gesture recognition based on depth image using kinect sensor. In: 2015 2nd National Foundation for Science and Technology Development Conference on Information and Computer Science (NICS), pp. 34\u201339. IEEE (2015)","DOI":"10.1109\/NICS.2015.7302218"},{"key":"2263_CR22","unstructured":"Oberweger, M., Wohlhart, P., Lepetit, V.: Hands deep in deep learning for hand pose estimation. arXiv preprint arXiv:1502.06807 (2015)"},{"key":"2263_CR23","doi-asserted-by":"crossref","unstructured":"Supancic, J.S., Rogez, G., Yang, Y., Shotton, J., Ramanan, D.: Depthbased hand pose estimation: data, methods, and challenges. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1868\u20131876 (2015)","DOI":"10.1109\/ICCV.2015.217"},{"key":"2263_CR24","doi-asserted-by":"crossref","unstructured":"Khamis, S., Taylor, J., Shotton, J., Keskin, C., Izadi, S., Fitzgibbon, A.: Learning an efficient model of hand shape variation from depth images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2540\u20132548 (2015)","DOI":"10.1109\/CVPR.2015.7298869"},{"key":"2263_CR25","doi-asserted-by":"crossref","unstructured":"Tan, D.J., Cashman, T., Taylor, J., Fitzgibbon, A., Tarlow, D., Khamis, S., Izadi, S., Shotton, J.: Fits like a glove: Rapid and reliable hand shape personalization. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5610\u20135619 (2016)","DOI":"10.1109\/CVPR.2016.605"},{"key":"2263_CR26","doi-asserted-by":"crossref","unstructured":"Oberweger, M., Lepetit, V.: Deepprior++: improving fast and accurate 3d hand pose estimation. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp. 585\u2013594 (2017)","DOI":"10.1109\/ICCVW.2017.75"},{"key":"2263_CR27","doi-asserted-by":"crossref","unstructured":"Ye, Q., Kim, T.K.: Occlusion-aware hand pose estimation using hierarchical mixture density network. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 801\u2013817 (2018)","DOI":"10.1007\/978-3-030-01249-6_49"},{"key":"2263_CR28","doi-asserted-by":"crossref","unstructured":"Ye, Q., Yuan, S., Kim, T.K.: Spatial attention deep net with partial PSO for hierarchical hybrid hand pose estimation. In: European Conference on Computer Vision, pp. 346\u2013361. Springer (2016)","DOI":"10.1007\/978-3-319-46484-8_21"},{"issue":"9","key":"2263_CR29","doi-asserted-by":"publisher","first-page":"1145","DOI":"10.1007\/s00371-018-1546-2","volume":"34","author":"Q Fan","year":"2018","unstructured":"Fan, Q., Shen, X., Hu, Y.: Detail-preserved real-time hand motion regression from depth. Vis. Comput. 34(9), 1145\u20131154 (2018)","journal-title":"Vis. Comput."},{"key":"2263_CR30","doi-asserted-by":"crossref","unstructured":"Guo, H., Wang, G., Chen, X., Zhang, C.: Towards good practices for deep 3d hand pose estimation. arXiv preprint arXiv:1707.07248 (2017)","DOI":"10.1016\/j.jvcir.2018.04.005"},{"key":"2263_CR31","doi-asserted-by":"publisher","first-page":"138","DOI":"10.1016\/j.neucom.2018.06.097","volume":"395","author":"X Chen","year":"2020","unstructured":"Chen, X., Wang, G., Guo, H., Zhang, C.: Pose guided structured region ensemble network for cascaded hand pose estimation. Neurocomputing 395, 138\u2013149 (2020)","journal-title":"Neurocomputing"},{"issue":"9","key":"2263_CR32","doi-asserted-by":"publisher","first-page":"1793","DOI":"10.1109\/TPAMI.2011.33","volume":"33","author":"M De La Gorce","year":"2011","unstructured":"De La Gorce, M., Fleet, D.J., Paragios, N.: Model-based 3d hand pose estimation from monocular video. IEEE Trans. Pattern Anal. Mach. Intell. 33(9), 1793\u20131805 (2011)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"12","key":"2263_CR33","doi-asserted-by":"publisher","first-page":"1910","DOI":"10.1109\/TPAMI.2005.233","volume":"27","author":"Y Wu","year":"2005","unstructured":"Wu, Y., Lin, J., Huang, T.S.: Analyzing and capturing articulated hand motion in image sequences. IEEE Trans. Pattern Anal. Mach. Intell. 27(12), 1910\u20131922 (2005)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2263_CR34","doi-asserted-by":"crossref","unstructured":"Cai, Y., Ge, L., Cai, J., Magnenat-Thalmann, N., Yuan, J.: 3d hand pose estimation using synthetic data and weakly labeled RGB images. IEEE Trans. Pattern Anal. Mach. Intell. (2020)","DOI":"10.1109\/TPAMI.2020.2993627"},{"key":"2263_CR35","doi-asserted-by":"crossref","unstructured":"Tang, D., Jin Chang, H., Tejani, A., Kim, T.K.: Latent regression forest: Structured estimation of 3d articulated hand posture. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3786\u20133793 (2014)","DOI":"10.1109\/CVPR.2014.490"},{"key":"2263_CR36","doi-asserted-by":"crossref","unstructured":"Sridhar, S., Oulasvirta, A., Theobalt, C.: Interactive markerless articulated hand motion tracking using RGB and depth data. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2456\u20132463 (2013)","DOI":"10.1109\/ICCV.2013.305"},{"key":"2263_CR37","doi-asserted-by":"crossref","unstructured":"Xu, D., Chen, Y.L., Wu, X., Ou, Y., Xu, Y.: Integrated approach of skincolor detection and depth information for hand and face localization. In: 2011 IEEE International Conference on Robotics and Biomimetics, pp. 952\u2013956. IEEE (2011)","DOI":"10.1109\/ROBIO.2011.6181410"},{"key":"2263_CR38","doi-asserted-by":"crossref","unstructured":"Cai, Y., Ge, L., Cai, J., Yuan, J.: Weakly-supervised 3d hand pose estimation from monocular RGB images. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 666\u2013682 (2018)","DOI":"10.1007\/978-3-030-01231-1_41"},{"key":"2263_CR39","doi-asserted-by":"crossref","unstructured":"Spurr, A., Song, J., Park, S., Hilliges, O.: Cross-modal deep variational hand pose estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 89\u201398 (2018)","DOI":"10.1109\/CVPR.2018.00017"},{"key":"2263_CR40","doi-asserted-by":"crossref","unstructured":"Zimmermann, C., Brox, T.: Learning to estimate 3d hand pose from single RGB images. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 4903\u20134911 (2017)","DOI":"10.1109\/ICCV.2017.525"},{"key":"2263_CR41","doi-asserted-by":"crossref","unstructured":"Mueller, F., Bernard, F., Sotnychenko, O., Mehta, D., Sridhar, S., Casas, D., Theobalt, C.: Ganerated hands for real-time 3d hand tracking from monocular rgb. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 49\u201359 (2018)","DOI":"10.1109\/CVPR.2018.00013"},{"key":"2263_CR42","doi-asserted-by":"crossref","unstructured":"Iqbal, U., Molchanov, P., Gall, T.B.J., Kautz, J.: Hand pose estimation via latent 2.5 d heatmap regression. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 118\u2013134 (2018)","DOI":"10.1007\/978-3-030-01252-6_8"},{"key":"2263_CR43","doi-asserted-by":"crossref","unstructured":"Rad, M., Oberweger, M., Lepetit, V.: Domain transfer for 3d pose estimation from color images without manual annotations. In: Asian Conference on Computer Vision, pp. 69\u201384. Springer (2018)","DOI":"10.1007\/978-3-030-20873-8_5"},{"key":"2263_CR44","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for largescale image recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"2263_CR45","doi-asserted-by":"crossref","unstructured":"Huang, G., Liu, Z., Van Der Maaten, L., Weinberger, K.Q.: Densely connected convolutional networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 4700\u20134708 (2017)","DOI":"10.1109\/CVPR.2017.243"},{"key":"2263_CR46","unstructured":"Howard, A.G., Zhu, M., Chen, B., Kalenichenko, D., Wang, W., Weyand, T., Andreetto, M., Adam, H.: Mobilenets: efficient convolutional neural networks for mobile vision applications. arXiv preprint arXiv:1704.04861 (2017)"},{"key":"2263_CR47","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-021-02263-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-021-02263-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-021-02263-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T08:13:04Z","timestamp":1652170384000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-021-02263-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,7,24]]},"references-count":47,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2022,6]]}},"alternative-id":["2263"],"URL":"https:\/\/doi.org\/10.1007\/s00371-021-02263-7","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,7,24]]},"assertion":[{"value":"14 July 2021","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 July 2021","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}