{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T09:23:55Z","timestamp":1780392235705,"version":"3.54.1"},"publisher-location":"Cham","reference-count":45,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319464749","type":"print"},{"value":"9783319464756","type":"electronic"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-46475-6_19","type":"book-chapter","created":{"date-parts":[[2016,9,16]],"date-time":"2016-09-16T08:48:10Z","timestamp":1474015690000},"page":"294-310","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":142,"title":["Real-Time Joint Tracking of a Hand Manipulating an Object from RGB-D Input"],"prefix":"10.1007","author":[{"given":"Srinath","family":"Sridhar","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Franziska","family":"Mueller","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Michael","family":"Zollh\u00f6fer","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Dan","family":"Casas","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Antti","family":"Oulasvirta","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Christian","family":"Theobalt","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2016,9,17]]},"reference":[{"key":"19_CR1","unstructured":"Leap Motion. https:\/\/www.leapmotion.com\/"},{"key":"19_CR2","unstructured":"NimbleVR. http:\/\/nimblevr.com\/"},{"key":"19_CR3","doi-asserted-by":"crossref","unstructured":"Athitsos, V., Sclaroff, S.: Estimating 3D hand pose from a cluttered image. In: Proceedings of IEEE CVPR, pp. 432\u2013442 (2003)","DOI":"10.1109\/CVPR.2003.1211500"},{"key":"19_CR4","unstructured":"Badami, I., Stckler, J., Behnke, S.: Depth-enhanced hough forests for object-class detection and continuous pose estimation. In: Workshop on Semantic Perception, Mapping and Exploration (SPME) (2013)"},{"key":"19_CR5","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"640","DOI":"10.1007\/978-3-642-33783-3_46","volume-title":"Computer Vision \u2013 ECCV 2012","author":"L Ballan","year":"2012","unstructured":"Ballan, L., Taneja, A., Gall, J., Gool, L., Pollefeys, M.: Motion capture of hands in action using discriminative salient points. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012. LNCS, vol. 7577, pp. 640\u2013653. Springer, Heidelberg (2012). doi: 10.1007\/978-3-642-33783-3_46"},{"key":"19_CR6","doi-asserted-by":"crossref","unstructured":"Bray, M., Koller-Meier, E., Van Gool, L.: Smart particle filtering for 3D hand tracking. In: Proceedings of the International Conference on Automatic Face and Gesture Recognition, pp. 675\u2013680 (2004)","DOI":"10.1109\/AFGR.2004.1301612"},{"key":"19_CR7","unstructured":"Campbell, D., Petersson, L.: Gogma: globally-optimal Gaussian mixture alignment (2016). arXiv preprint arXiv:1603.00150"},{"key":"19_CR8","doi-asserted-by":"crossref","unstructured":"Hamer, H., Schindler, K., Koller-Meier, E., Van Gool, L.: Tracking a hand manipulating an object. In: Proceedings of IEEE ICCV, pp. 1475\u20131482 (2009)","DOI":"10.1109\/ICCV.2009.5459282"},{"key":"19_CR9","doi-asserted-by":"crossref","unstructured":"Heap, T., Hogg, D.: Towards 3D hand tracking using a deformable model. In: Proceedings of the International Conference on Automatic Face and Gesture Recognition, pp. 140\u2013145, October 1996","DOI":"10.1109\/AFGR.1996.557255"},{"issue":"8","key":"19_CR10","doi-asserted-by":"publisher","first-page":"1633","DOI":"10.1109\/TPAMI.2010.223","volume":"33","author":"B Jian","year":"2011","unstructured":"Jian, B., Vemuri, B.C.: Robust point set registration using Gaussian mixture models. IEEE Trans. Pattern Anal. Mach. Intell. 33(8), 1633\u20131645 (2011)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"19_CR11","unstructured":"Keskin, C., Kira, F., Kara, Y.E., Akarun, L.: Real time hand pose estimation using depth sensors. In: ICCV Workshops, pp. 1228\u20131234. IEEE (2011). http:\/\/dblp.uni-trier.de\/db\/conf\/iccvw\/iccvw2011.html#KeskinKKA11"},{"key":"19_CR12","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"415","DOI":"10.1007\/978-3-642-40602-7_44","volume-title":"Pattern Recognition","author":"D Kurmankhojayev","year":"2013","unstructured":"Kurmankhojayev, D., Hasler, N., Theobalt, C.: Monocular pose capture with a depth camera using a sums-of-Gaussians body model. In: Weickert, J., Hein, M., Schiele, B. (eds.) GCPR 2013. LNCS, vol. 8142, pp. 415\u2013424. Springer, Heidelberg (2013)"},{"key":"19_CR13","doi-asserted-by":"crossref","unstructured":"Kyriazis, N., Argyros, A.: Physically plausible 3D scene tracking: the single actor hypothesis. In: Proceedings of IEEE CVPR, pp. 9\u201316 (2013)","DOI":"10.1109\/CVPR.2013.9"},{"key":"19_CR14","doi-asserted-by":"crossref","unstructured":"Kyriazis, N., Argyros, A.: Scalable 3D tracking of multiple interacting objects. In: Proceedings of IEEE CVPR, pp. 3430\u20133437, June 2014","DOI":"10.1109\/CVPR.2014.438"},{"issue":"9","key":"19_CR15","doi-asserted-by":"publisher","first-page":"1793","DOI":"10.1109\/TPAMI.2011.33","volume":"33","author":"M de La Gorce","year":"2011","unstructured":"de La Gorce, M., Fleet, D., Paragios, N.: Model-based 3D hand pose estimation from monocular video. IEEE TPAMI 33(9), 1793\u20131805 (2011)","journal-title":"IEEE TPAMI"},{"key":"19_CR16","doi-asserted-by":"crossref","unstructured":"Melax, S., Keselman, L., Orsten, S.: Dynamics based 3D skeletal hand tracking. In: Proceedings of GI, pp. 63\u201370 (2013)","DOI":"10.1145\/2448196.2448232"},{"key":"19_CR17","doi-asserted-by":"crossref","unstructured":"Oikonomidis, I., Kyriazis, N., Argyros, A.: Full DOF tracking of a hand interacting with an object by modeling occlusions and physical constraints. In: Proceedings of IEEE ICCV, pp. 2088\u20132095 (2011)","DOI":"10.1109\/ICCV.2011.6126483"},{"key":"19_CR18","doi-asserted-by":"crossref","unstructured":"Oikonomidis, I., Kyriazis, N., Argyros, A.: Tracking the articulated motion of two strongly interacting hands. In: Proceedings of IEEE CVPR, pp. 1862\u20131869 (2012)","DOI":"10.1109\/CVPR.2012.6247885"},{"key":"19_CR19","doi-asserted-by":"crossref","unstructured":"Oikonomidis, I., Kyriazis, N., Argyros, A.A.: Efficient model-based 3D tracking of hand articulations using kinect. In: Proceedings of BMVC, pp. 1\u201311 (2011)","DOI":"10.5244\/C.25.101"},{"key":"19_CR20","doi-asserted-by":"crossref","unstructured":"Panteleris, P., Kyriazis, N., Argyros, A.A.: 3D tracking of human hands in interaction with unknown objects. In: Proceedings of BMVC (2015). https:\/\/dx.doi.org\/10.5244\/C.29.123","DOI":"10.5244\/C.29.123"},{"key":"19_CR21","unstructured":"Pham, T.H., Kheddar, A., Qammaz, A., Argyros, A.A.: Towards force sensing from vision: observing hand-object interactions to infer manipulation forces. In: Proceedings of IEEE CVPR (2015)"},{"issue":"9","key":"19_CR22","doi-asserted-by":"publisher","first-page":"1182","DOI":"10.1109\/TPAMI.2003.1227995","volume":"25","author":"R Plankers","year":"2003","unstructured":"Plankers, R., Fua, P.: Articulated soft objects for multiview shape and motion capture. IEEE TPAMI 25(9), 1182\u20131187 (2003). http:\/\/dx.doi.org\/10.1109\/TPAMI.2003.1227995","journal-title":"IEEE TPAMI"},{"key":"19_CR23","doi-asserted-by":"crossref","unstructured":"Qian, C., Sun, X., Wei, Y., Tang, X., Sun, J.: Realtime and robust hand tracking from depth. In: Proceedings of IEEE CVPR (2014)","DOI":"10.1109\/CVPR.2014.145"},{"key":"19_CR24","doi-asserted-by":"crossref","unstructured":"Romero, J., Kjellstrom, H., Kragic, D.: Hands in action: real-time 3D reconstruction of hands in interaction with objects. In: Proceedings of ICRA, pp. 458\u2013463 (2010)","DOI":"10.1109\/ROBOT.2010.5509753"},{"key":"19_CR25","doi-asserted-by":"crossref","unstructured":"Sharp, T., Keskin, C., Robertson, D., Taylor, J., Shotton, J., Kim, D., Rhemann, C., Leichter, I., Vinnikov, A., Wei, Y., Freedman, D., Kohli, P., Krupka, E., Fitzgibbon, A., Izadi, S.: Accurate, robust, and flexible real-time hand tracking. In: Proceedings of ACM CHI (2015)","DOI":"10.1145\/2702123.2702179"},{"key":"19_CR26","doi-asserted-by":"crossref","unstructured":"Shotton, J., Fitzgibbon, A., Cook, M., Sharp, T., Finocchio, M., Moore, R., Kipman, A., Blake, A.: Real-time human pose recognition in parts from single depth images. In: Proceedings of IEEE CVPR, pp. 1297\u20131304 (2011). http:\/\/dx.doi.org\/10.1109\/CVPR.2011.5995316","DOI":"10.1109\/CVPR.2011.5995316"},{"key":"19_CR27","unstructured":"Sridhar, S., Mueller, F., Oulasvirta, A., Theobalt, C.: Fast and robust hand tracking using detection-guided optimization. In: Proceedings IEEE CVPR (2015). http:\/\/handtracker.mpi-inf.mpg.de\/projects\/FastHandTracker\/"},{"key":"19_CR28","doi-asserted-by":"crossref","unstructured":"Sridhar, S., Oulasvirta, A., Theobalt, C.: Interactive markerless articulated hand motion tracking using RGB and depth data. In: Proceedings of IEEE ICCV (2013)","DOI":"10.1109\/ICCV.2013.305"},{"key":"19_CR29","doi-asserted-by":"crossref","unstructured":"Stenger, B., Mendon\u00e7a, P.R., Cipolla, R.: Model-based 3D tracking of an articulated hand. In: Proceedings of the 2001 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, CVPR 2001, vol. 2, pp. II-310. IEEE (2001)","DOI":"10.1109\/CVPR.2001.990976"},{"key":"19_CR30","doi-asserted-by":"crossref","unstructured":"Stoll, C., Hasler, N., Gall, J., Seidel, H., Theobalt, C.: Fast articulated motion tracking using a sums of Gaussians body model. In: Proceedings of IEEE ICCV, pp. 951\u2013958 (2011)","DOI":"10.1109\/ICCV.2011.6126338"},{"key":"19_CR31","doi-asserted-by":"crossref","unstructured":"Sun, X., Wei, Y., Liang, S., Tang, X., Sun, J.: Cascaded hand pose regression. In: Proceedings of IEEE CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298683"},{"issue":"5","key":"19_CR32","doi-asserted-by":"crossref","first-page":"101","DOI":"10.1111\/cgf.12700","volume":"34","author":"Andrea Tagliasacchi","year":"2015","unstructured":"Tagliasacchi, A., Schr\u00f6der, M., Tkach, A., Bouaziz, S., Botsch, M., Pauly, M.: Robust articulated-ICP for real-time hand tracking. In: Computer Graphics Forum (Proceedings of SGP), vol. 34, no. 5 (2015)","journal-title":"Computer Graphics Forum"},{"key":"19_CR33","doi-asserted-by":"crossref","unstructured":"Tang, D., Chang, H.J., Tejani, A., Kim, T.: Latent regression forest: structured estimation of 3D articulated hand posture. In: Proceedings of IEEE CVPR, pp. 3786\u20133793 (2014). http:\/\/dx.doi.org\/10.1109\/CVPR.2014.490","DOI":"10.1109\/CVPR.2014.490"},{"key":"19_CR34","doi-asserted-by":"crossref","unstructured":"Tang, D., Taylor, J., Kim, T.K.: Opening the black box: hierarchical sampling optimization for estimating human hand pose. In: Proceedings of IEEE ICCV (2015)","DOI":"10.1109\/ICCV.2015.380"},{"key":"19_CR35","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"462","DOI":"10.1007\/978-3-319-10599-4_30","volume-title":"Computer Vision \u2013 ECCV 2014","author":"A Tejani","year":"2014","unstructured":"Tejani, A., Tang, D., Kouskouridas, R., Kim, T.-K.: Latent-class hough forests for 3D object detection and pose estimation. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8694, pp. 462\u2013477. Springer, Heidelberg (2014). doi: 10.1007\/978-3-319-10599-4_30"},{"issue":"5","key":"19_CR36","doi-asserted-by":"publisher","first-page":"169:1","DOI":"10.1145\/2629500","volume":"33","author":"J Tompson","year":"2014","unstructured":"Tompson, J., Stein, M., Lecun, Y., Perlin, K.: Real-time continuous pose recovery of human hands using convolutional networks. ACM TOG 33(5), 169:1\u2013169:10 (2014)","journal-title":"ACM TOG"},{"key":"19_CR37","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1007\/s11263-016-0895-4","volume":"118","author":"D Tzionas","year":"2016","unstructured":"Tzionas, D., Ballan, L., Srikantha, A., Aponte, P., Pollefeys, M., Gall, J.: Capturing hands in action using discriminative salient points and physics simulation. IJCV 118, 172\u2013193 (2016)","journal-title":"IJCV"},{"key":"19_CR38","doi-asserted-by":"crossref","unstructured":"Tzionas, D., Gall, J.: 3D object reconstruction from hand-object interactions. In: Proceedings of IEEE ICCV (2015)","DOI":"10.1109\/ICCV.2015.90"},{"key":"19_CR39","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"277","DOI":"10.1007\/978-3-319-11752-2_22","volume-title":"Pattern Recognition","author":"D Tzionas","year":"2014","unstructured":"Tzionas, D., Srikantha, A., Aponte, P., Gall, J.: Capturing hand motion with an RGB-D sensor, fusing a generative model with salient points. In: Jiang, X., Hornegger, J., Koch, R. (eds.) GCPR 2014. LNCS, vol. 8753, pp. 277\u2013289. Springer, Heidelberg (2014). doi: 10.1007\/978-3-319-11752-2_22"},{"key":"19_CR40","doi-asserted-by":"crossref","unstructured":"Wang, R., Paris, S., Popovi\u0107, J.: 6D hands: markerless hand-tracking for computer aided design. In: Proceedings of ACM UIST, pp. 549\u2013558 (2011)","DOI":"10.1145\/2047196.2047269"},{"issue":"4","key":"19_CR41","doi-asserted-by":"publisher","first-page":"43:1","DOI":"10.1145\/2461912.2462000","volume":"32","author":"Y Wang","year":"2013","unstructured":"Wang, Y., Min, J., Zhang, J., Liu, Y., Xu, F., Dai, Q., Chai, J.: Video-based hand manipulation capture through composite motion control. ACM TOG 32(4), 43:1\u201343:14 (2013)","journal-title":"ACM TOG"},{"key":"19_CR42","unstructured":"Wu, Y., Huang, T.: View-independent recognition of hand postures. In: Proceedings of IEEE CVPR, pp. 88\u201394 (2000)"},{"key":"19_CR43","doi-asserted-by":"crossref","unstructured":"Xu, C., Cheng, L.: Efficient hand pose estimation from a single depth image. In: Proceedings of IEEE ICCV (2013)","DOI":"10.1109\/ICCV.2013.429"},{"key":"19_CR44","doi-asserted-by":"crossref","unstructured":"Ye, M., Yang, R.: Real-time simultaneous pose and shape estimation for articulated objects using a single depth camera. In: 2014 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2353\u20132360, June 2014","DOI":"10.1109\/CVPR.2014.301"},{"issue":"4","key":"19_CR45","doi-asserted-by":"publisher","first-page":"156","DOI":"10.1145\/2601097.2601165","volume":"33","author":"M Zollh\u00f6fer","year":"2014","unstructured":"Zollh\u00f6fer, M., Nie\u00dfner, M., Izadi, S., Rehmann, C., Zach, C., Fisher, M., Wu, C., Fitzgibbon, A., Loop, C., Theobalt, C., Stamminger, M.: Real-time non-rigid reconstruction using an RGB-D camera. ACM TOG 33(4), 156 (2014)","journal-title":"ACM TOG"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2016"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-46475-6_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,10]],"date-time":"2025-06-10T19:14:43Z","timestamp":1749582883000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-46475-6_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319464749","9783319464756"],"references-count":45,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-46475-6_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016]]},"assertion":[{"value":"17 September 2016","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Amsterdam","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"The Netherlands","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2016","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 October 2016","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16 October 2016","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2016","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.eccv2016.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}