{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,2]],"date-time":"2025-08-02T05:28:06Z","timestamp":1754112486939,"version":"3.41.0"},"publisher-location":"Cham","reference-count":29,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319166278"},{"type":"electronic","value":"9783319166285"}],"license":[{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015]]},"DOI":"10.1007\/978-3-319-16628-5_2","type":"book-chapter","created":{"date-parts":[[2015,4,11]],"date-time":"2015-04-11T06:31:51Z","timestamp":1428733911000},"page":"19-34","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Hand Detection and Tracking in Videos for Fine-Grained Action Recognition"],"prefix":"10.1007","author":[{"given":"Nga H.","family":"Do","sequence":"first","affiliation":[]},{"given":"Keiji","family":"Yanai","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,4,12]]},"reference":[{"key":"2_CR1","doi-asserted-by":"crossref","unstructured":"Yao, B., Fei-Fei, L.: Modeling mutual context of object and human pose in human-object interaction activities. In: Proceedings of IEEE Computer Vision and Pattern Recognition, pp. 17\u201324 (2010)","DOI":"10.1109\/CVPR.2010.5540235"},{"key":"2_CR2","doi-asserted-by":"crossref","unstructured":"Yao, B., Fei-Fei, L.: Discovering object functionality. In: Proceedings of IEEE International Conference on Computer Vision, pp. 2512\u20132519 (2013)","DOI":"10.1109\/ICCV.2013.312"},{"key":"2_CR3","unstructured":"Delaitre, V., Sivic, J., Laptev, I.: Learning person-object interactions for action recognition in still images. In: Advances in Neural Information Processing Systems (2011)"},{"key":"2_CR4","doi-asserted-by":"publisher","first-page":"601","DOI":"10.1109\/TPAMI.2011.158","volume":"34","author":"A Prest","year":"2012","unstructured":"Prest, A., Schmid, C., Ferrari, V.: Weakly supervised learning of interactions between humans and objects. IEEE Trans. Pattern Anal. Mach. Intell. 34, 601\u2013614 (2012)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2_CR5","doi-asserted-by":"publisher","first-page":"835","DOI":"10.1109\/TPAMI.2012.175","volume":"35","author":"A Prest","year":"2013","unstructured":"Prest, A., Ferrari, V., Schmid, C.: Explicit modeling of human-object interactions in realistic videos. IEEE Trans. Pattern Anal. Mach. Intell. 35, 835\u2013848 (2013)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2_CR6","unstructured":"Khurram, S., Amir, R., Mubarak, S.: UCF101: A dataset of 101 human actions classes from videos in the wild. CoRR abs\/1212.0402 (2012)"},{"key":"2_CR7","unstructured":"Binh, N.D., Shuichi, E., Ejima, T.: Real-time hand tracking and gesture recognition system. In: Proceedings of International Conference on Graphics, Vision and Image Processing, pp. 19\u201321 (2005)"},{"key":"2_CR8","first-page":"96","volume":"5","author":"C Manresa","year":"2005","unstructured":"Manresa, C., Varona, J., Mas, R., Perales, F.: Hand tracking and gesture recognition for human-computer interaction. Electron. Lett. Comput. Vis. Image Anal. 5, 96\u2013104 (2005)","journal-title":"Electron. Lett. Comput. Vis. Image Anal."},{"key":"2_CR9","doi-asserted-by":"crossref","unstructured":"Angelopoulou, A., Rodr\u00edguez, J.G., Psarrou, A.: Learning 2d hand shapes using the topology preservation model GNG. In: Proceedings of European Conference on Computer Vision, pp. 313\u2013324 (2006)","DOI":"10.1007\/11744023_25"},{"key":"2_CR10","doi-asserted-by":"crossref","unstructured":"Ren, Z., Yuan, J., Zhang, Z.: Robust hand gesture recognition based on finger-earth mover\u2019s distance with a commodity depth camera. In: Proceedings of ACM International Conference on Multimedia, pp. 1093\u20131096 (2011)","DOI":"10.1145\/2072298.2071946"},{"key":"2_CR11","doi-asserted-by":"crossref","unstructured":"Van den Bergh, M., Van Gool, L.: Combining RGB and ToF cameras for real-time 3d hand gesture interaction. In: IEEE Workshop on Applications of Computer Vision, pp. 66\u201372 (2011)","DOI":"10.1109\/WACV.2011.5711485"},{"key":"2_CR12","series-title":"Studies in Computational Intelligence","doi-asserted-by":"publisher","first-page":"259","DOI":"10.1007\/978-3-642-24013-3_27","volume-title":"Intelligent Distributed Computing V","author":"TI Cerlinca","year":"2011","unstructured":"Cerlinca, T.I., Pentiuc, S.G.: Robust 3D hand detection for gestures recognition. In: Brazier, F.M.T., Nieuwenhuis, K., Pavlin, G., Warnier, M., Badica, C. (eds.) Intelligent Distributed Computing V. SCI, vol. 382, pp. 259\u2013264. Springer, Heidelberg (2011)"},{"key":"2_CR13","doi-asserted-by":"crossref","unstructured":"Oikonomidis, I., Lourakis, M.I., Argyros, A.: Evolutionary quasi-random search for hand articulations tracking. In: Proceedings of IEEE Computer Vision and Pattern Recognition (2014)","DOI":"10.1109\/CVPR.2014.437"},{"key":"2_CR14","doi-asserted-by":"crossref","unstructured":"Sapp, B., Weiss, D., Taskar, B.: Parsing human motion with stretchable models. In: Proceedings of IEEE Computer Vision and Pattern Recognition, pp. 1281\u20131288 (2011)","DOI":"10.1109\/CVPR.2011.5995607"},{"key":"2_CR15","doi-asserted-by":"crossref","unstructured":"Yuan, Q., Sclaroff, S., Athitsos, V.: Automatic 2d hand tracking in video sequences. In: IEEE Workshops on Application of Computer Vision, vol. 1, pp. 250\u2013256 (2005)","DOI":"10.1109\/ACVMOT.2005.27"},{"key":"2_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1007\/978-3-540-79547-6_4","volume-title":"Computer Vision Systems","author":"H Baltzakis","year":"2008","unstructured":"Baltzakis, H., Argyros, A.A., Lourakis, M.I.A., Trahanias, P.: Tracking of human hands and faces through probabilistic fusion of multiple visual cues. In: Gasteratos, A., Vincze, M., Tsotsos, J.K. (eds.) ICVS 2008. LNCS, vol. 5008, pp. 33\u201342. Springer, Heidelberg (2008)"},{"key":"2_CR17","doi-asserted-by":"crossref","unstructured":"Filipovych, R., Ribeiro, E.: Recognizing primitive interactions by exploring actor-object states. In: Proceedings of IEEE Computer Vision and Pattern Recognition, pp. 1\u20137 (2008)","DOI":"10.1109\/CVPR.2008.4587726"},{"key":"2_CR18","doi-asserted-by":"publisher","first-page":"177","DOI":"10.1016\/j.cviu.2010.11.012","volume":"115","author":"R Filipovych","year":"2011","unstructured":"Filipovych, R., Ribeiro, E.: Robust sequence alignment for actor-object interaction recognition: discovering actor-object states. Comput. Vis. Image Underst. 115, 177\u2013193 (2011)","journal-title":"Comput. Vis. Image Underst."},{"key":"2_CR19","doi-asserted-by":"publisher","first-page":"1775","DOI":"10.1109\/TPAMI.2009.83","volume":"31","author":"A Gupta","year":"2009","unstructured":"Gupta, A., Kembhavi, A., Davis, L.: Observing human-object interactions: using spatial and functional compatibility for recognition. IEEE Trans. Pattern Anal. Mach. Intell. 31, 1775\u20131789 (2009)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2_CR20","doi-asserted-by":"crossref","unstructured":"Weinzaepfel, P., Revaud, J., Harchaoui, Z., Schmid, C.: DeepFlow: large displacement optical flow with deep matching. In: Proceedings of IEEE International Conference on Computer Vision (2013)","DOI":"10.1109\/ICCV.2013.175"},{"key":"2_CR21","doi-asserted-by":"crossref","unstructured":"Mittal, A., Zisserman, A., Torr, P.H.: Hand detection using multiple proposals. In: Proceedings of British Machine Vision Conference, pp. 1\u201311 (2011)","DOI":"10.5244\/C.25.75"},{"key":"2_CR22","doi-asserted-by":"publisher","first-page":"1627","DOI":"10.1109\/TPAMI.2009.167","volume":"32","author":"PF Felzenszwalb","year":"2010","unstructured":"Felzenszwalb, P.F., Girshick, R.B., McAllester, D., Ramanan, D.: Object detection with discriminatively trained part based models. IEEE Trans. Pattern Anal. Mach. Intell. 32, 1627\u20131645 (2010)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2_CR23","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1023\/A:1009715923555","volume":"2","author":"CJ Burges","year":"1998","unstructured":"Burges, C.J.: A tutorial on support vector machines for pattern recognition. Data Min. Knowl. Disc. 2, 121\u2013167 (1998)","journal-title":"Data Min. Knowl. Disc."},{"key":"2_CR24","doi-asserted-by":"publisher","first-page":"898","DOI":"10.1109\/TPAMI.2010.161","volume":"33","author":"P Arbelaez","year":"2011","unstructured":"Arbelaez, P., Maire, M., Fowlkes, C., Malik, J.: Contour detection and hierarchical image segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 33, 898\u2013916 (2011)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2_CR25","doi-asserted-by":"crossref","unstructured":"Bourdev, L., Malik, J.: Poselets: body part detectors trained using 3d human pose annotations. In: Proceedings of IEEE International Conference on Computer Vision (2009)","DOI":"10.1109\/ICCV.2009.5459303"},{"key":"2_CR26","doi-asserted-by":"crossref","unstructured":"Dalal, N., Triggs, B.: Histograms of oriented gradients for human detection. In: Proceedings of IEEE Computer Vision and Pattern Recognition, vol. 1, pp. 886\u2013893 (2005)","DOI":"10.1109\/CVPR.2005.177"},{"key":"2_CR27","doi-asserted-by":"crossref","unstructured":"Karlinsky, L., Dinerstein, M., Harari, D., Ullman, S.: The chains model for detecting parts by their context. In: Proceedings of IEEE Computer Vision and Pattern Recognition, pp. 25\u201332 (2010)","DOI":"10.1109\/CVPR.2010.5540232"},{"key":"2_CR28","doi-asserted-by":"crossref","unstructured":"Wang, H., Schmid, C.: Action recognition with improved trajectories. In: Proceedings of IEEE International Conference on Computer Vision, pp. 3551\u20133558 (2013)","DOI":"10.1109\/ICCV.2013.441"},{"key":"2_CR29","first-page":"1453","volume":"6","author":"I Tsochantaridis","year":"2005","unstructured":"Tsochantaridis, I., Joachims, T., Hofmann, T., Altun, Y.: Large margin methods for structured and interdependent output variables. J. Mach. Learn Res. 6, 1453\u20131484 (2005)","journal-title":"J. Mach. Learn Res."}],"container-title":["Lecture Notes in Computer Science","Computer Vision - ACCV 2014 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-16628-5_2","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,22]],"date-time":"2025-05-22T10:22:55Z","timestamp":1747909375000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-16628-5_2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015]]},"ISBN":["9783319166278","9783319166285"],"references-count":29,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-16628-5_2","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2015]]},"assertion":[{"value":"12 April 2015","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}