{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,5]],"date-time":"2026-04-05T00:41:28Z","timestamp":1775349688219,"version":"3.50.1"},"reference-count":90,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2012,5,30]],"date-time":"2012-05-30T00:00:00Z","timestamp":1338336000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2012,10]]},"DOI":"10.1007\/s11263-012-0532-9","type":"journal-article","created":{"date-parts":[[2012,5,29]],"date-time":"2012-05-29T15:59:54Z","timestamp":1338307194000},"page":"16-37","source":"Crossref","is-referenced-by-count":81,"title":["Coupled Action Recognition and Pose Estimation from Multiple Views"],"prefix":"10.1007","volume":"100","author":[{"given":"Angela","family":"Yao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Juergen","family":"Gall","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Luc","family":"Van Gool","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2012,5,30]]},"reference":[{"issue":"1","key":"532_CR1","doi-asserted-by":"crossref","first-page":"44","DOI":"10.1109\/TPAMI.2006.21","volume":"28","author":"A. Agarwal","year":"2006","unstructured":"Agarwal, A., & Triggs, B. (2006). Recovering 3d human pose from monocular images. IEEE Transactions on Pattern Analysis and Machine Intelligence, 28(1), 44\u201358.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"532_CR2","unstructured":"Aggarwal, J., & Ryoo, M. (2010). Human activity analysis: a\u00a0review. ACM Computing Surveys."},{"key":"532_CR3","volume-title":"Proceedings international conference on computer vision","author":"S. Ali","year":"2007","unstructured":"Ali, S., Basharat, A., & Shah, M. (2007). Chaotic invariants for human action recognition. In Proceedings international conference on computer vision."},{"key":"532_CR4","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"M. Andriluka","year":"2010","unstructured":"Andriluka, M., Roth, S., & Schiele, B. (2010). Monocular 3d pose estimation and tracking by detection. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR5","volume-title":"Proceedings international conference on computer vision","author":"A. Baak","year":"2009","unstructured":"Baak, A., Rosenhahn, B., Mueller, M., & Seidel, H. P. (2009). Stabilizing motion tracking using retrieved motion priors. In Proceedings international conference on computer vision."},{"key":"532_CR6","volume-title":"Proceeding of the workshop on motion of nonrigid and articulated objects","author":"A. Baumberg","year":"1994","unstructured":"Baumberg, A., & Hogg, D. (1994). An efficient method for contour tracking using active shape models. In Proceeding of the workshop on motion of nonrigid and articulated objects. Los Alamitos: IEEE Computer Society."},{"key":"532_CR7","volume-title":"Neural information processing systems","author":"M. Belkin","year":"2002","unstructured":"Belkin, M., & Niyogi, P. (2002). Laplacian eigenmaps and spectral techniques for embedding and clustering. In Neural information processing systems."},{"key":"532_CR8","doi-asserted-by":"crossref","first-page":"93","DOI":"10.1007\/s11263-009-0209-1","volume":"87","author":"M. Bergtholdt","year":"2010","unstructured":"Bergtholdt, M., Kappes, J., Schmidt, S., & Schn\u00f6rr, C. (2010). A study of parts-based object class detection using complete graphs. International Journal of Computer Vision, 87, 93\u2013117.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR9","volume-title":"Proceedings international conference on computer vision","author":"M. Blank","year":"2005","unstructured":"Blank, M., Gorelick, L., Shechtman, E., Irani, M., & Basri, R. (2005). Actions as space-time shapes. In Proceedings international conference on computer vision."},{"key":"532_CR10","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1007\/s11263-008-0204-y","volume":"87","author":"L. Bo","year":"2010","unstructured":"Bo, L., & Sminchisescu, C. (2010). Twin Gaussian processes for structured prediction. International Journal of Computer Vision, 87, 28\u201352.","journal-title":"International Journal of Computer Vision"},{"issue":"3","key":"532_CR11","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1109\/34.910878","volume":"23","author":"A. Bobick","year":"2001","unstructured":"Bobick, A., & Davis, J. (2001). The recognition of human movement using temporal templates. IEEE Transactions on Pattern Analysis and Machine Intelligence, 23(3), 257\u2013267.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"532_CR12","volume-title":"Proceedings European conference on computer vision","author":"T. Brox","year":"2004","unstructured":"Brox, T., Bruhn, A., Papenberg, N., & Weickert, J. (2004). High accuracy optical flow estimation based on a theory for warping. In Proceedings European conference on computer vision."},{"key":"532_CR13","doi-asserted-by":"crossref","first-page":"140","DOI":"10.1007\/s11263-009-0274-5","volume":"87","author":"M. Brubaker","year":"2010","unstructured":"Brubaker, M., Fleet, D., & Hertzmann, A. (2010). Physics-based person tracking using the anthropomorphic walker. International Journal of Computer Vision, 87, 140\u2013155.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR14","volume-title":"Proceedings international conference on computer vision","author":"L. Campbell","year":"1995","unstructured":"Campbell, L., & Bobick, A. (1995). Recognition of human body motion using phase space constraints. In Proceedings international conference on computer vision."},{"key":"532_CR15","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"J. Chen","year":"2009","unstructured":"Chen, J., Kim, M., Wang, Y., & Ji, Q. (2009). Switching Gaussian process dynamic models for simultaneous composite motion tracking and recognition. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR16","doi-asserted-by":"crossref","first-page":"156","DOI":"10.1007\/s11263-009-0284-3","volume":"87","author":"S. Corazza","year":"2010","unstructured":"Corazza, S., M\u00fcndermann, L., Gambaretto, E., Ferrigno, G., & Andriacchi, T. (2010). Markerless motion capture through visual hull, articulated icp and subject specific model generation. International Journal of Computer Vision, 87, 156\u2013169.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR17","doi-asserted-by":"crossref","first-page":"3042","DOI":"10.1016\/j.patcog.2010.03.018","volume":"43","author":"J. Darby","year":"2010","unstructured":"Darby, J., Li, B., & Costen, N. (2010). Tracking human pose with multiple activity models. Pattern Recognition, 43, 3042\u20133058.","journal-title":"Pattern Recognition"},{"key":"532_CR18","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4684-9393-1","volume-title":"Feynman-Kac formulae. Genealogical and interacting particle systems with applications","author":"P. Moral Del","year":"2004","unstructured":"Del Moral, P. (2004). Feynman-Kac formulae. Genealogical and interacting particle systems with applications. New York: Springer."},{"key":"532_CR19","doi-asserted-by":"crossref","first-page":"2","DOI":"10.1023\/B:VISI.0000043757.18370.9c","volume":"61","author":"J. Deutscher","year":"2005","unstructured":"Deutscher, J., & Reid, I. (2005). Articulated body motion capture by stochastic search. International Journal of Computer Vision, 61,\u00a02.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR20","volume-title":"IEEE international workshop on visual surveillance and performance evaluation of tracking and surveillance (VS-PETS)","author":"P. Dollar","year":"2005","unstructured":"Dollar, P., Rabaud, V., Cottrell, G., & Belongie, S. (2005). Behavior recognition via sparse spatio-temporal features. In IEEE international workshop on visual surveillance and performance evaluation of tracking and surveillance (VS-PETS)."},{"key":"532_CR21","volume-title":"Proceedings international conference on computer vision","author":"A. Efros","year":"2003","unstructured":"Efros, A., Berg, A., Mori, G., & Malik, J. (2003). Recognizing action at a distance. In Proceedings international conference on computer vision."},{"key":"532_CR22","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"A. Elgammal","year":"2004","unstructured":"Elgammal, A., & Lee, C. S. (2004). Inferring 3d body pose from silhouettes using activity manifold learning. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR23","unstructured":"Forsyth, D., Arikan, O., Ikemoto, L., O\u2019Brien, J., & Ramanan, D. (2006). Computational studies of human motion: Part 1, tracking and motion synthesis. Foundations and Trends in Computer Graphics and Vision, 1."},{"key":"532_CR24","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"J. Gall","year":"2008","unstructured":"Gall, J., Rosenhahn, B., & Seidel, H. P. (2008a). Drift-free tracking of rigid and articulated objects. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR25","doi-asserted-by":"crossref","first-page":"319","DOI":"10.1007\/978-1-4020-6693-1_13","volume-title":"Human motion: understanding, modelling, capture and animation","author":"J. Gall","year":"2008","unstructured":"Gall, J., Rosenhahn, B., & Seidel, H. P. (2008b). An introduction to interacting simulated annealing. In Human motion: understanding, modelling, capture and animation (pp. 319\u2013343). Berlin: Springer."},{"key":"532_CR26","first-page":"1746","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"J. Gall","year":"2009","unstructured":"Gall, J., Stoll, C., de Aguiar, E., Theobalt, C., Rosenhahn, B., & Seidel, H. P. (2009). Motion capture using joint skeleton tracking and surface estimation. In Proceedings IEEE conference on computer vision and pattern recognition (pp. 1746\u20131753)."},{"key":"532_CR27","doi-asserted-by":"crossref","first-page":"75","DOI":"10.1007\/s11263-008-0173-1","volume":"87","author":"J. Gall","year":"2010","unstructured":"Gall, J., Rosenhahn, B., Brox, T., & Seidel, H. P. (2010a). Optimization and filtering for human motion capture\u2014a\u00a0multi-layer framework. International Journal of Computer Vision, 87, 75\u201392.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR28","volume-title":"Proceedings European conference on computer vision","author":"J. Gall","year":"2010","unstructured":"Gall, J., Yao, A., & Van Gool, L. (2010b). 2d action recognition serves 3d human pose estimation. In Proceedings European conference on computer vision."},{"key":"532_CR29","doi-asserted-by":"crossref","unstructured":"Gall, J., Yao, A., Razavi, N., Van Gool, L., & Lempitsky, V. (2011). Hough forests for object detection, tracking, and action recognition. IEEE Transactions on Pattern Analysis and Machine Intelligence.","DOI":"10.1109\/TPAMI.2011.70"},{"key":"532_CR30","volume-title":"International workshop on face and gesture recognition","author":"D. Gavrila","year":"1995","unstructured":"Gavrila, D., & Davis, L. (1995). Towards 3-d model-based tracking and recognition of human movement: a multi-view approach. In International workshop on face and gesture recognition."},{"key":"532_CR31","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"A. Geiger","year":"2009","unstructured":"Geiger, A., Urtasun, R., & Darrell, T. (2009). Rank priors for continuous non-linear dimensionality reduction. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR32","volume-title":"Proceedings international conference on computer vision","author":"S. Hou","year":"2007","unstructured":"Hou, S., Galata, A., Caillette, F., Thacker, N., & Bromiley, P. (2007). Real-time body tracking using a Gaussian process latent variable model. In Proceedings international conference on computer vision."},{"key":"532_CR33","doi-asserted-by":"crossref","unstructured":"Husz, Z. L., Wallace, A. M., & Green, P. R. (2011) Behavioural analysis with movement cluster model for concurrent actions. EURASIP Journal on Image and Video Processing.","DOI":"10.1155\/2011\/365307"},{"issue":"2","key":"532_CR34","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1007\/s11263-008-0158-0","volume":"83","author":"T. Jaeggli","year":"2009","unstructured":"Jaeggli, T., Koller-Meier, E., & Van Gool, L. (2009). Learning generative models for multi-activity body pose estimation. International Journal of Computer Vision, 83(2), 121\u2013134.","journal-title":"International Journal of Computer Vision"},{"issue":"2","key":"532_CR35","doi-asserted-by":"crossref","first-page":"365","DOI":"10.1142\/S0219843607001060","volume":"4","author":"O. C. Jenkins","year":"2007","unstructured":"Jenkins, O. C., Serrano, G. G., & Loper, M. M. (2007). Interactive human pose and action recognition using dynamical motion primitives. International Journal of Humanoid Robotics, 4(2), 365\u2013385.","journal-title":"International Journal of Humanoid Robotics"},{"key":"532_CR36","volume-title":"Proceedings international conference on computer vision","author":"H. Jhuang","year":"2007","unstructured":"Jhuang, H., Serre, T., Wolf, L., & Poggio, T. (2007). A biologically inspired system for action recognition. In Proceedings international conference on computer vision."},{"key":"532_CR37","doi-asserted-by":"crossref","first-page":"226","DOI":"10.1109\/34.667881","volume":"20","author":"J. Kittler","year":"1998","unstructured":"Kittler, J., Hatef, M., Duin, R., & Matas, J. (1998). On combining classifiers. IEEE Transactions on Pattern Analysis and Machine Intelligence, 20, 226\u2013239.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"532_CR38","volume-title":"International workshop on sign, gesture, and activity","author":"A. Kl\u00e4ser","year":"2010","unstructured":"Kl\u00e4ser, A., Marsza\u0142ek, M., Schmid, C., & Zisserman, A. (2010). Human focused action localization in video. In International workshop on sign, gesture, and activity."},{"key":"532_CR39","doi-asserted-by":"crossref","first-page":"559","DOI":"10.1145\/1015706.1015760","volume":"23","author":"L. Kovar","year":"2004","unstructured":"Kovar, L., & Gleicher, M. (2004). Automated extraction and parameterization of motions in large data sets. ACM Transactions on Graphics, 23, 559\u2013568.","journal-title":"ACM Transactions on Graphics"},{"key":"532_CR40","volume-title":"Proceedings international conference on computer vision","author":"I. Laptev","year":"2003","unstructured":"Laptev, I., & Lindeberg, T. (2003). Space-time interest points. In Proceedings international conference on computer vision."},{"key":"532_CR41","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"I. Laptev","year":"2008","unstructured":"Laptev, I., Marsza\u0142ek, M., Schmid, C., & Rozenfeld, B. (2008). Learning realistic human actions from movies. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR42","first-page":"1783","volume":"6","author":"N. Lawrence","year":"2005","unstructured":"Lawrence, N. (2005). Probabilistic non-linear principal component analysis with Gaussian process latent variable models. Journal of Machine Learning Research, 6, 1783\u20131816.","journal-title":"Journal of Machine Learning Research"},{"key":"532_CR43","doi-asserted-by":"crossref","first-page":"118","DOI":"10.1007\/s11263-009-0266-5","volume":"87","author":"C. Lee","year":"2010","unstructured":"Lee, C., & Elgammal, A. (2010). Coupled visual and kinematic manifold models for tracking. International Journal of Computer Vision, 87, 118\u2013139.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR44","volume-title":"Proceedings international conference on computer vision","author":"R. Li","year":"2007","unstructured":"Li, R., Tian, T., & Sclaroff, S. (2007). Simultaneous learning of non-linear manifold and dynamical models for high-dimensional time series. In Proceedings international conference on computer vision."},{"key":"532_CR45","doi-asserted-by":"crossref","first-page":"170","DOI":"10.1007\/s11263-009-0283-4","volume":"87","author":"R. Li","year":"2010","unstructured":"Li, R., Tian, T., Sclaroff, S., & Yang, M. (2010). 3d human motion tracking with a coordinated mixture of factor analyzers. International Journal of Computer Vision, 87, 170\u2013190.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR46","volume-title":"Proceedings European conference on computer vision","author":"R. Lin","year":"2006","unstructured":"Lin, R., Liu, C., Yang, M., Ahja, N., & Levinson, S. (2006). Learning nonlinear manifolds from time series. In Proceedings European conference on computer vision."},{"key":"532_CR47","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"J. Liu","year":"2009","unstructured":"Liu, J., Luo, J., & Shah, M. (2009). Recognizing realistic actions from videos \u2018in the wild\u2019. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR48","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"F. Lv","year":"2007","unstructured":"Lv, F., & Nevatia, R. (2007). Single view human action recognition using key pose matching and Viterbi path searching. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR49","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"S. Maji","year":"2011","unstructured":"Maji, S., Bourdev, L., & Malik, J. (2011). Action recognition from a distributed representation of pose and appearance. In Proceedings IEEE conference on computer vision and pattern recognition."},{"issue":"3","key":"532_CR50","doi-asserted-by":"crossref","first-page":"311","DOI":"10.1109\/TSMCC.2007.893280","volume":"37","author":"S. Mitra","year":"2007","unstructured":"Mitra, S., & Acharya, T. (2007). Gesture recognition: a\u00a0survey. IEEE Transactions on Systems, Man and Cybernetics - Part\u00a0C, 37(3), 311\u2013324.","journal-title":"IEEE Transactions on Systems, Man and Cybernetics - Part\u00a0C"},{"issue":"2","key":"532_CR51","doi-asserted-by":"crossref","first-page":"90","DOI":"10.1016\/j.cviu.2006.08.002","volume":"104","author":"T. Moeslund","year":"2006","unstructured":"Moeslund, T., Hilton, A., & Kr\u00fcger, V. (2006). A survey of advances in vision-based human motion capture and analysis. Computer Vision and Image Understanding, 104(2), 90\u2013126.","journal-title":"Computer Vision and Image Understanding"},{"key":"532_CR52","first-page":"198","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"K. Moon","year":"2006","unstructured":"Moon, K., & Pavlovic, V. (2006). Impact of dynamics on subspace embedding and tracking of sequences. In Proceedings IEEE conference on computer vision and pattern recognition (pp. 198\u2013205)."},{"key":"532_CR53","doi-asserted-by":"crossref","first-page":"677","DOI":"10.1145\/1073204.1073247","volume":"24","author":"M. M\u00fcller","year":"2005","unstructured":"M\u00fcller, M., R\u00f6der, T., & Clausen, M. (2005). Efficient content-based retrieval of motion capture data. ACM Transactions on Graphics, 24, 677\u2013685.","journal-title":"ACM Transactions on Graphics"},{"key":"532_CR54","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"P. Natarajan","year":"2010","unstructured":"Natarajan, P., Singh, V., & Nevatia, R. (2010). Learning 3d action models from a few 2d videos for view invariant action recognition. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR55","first-page":"981","volume-title":"Neural information processing systems","author":"V. Pavlovic","year":"2000","unstructured":"Pavlovic, V., Rehg, J., & Maccormick, J. (2000). Learning switching linear models of human motion. In Neural information processing systems (pp. 981\u2013987)."},{"key":"532_CR56","doi-asserted-by":"crossref","first-page":"53","DOI":"10.1007\/s11263-009-0205-5","volume":"87","author":"P. Peursum","year":"2010","unstructured":"Peursum, P., Venkatesh, S., & West, G. (2010). A study on smoothing for particle-filtered 3d human body tracking. International Journal of Computer Vision, 87, 53\u201374.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR57","doi-asserted-by":"crossref","unstructured":"Poppe, R. (2010). A survey on vision-based human action recognition. Image and Vision Computing.","DOI":"10.1016\/j.imavis.2009.11.014"},{"issue":"2","key":"532_CR58","doi-asserted-by":"crossref","first-page":"203","DOI":"10.1023\/A:1020350100748","volume":"50","author":"C. Rao","year":"2002","unstructured":"Rao, C., Yilmaz, A., & Shah, M. (2002). View-invariant representation and recognition of actions. International Journal of Computer Vision, 50(2), 203\u2013226.","journal-title":"International Journal of Computer Vision"},{"issue":"4","key":"532_CR59","doi-asserted-by":"crossref","first-page":"503","DOI":"10.1016\/j.cviu.2010.12.002","volume":"115","author":"L. Raskin","year":"2011","unstructured":"Raskin, L., Rudzsky, M., & Rivlin, E. (2011). Dimensionality reduction using a Gaussian process annealed particle filter for tracking and classification of articulated body motions. Computer Vision and Image Understanding, 115(4), 503\u2013519.","journal-title":"Computer Vision and Image Understanding"},{"key":"532_CR60","volume-title":"Gaussian processes for machine learning","author":"C. Rasmussen","year":"2006","unstructured":"Rasmussen, C., & Williams, C. (2006). Gaussian processes for machine learning. Cambridge: MIT Press."},{"key":"532_CR61","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"M. Rodriguez","year":"2008","unstructured":"Rodriguez, M., Ahmed, J., & Shah, M. (2008). Action Mach: a spatio-temporal maximum average correlation height filter for action recognition. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR62","volume-title":"Neural information processing systems","author":"R. Rosales","year":"2001","unstructured":"Rosales, R., & Sclaroff, S. (2001). Learning body pose via specialized maps. In Neural information processing systems."},{"key":"532_CR63","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"B. Rosenhahn","year":"2007","unstructured":"Rosenhahn, B., Brox, T., & Seidel, H. P. (2007). Scaled motion dynamics for markerless motion capture. In Proceedings IEEE conference on computer vision and pattern recognition."},{"issue":"5500","key":"532_CR64","doi-asserted-by":"crossref","first-page":"2323","DOI":"10.1126\/science.290.5500.2323","volume":"290","author":"S. Roweis","year":"2000","unstructured":"Roweis, S., & Saul, L. (2000). Nonlinear dimensionality reduction by locally Linear embedding. Science, 290(5500), 2323\u20132326.","journal-title":"Science"},{"key":"532_CR65","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"K. Schindler","year":"2008","unstructured":"Schindler, K., & Van Gool, L. (2008). Action snippets: how many frames does human action recognition require. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR66","first-page":"1","volume-title":"Machine vision and applications","author":"C. Schmaltz","year":"2011","unstructured":"Schmaltz, C., Rosenhahn, B., Brox, T., & Weickert, J. (2011). Region-based pose tracking with occlusions using 3d models. In Machine vision and applications (pp. 1\u201321)."},{"key":"532_CR67","volume-title":"Proceedings international conference on pattern recognition","author":"C. Schuldt","year":"2004","unstructured":"Schuldt, C., Laptev, I., & Caputo, B. (2004). Recognizing human actions: a local svm approach. In Proceedings international conference on pattern recognition."},{"key":"532_CR68","volume-title":"IEEE workshop on applications of computer vision","author":"M. Shaheen","year":"2009","unstructured":"Shaheen, M., Gall, J., Strzodka, R., Van Gool, L., & Seidel, H. P. (2009). A comparison of 3d model-based tracking approaches for human motion capture in uncontrolled environments. In IEEE workshop on applications of computer vision."},{"key":"532_CR69","volume-title":"Proceedings European conference on computer vision","author":"H. Sidenbladh","year":"2000","unstructured":"Sidenbladh, H., Black, M., & Fleet, D. (2000). Stochastic tracking of 3d human figures using 2d image motion. In Proceedings European conference on computer vision."},{"key":"532_CR70","first-page":"784","volume-title":"Proceedings European conference on computer vision","author":"H. Sidenbladh","year":"2002","unstructured":"Sidenbladh, H., Black, M., & Sigal, L. (2002). Implicit probabilistic models of human motion for synthesis and tracking. In Proceedings European conference on computer vision (pp. 784\u2013800)."},{"issue":"1\u20132","key":"532_CR71","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1007\/s11263-009-0273-6","volume":"87","author":"L. Sigal","year":"2010","unstructured":"Sigal, L., Balan, A., & Black, M. (2010). Humaneva: synchronized video and motion capture dataset and baseline algorithm for evaluation of articulated human motion. International Journal of Computer Vision, 87(1\u20132), 4\u201327.","journal-title":"International Journal of Computer Vision"},{"key":"532_CR72","volume-title":"Proceedings international conference on machine learning","author":"C. Sminchisescu","year":"2004","unstructured":"Sminchisescu, C., & Jepson, A. (2004). Generative modeling for continuous non-linearly embedded visual inference. In Proceedings international conference on machine learning."},{"issue":"11","key":"532_CR73","doi-asserted-by":"crossref","first-page":"2030","DOI":"10.1109\/TPAMI.2007.1111","volume":"29","author":"C. Sminchisescu","year":"2007","unstructured":"Sminchisescu, C., Kanaujia, A., & Metaxas, D. (2007). Bm3e: discriminative density propagation for visual tracking. IEEE Transactions on Pattern Analysis and Machine Intelligence, 29(11), 2030\u20132044.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"532_CR74","first-page":"222","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"L. Taycher","year":"2006","unstructured":"Taycher, L., Demirdjian, D., Darrell, T., & Shakhnarovich, G. (2006). Conditional random people: tracking humans with crfs and grid filters. In Proceedings IEEE conference on computer vision and pattern recognition (pp. 222\u2013229)."},{"key":"532_CR75","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"G. Taylor","year":"2010","unstructured":"Taylor, G., Sigal, L., Fleet, D., & Hinton, G. (2010). Dynamical binary latent variable models for 3d human pose tracking. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR76","volume-title":"A global geometric framework for nonlinear dimensionality reduction","author":"J. Tenenbaum","year":"2000","unstructured":"Tenenbaum, J., de Silva, V., & Langford, J. (2000). A global geometric framework for nonlinear dimensionality reduction. Chicago: Science."},{"key":"532_CR77","volume-title":"IEEE workshop on tracking humans for the evaluation of their motion in image sequences","author":"M. Tenorth","year":"2009","unstructured":"Tenorth, M., Bandouch, J., & Beetz, M. (2009). The TUM kitchen data set of everyday manipulation activities for motion tracking and action recognition. In IEEE workshop on tracking humans for the evaluation of their motion in image sequences."},{"key":"532_CR78","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"C. Thurau","year":"2008","unstructured":"Thurau, C., & Hlavac, V. (2008). Pose primitive based human action recognition in videos or still images. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR79","volume-title":"Proceedings international conference on computer vision","author":"N. Ukita","year":"2009","unstructured":"Ukita, N., Hirai, M., & Kidode, M. (2009). Complex volume and pose tracking with probabilistic dynamical model and visual hull constraint. In Proceedings international conference on computer vision."},{"key":"532_CR80","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"R. Urtasun","year":"2006","unstructured":"Urtasun, R., Fleet, D., & Fua, P. (2006). 3d people tracking with Gaussian process dynamical models. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR81","volume-title":"Proceedings international conference on computer vision","author":"R. Urtasun","year":"2005","unstructured":"Urtasun, R., Fleet, D., Hertzman, A., & Fua, P. (2005). Priors for people tracking from small training sets. In Proceedings international conference on computer vision."},{"issue":"2","key":"532_CR82","doi-asserted-by":"crossref","first-page":"283","DOI":"10.1109\/TPAMI.2007.1167","volume":"30","author":"J. Wang","year":"2008","unstructured":"Wang, J., Fleet, D., & Hertzmann, A. (2008). Gaussian process dynamical models for human motion. IEEE Transactions on Pattern Analysis and Machine Intelligence, 30(2), 283\u2013298.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"532_CR83","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"D. Weinland","year":"2008","unstructured":"Weinland, D., & Boyer, E. (2008). Action recognition using exemplar-based embedding. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR84","volume-title":"Proceedings international conference on computer vision","author":"D. Weinland","year":"2007","unstructured":"Weinland, D., Boyer, E., & Ronfard, R. (2007). Action recognition from arbitrary views using 3d exemplars. In Proceedings international conference on computer vision."},{"key":"532_CR85","volume-title":"Proceedings British machine vision conference","author":"G. Willems","year":"2009","unstructured":"Willems, G., Becker, J., Tuytelaars, T., & Van Gool, L. (2009). Exemplar-based action recognition in video. In Proceedings British machine vision conference."},{"issue":"2","key":"532_CR86","doi-asserted-by":"crossref","first-page":"232","DOI":"10.1006\/cviu.1998.0726","volume":"73","author":"Y. Yacoob","year":"1999","unstructured":"Yacoob, Y., & Black, M. (1999). Parameterized modeling and recognition of activities. Computer Vision and Image Understanding, 73(2), 232\u2013247.","journal-title":"Computer Vision and Image Understanding"},{"key":"532_CR87","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"W. Yang","year":"2010","unstructured":"Yang, W., Wang, Y., & Mori, G. (2010). Recognizing human actions from still images with latent poses. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR88","volume-title":"Proceedings IEEE conference on computer vision and pattern recognition","author":"A. Yao","year":"2010","unstructured":"Yao, A., Gall, J., & Van Gool, L. (2010). A hough transform-based voting framework for action recognition. In Proceedings IEEE conference on computer vision and pattern recognition."},{"key":"532_CR89","volume-title":"Proceedings British machine vision conference","author":"A. Yao","year":"2011","unstructured":"Yao, A., Gall, J., Fanelli, G., & Van Gool, L. (2011). Does human action recognition benefit from pose estimation. In Proceedings British machine vision conference."},{"key":"532_CR90","volume-title":"Proceedings international conference on computer vision","author":"A. Yilmaz","year":"2005","unstructured":"Yilmaz, A., & Shah, M. (2005). Recognizing human actions in videos acquired by uncalibrated moving cameras. In Proceedings international conference on computer vision."}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-012-0532-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11263-012-0532-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-012-0532-9","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,29]],"date-time":"2019-06-29T02:35:40Z","timestamp":1561775740000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11263-012-0532-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,5,30]]},"references-count":90,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2012,10]]}},"alternative-id":["532"],"URL":"https:\/\/doi.org\/10.1007\/s11263-012-0532-9","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,5,30]]}}}