{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T16:02:36Z","timestamp":1761580956187},"reference-count":61,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2012,1,31]],"date-time":"2012-01-31T00:00:00Z","timestamp":1327968000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2012,8]]},"DOI":"10.1007\/s11263-012-0516-9","type":"journal-article","created":{"date-parts":[[2012,1,30]],"date-time":"2012-01-30T18:53:24Z","timestamp":1327949604000},"page":"25-52","source":"Crossref","is-referenced-by-count":20,"title":["Fast Human Pose Detection Using Randomized Hierarchical Cascades of Rejectors"],"prefix":"10.1007","volume":"99","author":[{"given":"Gr\u00e9gory","family":"Rogez","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jonathan","family":"Rihan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Carlos","family":"Orrite-Uru\u00f1uela","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Philip H. S.","family":"Torr","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2012,1,31]]},"reference":[{"issue":"1","key":"516_CR1","doi-asserted-by":"crossref","first-page":"44","DOI":"10.1109\/TPAMI.2006.21","volume":"28","author":"A. Agarwal","year":"2006","unstructured":"Agarwal, A., & Triggs, B. (2006). Recovering 3d human pose from monocular images. IEEE Transactions on Pattern Analysis and Machine Intelligence, 28(1), 44\u201358.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"516_CR2","volume-title":"CVPR","author":"M. Andriluka","year":"2009","unstructured":"Andriluka, M., Roth, S., & Schiele, B. (2009). Pictorial structures revisited: People detection and articulated pose estimation. In CVPR."},{"key":"516_CR3","first-page":"623","volume-title":"CVPR","author":"M. Andriluka","year":"2010","unstructured":"Andriluka, M., Roth, S., & Schiele, B. (2010). Monocular 3d pose estimation and tracking by detection. In CVPR (pp.\u00a0623\u2013630)."},{"issue":"1\u20132","key":"516_CR4","doi-asserted-by":"crossref","first-page":"93","DOI":"10.1007\/s11263-009-0209-1","volume":"87","author":"M. Bergtholdt","year":"2010","unstructured":"Bergtholdt, M., Kappes, J. H., Schmidt, S., & Schn\u00f6rr, C. (2010). A\u00a0study of parts-based object class detection using complete graphs. International Journal of Computer Vision, 87(1\u20132), 93\u2013117.","journal-title":"International Journal of Computer Vision"},{"key":"516_CR5","first-page":"169","volume-title":"NIPS","author":"A. Bissacco","year":"2006","unstructured":"Bissacco, A., Yang, M. H., & Soatto, S. (2006). Detecting humans via their pose. In NIPS (pp.\u00a0169\u2013176)."},{"key":"516_CR6","volume-title":"CVPR","author":"A. Bissacco","year":"2007","unstructured":"Bissacco, A., Yang, M. H., & Soatto, S. (2007). Fast human pose estimation using appearance and motion via multi-dimensional boosting regression. In CVPR."},{"key":"516_CR7","volume-title":"Morphometric tools for landmark data: geometry and biology","author":"F. Bookstein","year":"1991","unstructured":"Bookstein, F. (1991). Morphometric tools for landmark data: geometry and biology. Cambridge: Cambridge University Press."},{"key":"516_CR8","volume-title":"ICCV","author":"A. Bosch","year":"2007","unstructured":"Bosch, A., Zisserman, A., & Munoz, X. (2007). Image classification using random forests and ferns. In ICCV."},{"key":"516_CR9","volume-title":"ICCV","author":"L. Bourdev","year":"2009","unstructured":"Bourdev, L., & Malik, J. (2009). Poselets: Body part detectors trained using 3d human pose annotations. In ICCV."},{"key":"516_CR10","first-page":"123","volume":"24","author":"L. Breiman","year":"1996","unstructured":"Breiman, L. (1996). Bagging predictors. Machine Learning, 24, 123\u2013140.","journal-title":"Machine Learning"},{"issue":"1","key":"516_CR11","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L. Breiman","year":"2001","unstructured":"Breiman, L. (2001). Random forests. Machine Learning, 45(1), 5\u201332.","journal-title":"Machine Learning"},{"key":"516_CR12","first-page":"44","volume-title":"ECCV","author":"G. J. Brostow","year":"2008","unstructured":"Brostow, G. J., Shotton, J., Fauqueur, J., & Cipolla, R. (2008). Segmentation and recognition using structure from motion point clouds. In ECCV (pp. 44\u201357)."},{"key":"516_CR13","volume-title":"ICCV","author":"R. Collins","year":"2003","unstructured":"Collins, R., & Liu, Y. (2003). On-line selection of discriminative tracking features. In ICCV."},{"key":"516_CR14","first-page":"886","volume-title":"CVPR","author":"N. Dalal","year":"2005","unstructured":"Dalal, N., & Triggs, B. (2005). Histograms of oriented gradients for human detection. In CVPR (pp.\u00a0886\u2013893)."},{"key":"516_CR15","doi-asserted-by":"crossref","first-page":"253","DOI":"10.1145\/997817.997857","volume-title":"Proc. of the 20th annual symposium on computational geometry","author":"M. Datar","year":"2004","unstructured":"Datar, M., Immorlica, N., Indyk, P., & Mirrokni, V. (2004). Locality-sensitive hashing scheme based on p-stable distributions. In Proc. of the 20th annual symposium on computational geometry (pp.\u00a0253\u2013262)."},{"key":"516_CR16","volume-title":"CVPR","author":"T. Deselaers","year":"2007","unstructured":"Deselaers, T., Criminisi, A., Winn, J. M., & Agarwal, A. (2007). Incorporating on-demand stereo for real time recognition. In CVPR."},{"issue":"2","key":"516_CR17","doi-asserted-by":"crossref","first-page":"127","DOI":"10.1016\/j.cviu.2006.07.007","volume":"104","author":"M. Dimitrijevic","year":"2006","unstructured":"Dimitrijevic, M., Lepetit, V., & Fua, P. (2006). Human body pose detection using bayesian spatio-temporal templates. Computer Vision and Image Understanding, 104(2), 127\u2013139.","journal-title":"Computer Vision and Image Understanding"},{"issue":"3","key":"516_CR18","doi-asserted-by":"crossref","first-page":"520","DOI":"10.1109\/TPAMI.2008.101","volume":"31","author":"A. M. Elgammal","year":"2009","unstructured":"Elgammal, A. M., & Lee, C. S. (2009). Tracking people on a torus. IEEE Transactions on Pattern Analysis and Machine Intelligence, 31(3), 520\u2013538.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"1","key":"516_CR19","doi-asserted-by":"crossref","first-page":"55","DOI":"10.1023\/B:VISI.0000042934.15159.49","volume":"61","author":"P. F. Felzenszwalb","year":"2005","unstructured":"Felzenszwalb, P. F., & Huttenlocher, D. P. (2005). Pictorial structures for object recognition. International Journal of Computer Vision, 61(1), 55\u201379.","journal-title":"International Journal of Computer Vision"},{"key":"516_CR20","first-page":"2241","volume-title":"CVPR","author":"P. F. Felzenszwalb","year":"2010","unstructured":"Felzenszwalb, P. F., Girshick, R. B., & McAllester, D. A. (2010). Cascade object detection with deformable part models. In CVPR (pp.\u00a02241\u20132248)."},{"key":"516_CR21","volume-title":"CVPR","author":"V. Ferrari","year":"2008","unstructured":"Ferrari, V., Marn-Jimnez, M. J., & Zisserman, A. (2008). Progressive search space reduction for human pose estimation. In CVPR."},{"key":"516_CR22","volume-title":"CVPR","author":"A. Fossati","year":"2007","unstructured":"Fossati, A., Dimitrijevic, M., Lepetit, V., & Fua, P. (2007). Bridging the gap between detection and tracking for 3d monocular video-based motion capture. In CVPR."},{"issue":"1\u20132","key":"516_CR23","doi-asserted-by":"crossref","first-page":"75","DOI":"10.1007\/s11263-008-0173-1","volume":"87","author":"J. Gall","year":"2010","unstructured":"Gall, J., Rosenhahn, B., Brox, T., & Seidel, H. P. (2010). Optimization and filtering for human motion capture. International Journal of Computer Vision, 87(1\u20132), 75\u201392.","journal-title":"International Journal of Computer Vision"},{"issue":"8","key":"516_CR24","doi-asserted-by":"crossref","first-page":"1408","DOI":"10.1109\/TPAMI.2007.1062","volume":"29","author":"D. M. Gavrila","year":"2007","unstructured":"Gavrila, D. M. (2007). A bayesian, exemplar-based approach to hierarchical shape matching. IEEE Transactions on Pattern Analysis and Machine Intelligence, 29(8), 1408\u20131421.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"516_CR25","unstructured":"Gross, R., & Shi, J. (2001). The cmu motion of body (mobo) database. Robotics Institute, Carnegie Mellon University, Pittsburgh, PA."},{"issue":"2","key":"516_CR26","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1007\/s11263-008-0158-0","volume":"83","author":"T. Jaeggli","year":"2009","unstructured":"Jaeggli, T., Koller-Meier, E., & Gool, L. J. V. (2009). Learning generative models for multi-activity body pose estimation. International Journal of Computer Vision, 83(2), 121\u2013134.","journal-title":"International Journal of Computer Vision"},{"key":"516_CR27","first-page":"46","volume-title":"FG","author":"T. Kanade","year":"2000","unstructured":"Kanade, T., Cohn, J. F., & Tian, Y. (2000). Comprehensive database for facial expression analysis. In FG (pp.\u00a046\u201353)."},{"issue":"5","key":"516_CR28","doi-asserted-by":"crossref","first-page":"535","DOI":"10.1016\/j.imavis.2008.08.010","volume":"27","author":"I. Laptev","year":"2009","unstructured":"Laptev, I. (2009). Improving object detection with boosted histograms. Image and Vision Computing, 27(5), 535\u2013544.","journal-title":"Image and Vision Computing"},{"issue":"1\u20132","key":"516_CR29","doi-asserted-by":"crossref","first-page":"118","DOI":"10.1007\/s11263-009-0266-5","volume":"87","author":"C. S. Lee","year":"2010","unstructured":"Lee, C. S., & Elgammal, AM (2010). Coupled visual and kinematic manifold models for tracking. International Journal of Computer Vision, 87(1\u20132), 118\u2013139.","journal-title":"International Journal of Computer Vision"},{"issue":"9","key":"516_CR30","doi-asserted-by":"crossref","first-page":"1465","DOI":"10.1109\/TPAMI.2006.188","volume":"28","author":"V. Lepetit","year":"2006","unstructured":"Lepetit, V., & Fua, P. (2006). Keypoint recognition using randomized trees. IEEE Transactions on Pattern Analysis and Machine Intelligence, 28(9), 1465\u20131479.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"4","key":"516_CR31","doi-asserted-by":"crossref","first-page":"604","DOI":"10.1109\/TPAMI.2009.204","volume":"32","author":"Z. Lin","year":"2010","unstructured":"Lin, Z., & Davis, L. S. (2010). Shape-based human detection and segmentation via hierarchical part-template matching. IEEE Transactions on Pattern Analysis and Machine Intelligence, 32(4), 604\u2013618.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"2","key":"516_CR32","doi-asserted-by":"crossref","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"D. G. Lowe","year":"2004","unstructured":"Lowe, D. G. (2004). Distinctive image features from scale-invariant keypoints. International Journal of Computer Vision, 60(2), 91\u2013110.","journal-title":"International Journal of Computer Vision"},{"issue":"2","key":"516_CR33","doi-asserted-by":"crossref","first-page":"152","DOI":"10.1016\/S1007-0214(05)70047-X","volume":"10","author":"Y. Ma","year":"2005","unstructured":"Ma, Y., & Ding, X. (2005). Real-time multi-view face detection and pose estimation based on cost-sensitive adaboost. Tsinghua Science and Technology, 10(2), 152\u2013157.","journal-title":"Tsinghua Science and Technology"},{"issue":"9","key":"516_CR34","doi-asserted-by":"crossref","first-page":"1632","DOI":"10.1109\/TPAMI.2007.70822","volume":"30","author":"F. Moosmann","year":"2008","unstructured":"Moosmann, F., Nowak, E., & Jurie, F. (2008). Randomized clustering forests for image classification. IEEE Transactions on Pattern Analysis and Machine Intelligence, 30(9), 1632\u20131646.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"7","key":"516_CR35","doi-asserted-by":"crossref","first-page":"1052","DOI":"10.1109\/TPAMI.2006.149","volume":"28","author":"G. Mori","year":"2006","unstructured":"Mori, G., & Malik, J. (2006). Recovering 3d human body configurations using shape contexts. IEEE Transactions on Pattern Analysis and Machine Intelligence, 28(7), 1052\u20131062.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"516_CR36","volume-title":"BMVC","author":"R. Navaratnam","year":"2005","unstructured":"Navaratnam, R., Thayananthan, A., Torr, P., & Cipolla, R. (2005). Hierarchical part-based human body pose estimation. In BMVC."},{"key":"516_CR37","first-page":"434","volume-title":"ECCV","author":"R. Okada","year":"2008","unstructured":"Okada, R., & Soatto, S. (2008). Relevant feature selection for human pose estimation and localization in cluttered images. In ECCV (pp.\u00a0434\u2013445)."},{"issue":"7","key":"516_CR38","doi-asserted-by":"crossref","first-page":"1855","DOI":"10.1093\/ietisy\/e91-d.7.1855","volume":"91","author":"R. Okada","year":"2008","unstructured":"Okada, R., & Stenger, B. (2008). A single camera motion capture system for human-computer interaction. IEICE Transactions on Information and Systems, 91(7), 1855\u20131862.","journal-title":"IEICE Transactions on Information and Systems"},{"key":"516_CR39","first-page":"176","volume-title":"IbPRIA","author":"C. Orrite","year":"2009","unstructured":"Orrite, C., Ga\u00f1\u00e1n, A., & Rogez, G. (2009). Hog-based decision tree for facial expression classification. In IbPRIA (pp.\u00a0176\u2013183)."},{"key":"516_CR40","first-page":"291","volume-title":"ECCV","author":"T. Roberts","year":"2004","unstructured":"Roberts, T., McKenna, S., & Ricketts, I. (2004). Human pose estimation using learnt probabilistic region similarities and partial configurations. In ECCV (pp.\u00a0291\u2013303)."},{"key":"516_CR41","doi-asserted-by":"crossref","unstructured":"Rogez, G., Orrite, C., & Mart\u00ednez, J. (2008a). A spatio-temporal 2d-models framework for human pose recovery in monocular sequences. Pattern Recognition.","DOI":"10.1016\/j.patcog.2008.02.012"},{"key":"516_CR42","first-page":"1","volume-title":"CVPR","author":"G. Rogez","year":"2008","unstructured":"Rogez, G., Rihan, J., Ramalingam, S., Orrite, C., & Torr, P. H. (2008b). Randomized trees for human pose detection. In CVPR (pp.\u00a01\u20138)."},{"key":"516_CR43","volume-title":"CVPR07","author":"P. Sabzmeydani","year":"2007","unstructured":"Sabzmeydani, P., & Mori, G. (2007). Detecting pedestrians by learning shapelet features. In CVPR07."},{"key":"516_CR44","volume-title":"ICCV","author":"G. Shakhnarovich","year":"2003","unstructured":"Shakhnarovich, G., Viola, P., & Darrell, R. (2003). Fast pose estimation with parameter-sensitive hashing. In ICCV."},{"key":"516_CR45","volume-title":"CVPR","author":"J. Shotton","year":"2008","unstructured":"Shotton, J., Johnson, M., Cipolla, R., Center, T., & Kawasaki, J. (2008). Semantic texton forests for image categorization and segmentation. In CVPR."},{"key":"516_CR46","volume-title":"CVPR","author":"J. Shotton","year":"2011","unstructured":"Shotton, J., Fitzgibbon, A., Cook, M., Sharp, T., Finocchio, M., Moore, R., Kipman, A., & Blake, A. (2011). Real-time human pose recognition in parts from single depth images. In CVPR."},{"issue":"1\u20132","key":"516_CR47","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/s11263-009-0293-2","volume":"87","author":"L. Sigal","year":"2010","unstructured":"Sigal, L., & Black, M. J. (2010). Guest editorial: State of the art in image- and video-based human pose and motion estimation. International Journal of Computer Vision, 87(1\u20132), 1\u20133.","journal-title":"International Journal of Computer Vision"},{"issue":"1\u20132","key":"516_CR48","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1007\/s11263-009-0273-6","volume":"87","author":"L. Sigal","year":"2010","unstructured":"Sigal, L., Balan, A. O., & Black, M. J. (2010). Humaneva: Synchronized video and motion capture dataset and baseline algorithm for evaluation of articulated human motion. International Journal of Computer Vision, 87(1\u20132), 4\u201327.","journal-title":"International Journal of Computer Vision"},{"key":"516_CR49","first-page":"1743","volume-title":"CVPR (2)","author":"C. Sminchisescu","year":"2006","unstructured":"Sminchisescu, C., Kanaujia, A., & Metaxas, D. N. (2006). Learning joint top-down and bottom-up processes for 3d visual inference. In CVPR (2) (pp.\u00a01743\u20131752)."},{"key":"516_CR50","unstructured":"Stenger, B. (2004). Model-based hand tracking using a hierarchical bayesian filter. PhD thesis, Department of Engineering, University of Cambridge."},{"key":"516_CR51","doi-asserted-by":"crossref","first-page":"932","DOI":"10.1007\/978-3-540-77129-6_78","volume-title":"Proc. of the 2nd Pacific Rim conference on advances in image and video technology","author":"H. Sugano","year":"2007","unstructured":"Sugano, H., & Miyamoto, R. (2007). A real-time object recognition system on cell broadband engine. In Proc. of the 2nd Pacific Rim conference on advances in image and video technology (pp.\u00a0932\u2013943)."},{"key":"516_CR52","first-page":"124","volume-title":"ECCV (3)","author":"A. Thayananthan","year":"2006","unstructured":"Thayananthan, A., Navaratnam, R., Stenger, B., Torr, P. H. S., & Cipolla, R. (2006). Multivariate relevance vector machines for tracking. In ECCV (3) (pp.\u00a0124\u2013138)."},{"issue":"1","key":"516_CR53","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1023\/A:1014899027014","volume":"48","author":"K. Toyama","year":"2002","unstructured":"Toyama, K., & Blake, A. (2002). Probabilistic tracking with exemplars in a metric space. International Journal of Computer Vision, 48(1), 9\u201319.","journal-title":"International Journal of Computer Vision"},{"key":"516_CR54","first-page":"128","volume-title":"IbPRIA","author":"M. Villamizar","year":"2009","unstructured":"Villamizar, M., Sanfeliu, A., & Andrade-Cetto, J. (2009). Local boosted features for pedestrian detection. In IbPRIA (pp.\u00a0128\u2013135)."},{"key":"516_CR55","unstructured":"Viola, P., & Jones, M. (2002). Robust real-time object detection. International Journal of Computer Vision."},{"issue":"2","key":"516_CR56","doi-asserted-by":"crossref","first-page":"153","DOI":"10.1007\/s11263-005-6644-8","volume":"63","author":"P. Viola","year":"2005","unstructured":"Viola, P., Jones, M. J., & Snow, D. (2005). Detecting pedestrians using patterns of motion and appearance. International Journal of Computer Vision, 63(2), 153\u2013161.","journal-title":"International Journal of Computer Vision"},{"key":"516_CR57","first-page":"90","volume-title":"ICCV","author":"B. Wu","year":"2005","unstructured":"Wu, B., & Nevatia, R. (2005). Detection of multiple, partially occluded humans in a single image by bayesian combination of edgelet part detectors. In ICCV (pp.\u00a090\u201397)."},{"key":"516_CR58","first-page":"329","volume-title":"MLMI","author":"P. Zehnder","year":"2005","unstructured":"Zehnder, P., Koller-Meier, E., & Van Gool, L. (2005). A hierarchical system for recognition, tracking and pose estimation. In MLMI (pp.\u00a0329\u2013340)."},{"key":"516_CR59","first-page":"1","volume-title":"CVPR","author":"J. Zhang","year":"2007","unstructured":"Zhang, J., Zhou, S., McMillan, L., & Comaniciu, D. (2007). Joint real-time object detection and pose estimation using probabilistic boosting network. In CVPR (pp.\u00a01\u20138)."},{"key":"516_CR60","doi-asserted-by":"crossref","first-page":"149","DOI":"10.1109\/AFGR.2002.1004147","volume-title":"Proc. int\u2019l conf. automatic face and gesture recognition","author":"Z. Zhang","year":"2002","unstructured":"Zhang, Z., Zhu, L., Li, S., & Zhang, H. (2002). Real-time multi-view face detection. In Proc. int\u2019l conf. automatic face and gesture recognition (pp.\u00a0149\u2013154)."},{"key":"516_CR61","first-page":"1491","volume-title":"CVPR","author":"Q. Zhu","year":"2006","unstructured":"Zhu, Q., Avidan, S., Yeh, M. C., & Cheng, K. T. (2006). Fast human detection using a cascade of histograms of oriented gradients. In CVPR (pp.\u00a01491\u20131498)."}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-012-0516-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11263-012-0516-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-012-0516-9","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,12,27]],"date-time":"2021-12-27T08:41:44Z","timestamp":1640594504000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11263-012-0516-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,1,31]]},"references-count":61,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2012,8]]}},"alternative-id":["516"],"URL":"https:\/\/doi.org\/10.1007\/s11263-012-0516-9","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,1,31]]}}}