{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T15:49:57Z","timestamp":1775317797054,"version":"3.50.1"},"publisher-location":"Cham","reference-count":53,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030012489","type":"print"},{"value":"9783030012496","type":"electronic"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-030-01249-6_5","type":"book-chapter","created":{"date-parts":[[2018,10,5]],"date-time":"2018-10-05T11:35:46Z","timestamp":1538739346000},"page":"69-86","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":246,"title":["Exploiting Temporal Information for 3D Human Pose Estimation"],"prefix":"10.1007","author":[{"given":"Mir Rayat Imtiaz","family":"Hossain","sequence":"first","affiliation":[]},{"given":"James J.","family":"Little","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,10,6]]},"reference":[{"key":"5_CR1","unstructured":"Sutskever, I., Vinyals, O., Le, Q.V.: Sequence to sequence learning with neural networks. In: Advances in neural information processing systems (NIPS), pp. 3104\u20133112 (2014)"},{"key":"5_CR2","unstructured":"Agarwal, A., Triggs, B.: 3D human pose from silhouettes by relevance vector regression. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2004)"},{"issue":"7","key":"5_CR3","doi-asserted-by":"publisher","first-page":"1052","DOI":"10.1109\/TPAMI.2006.149","volume":"28","author":"G Mori","year":"2006","unstructured":"Mori, G., Malik, J.: Recovering 3D human body configurations using shape contexts. IEEE Trans Pattern Anal. Mach. Intell. (TPAMI) 28(7), 1052\u20131062 (2006)","journal-title":"IEEE Trans Pattern Anal. Mach. Intell. (TPAMI)"},{"key":"5_CR4","doi-asserted-by":"crossref","unstructured":"Bo, L.F., Sminchisescu, C., Kanaujia, A., Metaxas, D.N.: Fast algorithms for large scale conditional 3D prediction. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1\u20138 (2008)","DOI":"10.1109\/CVPR.2008.4587578"},{"key":"5_CR5","doi-asserted-by":"crossref","unstructured":"Shakhnarovich, G., Viola, P.A., Darrell, T.J.: Fast pose estimation with parameter-sensitive hashing. In: IEEE International Conference on Computer Vision (ICCV) (2003)","DOI":"10.1109\/ICCV.2003.1238424"},{"key":"5_CR6","doi-asserted-by":"crossref","unstructured":"Tekin, B., Katircioglu, I., Salzmann, M., Lepetit, V., Fua, P.: Structured prediction of 3D human pose with deep neural networks. In: British Machine Vision Conference (BMVC) (2016)","DOI":"10.5244\/C.30.130"},{"key":"5_CR7","doi-asserted-by":"crossref","unstructured":"Pavlakos, G., Zhou, X., Derpanis, K.G., Daniilidis, K.: Coarse-to-fine volumetric prediction for single-image 3D human pose. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2017)","DOI":"10.1109\/CVPR.2017.139"},{"key":"5_CR8","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"332","DOI":"10.1007\/978-3-319-16808-1_23","volume-title":"Computer Vision \u2013 ACCV 2014","author":"S Li","year":"2015","unstructured":"Li, S., Chan, A.B.: 3D human pose estimation from monocular images with deep convolutional neural network. In: Cremers, D., Reid, I., Saito, H., Yang, M.-H. (eds.) ACCV 2014. LNCS, vol. 9004, pp. 332\u2013347. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-16808-1_23"},{"key":"5_CR9","doi-asserted-by":"crossref","unstructured":"Mehta, D., Rhodin, H., Casas, D., Sotnychenko, O., Xu, W., Theobalt, C.: Monocular 3D human pose estimation using transfer learning and improved CNN supervision. arXiv preprint arXiv:1611.09813 (2016)","DOI":"10.1109\/3DV.2017.00064"},{"key":"5_CR10","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"186","DOI":"10.1007\/978-3-319-49409-8_17","volume-title":"Computer Vision \u2013 ECCV 2016 Workshops","author":"X Zhou","year":"2016","unstructured":"Zhou, X., Sun, X., Zhang, W., Liang, S., Wei, Y.: Deep kinematic pose regression. In: Hua, G., J\u00e9gou, H. (eds.) ECCV 2016. LNCS, vol. 9915, pp. 186\u2013201. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-49409-8_17"},{"issue":"4","key":"5_CR11","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1145\/3072959.3073596","volume":"36","author":"D Mehta","year":"2017","unstructured":"Mehta, D., et al.: VNect: real-time 3D human pose estimation with a single RGB camera. ACM Trans. Graph. 36(4), 44 (2017)","journal-title":"ACM Trans. Graph."},{"key":"5_CR12","doi-asserted-by":"crossref","unstructured":"Nie, B.X., Wei, P., Zhu, S.C.: Monocular 3D human pose estimation by predicting depth on joints. In: IEEE International Conference on Computer Vision (ICCV) (2017)","DOI":"10.1109\/ICCV.2017.373"},{"key":"5_CR13","doi-asserted-by":"crossref","unstructured":"Lin, M., Lin, L., Liang, X., Wang, K., Chen, H.: Recurrent 3D pose sequence machines. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2017)","DOI":"10.1109\/CVPR.2017.588"},{"key":"5_CR14","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"156","DOI":"10.1007\/978-3-319-49409-8_15","volume-title":"Computer Vision \u2013 ECCV 2016 Workshops","author":"S Park","year":"2016","unstructured":"Park, S., Hwang, J., Kwak, N.: 3D human pose estimation using convolutional neural networks with 2D pose information. In: Hua, G., J\u00e9gou, H. (eds.) ECCV 2016. LNCS, vol. 9915, pp. 156\u2013169. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-49409-8_15"},{"key":"5_CR15","doi-asserted-by":"crossref","unstructured":"Sun, X., Shang, J., Liang, S., Wei, Y.: Compositional human pose regression. In: IEEE International Conference on Computer Vision (ICCV) (2017)","DOI":"10.1109\/ICCV.2017.284"},{"key":"5_CR16","doi-asserted-by":"crossref","unstructured":"Tekin, B., Marquez Neila, P., Salzmann, M., Fua, P.: Learning to fuse 2D and 3D image cues for monocular body pose estimation. In: International Conference on Computer Vision (ICCV) (2017)","DOI":"10.1109\/ICCV.2017.425"},{"key":"5_CR17","doi-asserted-by":"crossref","unstructured":"Wei, S.E., Ramakrishna, V., Kanade, T., Sheikh, Y.: Convolutional pose machines. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2016)","DOI":"10.1109\/CVPR.2016.511"},{"key":"5_CR18","doi-asserted-by":"publisher","first-page":"483","DOI":"10.1007\/978-3-319-46484-8_29","volume-title":"Computer Vision \u2013 ECCV 2016","author":"Alejandro Newell","year":"2016","unstructured":"Newell, A., Yang, K., Deng, J.: Stacked hourglass networks for human pose estimation. In: European Conference on Computer Vision (ECCV) (2016)"},{"key":"5_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"573","DOI":"10.1007\/978-3-642-33765-9_41","volume-title":"Computer Vision \u2013 ECCV 2012","author":"V Ramakrishna","year":"2012","unstructured":"Ramakrishna, V., Kanade, T., Sheikh, Y.: Reconstructing 3D human pose from 2D image landmarks. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012. LNCS, vol. 7575, pp. 573\u2013586. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-33765-9_41"},{"key":"5_CR20","doi-asserted-by":"crossref","unstructured":"Zhou, X., Zhu, M., Leonardos, S., Derpanis, K.G., Daniilidis, K.: Sparseness meets deepness: 3D human pose estimation from monocular video. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4966\u20134975 (2016)","DOI":"10.1109\/CVPR.2016.537"},{"key":"5_CR21","doi-asserted-by":"crossref","unstructured":"Akhter, I., Black, M.J.: Pose-conditioned joint angle limits for 3D human pose reconstruction. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1446\u20131455 (2015)","DOI":"10.1109\/CVPR.2015.7298751"},{"key":"5_CR22","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"561","DOI":"10.1007\/978-3-319-46454-1_34","volume-title":"Computer Vision \u2013 ECCV 2016","author":"F Bogo","year":"2016","unstructured":"Bogo, F., Kanazawa, A., Lassner, C., Gehler, P., Romero, J., Black, M.J.: Keep it SMPL: automatic estimation of 3D human pose and shape from a single image. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9909, pp. 561\u2013578. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46454-1_34"},{"key":"5_CR23","doi-asserted-by":"crossref","unstructured":"Moreno-Noguer, F.: 3D human pose estimation from a single image via distance matrix regression. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2017)","DOI":"10.1109\/CVPR.2017.170"},{"key":"5_CR24","doi-asserted-by":"crossref","unstructured":"Martinez, J., Hossain, R., Romero, J., Little, J.J.: A simple yet effective baseline for 3D human pose estimation. In: IEEE International Conference on Computer Vision (ICCV) (2017)","DOI":"10.1109\/ICCV.2017.288"},{"key":"5_CR25","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: IEEE conference on Computer Vision and Pattern Recognition (CVPR), pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"8","key":"5_CR26","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9(8), 1735\u20131780 (1997)","journal-title":"Neural Comput."},{"key":"5_CR27","unstructured":"Ba, J.L., Kiros, J.R., Hinton, G.E.: Layer normalization. arXiv preprint arXiv:1607.06450 (2016)"},{"key":"5_CR28","unstructured":"Zaremba, W., Sutskever, I., Vinyals, O.: Recurrent neural network regularization. arXiv preprint arXiv:1409.2329 (2014)"},{"issue":"7","key":"5_CR29","doi-asserted-by":"publisher","first-page":"1325","DOI":"10.1109\/TPAMI.2013.248","volume":"36","author":"C Ionescu","year":"2014","unstructured":"Ionescu, C., Papava, D., Olaru, V., Sminchisescu, C.: Human3.6M: large scale datasets and predictive methods for 3D human sensing in natural environments. IEEE Trans. Pattern Anal. Mach. Intell. (T-PAMI) 36(7), 1325\u20131339 (2014)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell. (T-PAMI)"},{"issue":"3","key":"5_CR30","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1006\/cviu.2000.0888","volume":"81","author":"C Barron","year":"2001","unstructured":"Barron, C., Kakadiaris, I.A.: Estimating anthropometry and pose from a single uncalibrated image. Compu. Vis. Image Underst. (CVIU) 81(3), 269\u2013284 (2001)","journal-title":"Compu. Vis. Image Underst. (CVIU)"},{"key":"5_CR31","unstructured":"Parameswaran, V., Chellappa, R.: View independent human body pose estimation from a single perspective image. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2004)"},{"key":"5_CR32","doi-asserted-by":"publisher","first-page":"148","DOI":"10.1016\/0734-189X(85)90094-5","volume":"30","author":"HJ Lee","year":"1985","unstructured":"Lee, H.J., Chen, Z.: Determination of 3D human body postures from a single view. Comput. Vis., Graph. Image Process. 30, 148\u2013168 (1985)","journal-title":"Comput. Vis., Graph. Image Process."},{"key":"5_CR33","doi-asserted-by":"crossref","unstructured":"Jiang, H.: 3D human pose reconstruction using millions of exemplars. In: IEEE International Conference on Pattern Recognition (ICPR), pp. 1674\u20131677. IEEE (2010)","DOI":"10.1109\/ICPR.2010.414"},{"key":"5_CR34","doi-asserted-by":"crossref","unstructured":"Taylor, C.J.: Reconstruction of articulated objects from point correspondences in a single uncalibrated image. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), vol. 1, pp. 677\u2013684. IEEE (2000)","DOI":"10.1109\/CVPR.2000.855885"},{"key":"5_CR35","doi-asserted-by":"crossref","unstructured":"Gupta, A., Martinez, J., Little, J.J., Woodham, R.J.: 3D pose from motion for cross-view action recognition via non-linear circulant temporal encoding. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2014)","DOI":"10.1109\/CVPR.2014.333"},{"key":"5_CR36","doi-asserted-by":"crossref","unstructured":"Chen, C.H., Ramanan, D.: 3D human pose estimation = 2D pose estimation + matching. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2017)","DOI":"10.1109\/CVPR.2017.610"},{"key":"5_CR37","doi-asserted-by":"crossref","unstructured":"Wang, C., Wang, Y., Lin, Z., Yuille, A.L., Gao, W.: Robust estimation of 3D human poses from a single image. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2014)","DOI":"10.1109\/CVPR.2014.303"},{"key":"5_CR38","doi-asserted-by":"crossref","unstructured":"Varol, G., et al.: Learning from synthetic humans. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2017)","DOI":"10.1109\/CVPR.2017.492"},{"key":"5_CR39","unstructured":"Rogez, G., Schmid, C.: MoCap-guided data augmentation for 3D pose estimation in the wild. In: Advances in Neural Information Processing Systems (NIPS) (2016)"},{"key":"5_CR40","doi-asserted-by":"crossref","unstructured":"Tome, D., Russell, C., Agapito, L.: Lifting from the deep: convolutional 3D pose estimation from a single image. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2500\u20132509 (2017)","DOI":"10.1109\/CVPR.2017.603"},{"key":"5_CR41","unstructured":"Fang, H., Xu, Y., Wang, W., Liu, X., Zhu, S.C.: Learning knowledge-guided pose grammar machine for 3D human pose estimation. arXiv preprint arXiv:1710.06513 (2017)"},{"key":"5_CR42","doi-asserted-by":"crossref","unstructured":"Andriluka, M., Roth, S., Schiele, B.: Monocular 3D pose estimation and tracking by detection. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 623\u2013630. IEEE (2010)","DOI":"10.1109\/CVPR.2010.5540156"},{"key":"5_CR43","doi-asserted-by":"crossref","unstructured":"Tekin, B., Rozantsev, A., Lepetit, V., Fua, P.: Direct prediction of 3D body poses from motion compensated sequences. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 991\u20131000 (2016)","DOI":"10.1109\/CVPR.2016.113"},{"key":"5_CR44","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1007\/978-3-319-46493-0_2","volume-title":"Computer Vision \u2013 ECCV 2016","author":"Y Du","year":"2016","unstructured":"Du, Y., et al.: Marker-less 3D human motion capture with monocular image sequence and height-maps. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9908, pp. 20\u201336. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46493-0_2"},{"issue":"1\u20132","key":"5_CR45","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1007\/s11263-009-0273-6","volume":"87","author":"L Sigal","year":"2010","unstructured":"Sigal, L., Balan, A.O., Black, M.J.: HUMANEVA: synchronized video and motion capture dataset and baseline algorithm for evaluation of articulated human motion. Int. J. Comput. Vis. (IJCV) 87(1\u20132), 4 (2010)","journal-title":"Int. J. Comput. Vis. (IJCV)"},{"key":"5_CR46","doi-asserted-by":"crossref","unstructured":"Andriluka, M., Pishchulin, L., Gehler, P., Schiele, B.: 2D human pose estimation: new Benchmark and state of the art analysis. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2014)","DOI":"10.1109\/CVPR.2014.471"},{"key":"5_CR47","unstructured":"Kingma, D., Ba, J.: Adam: a method for stochastic optimization. In: ICLR (2015)"},{"key":"5_CR48","unstructured":"Glorot, X., Bengio, Y.: Understanding the difficulty of training deep feedforward neural networks. In: Proceedings of the Thirteenth International Conference on Artificial Intelligence and Statistics, pp. 249\u2013256 (2010)"},{"key":"5_CR49","doi-asserted-by":"crossref","unstructured":"Radwan, I., Dhall, A., Goecke, R.: Monocular image 3D human pose estimation under self-occlusion. In: IEEE International Conference on Computer Vision (ICCV) (2013)","DOI":"10.1109\/ICCV.2013.237"},{"key":"5_CR50","doi-asserted-by":"crossref","unstructured":"Simo-Serra, E., Quattoni, A., Torras, C., Moreno-Noguer, F.: A joint model for 2D and 3D pose estimation from a single image. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2013)","DOI":"10.1109\/CVPR.2013.466"},{"issue":"1\u20132","key":"5_CR51","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1007\/s11263-008-0204-y","volume":"87","author":"L Bo","year":"2010","unstructured":"Bo, L., Sminchisescu, C.: Twin Gaussian processes for structured prediction. Int. J. Comput. Vis. (IJCV) 87(1\u20132), 28 (2010)","journal-title":"Int. J. Comput. Vis. (IJCV)"},{"key":"5_CR52","doi-asserted-by":"crossref","unstructured":"Kostrikov, I., Gall, J.: Depth sweep regression forests for estimating 3D human pose from images. In: British Machine Vision Conference (BMVC) (2014)","DOI":"10.5244\/C.28.80"},{"key":"5_CR53","doi-asserted-by":"crossref","unstructured":"Yasin, H., Iqbal, U., Kruger, B., Weber, A., Gall, J.: A dual-source approach for 3D pose estimation from a single image. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4948\u20134956 (2016)","DOI":"10.1109\/CVPR.2016.535"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2018"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-01249-6_5","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T15:11:17Z","timestamp":1774365077000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-01249-6_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783030012489","9783030012496"],"references-count":53,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-01249-6_5","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"6 October 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Munich","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 September 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14 September 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2018.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}