{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,4]],"date-time":"2026-04-04T17:59:46Z","timestamp":1775325586386,"version":"3.50.1"},"publisher-location":"Cham","reference-count":76,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030585440","type":"print"},{"value":"9783030585457","type":"electronic"}],"license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-58545-7_20","type":"book-chapter","created":{"date-parts":[[2020,11,4]],"date-time":"2020-11-04T10:04:51Z","timestamp":1604484291000},"page":"346-364","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":181,"title":["DLow: Diversifying Latent Flows for Diverse Human Motion Prediction"],"prefix":"10.1007","author":[{"given":"Ye","family":"Yuan","sequence":"first","affiliation":[]},{"given":"Kris","family":"Kitani","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,11,5]]},"reference":[{"key":"20_CR1","doi-asserted-by":"crossref","unstructured":"Aksan, E., Kaufmann, M., Hilliges, O.: Structured prediction helps 3D human motion modelling. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 7144\u20137153 (2019)","DOI":"10.1109\/ICCV.2019.00724"},{"key":"20_CR2","doi-asserted-by":"crossref","unstructured":"Alahi, A., Goel, K., Ramanathan, V., Robicquet, A., Fei-Fei, L., Savarese, S.: Social LSTM: human trajectory prediction in crowded spaces. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 961\u2013971 (2016)","DOI":"10.1109\/CVPR.2016.110"},{"key":"20_CR3","doi-asserted-by":"crossref","unstructured":"Aliakbarian, S., Saleh, F.S., Salzmann, M., Petersson, L., Gould, S.: A stochastic conditioning scheme for diverse human motion prediction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5223\u20135232 (2020)","DOI":"10.1109\/CVPR42600.2020.00527"},{"key":"20_CR4","unstructured":"Arjovsky, M., Chintala, S., Bottou, L.: Wasserstein GAN. arXiv preprint arXiv:1701.07875 (2017)"},{"key":"20_CR5","doi-asserted-by":"crossref","unstructured":"Azadi, S., Feng, J., Darrell, T.: Learning detection with diverse proposals. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7149\u20137157 (2017)","DOI":"10.1109\/CVPR.2017.779"},{"key":"20_CR6","doi-asserted-by":"crossref","unstructured":"Barsoum, E., Kender, J., Liu, Z.: HP-GAN: probabilistic 3D human motion prediction via GAN. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, pp. 1418\u20131427 (2018)","DOI":"10.1109\/CVPRW.2018.00191"},{"key":"20_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-3-642-33715-4_1","volume-title":"Computer Vision \u2013 ECCV 2012","author":"D Batra","year":"2012","unstructured":"Batra, D., Yadollahpour, P., Guzman-Rivera, A., Shakhnarovich, G.: Diverse M-best solutions in Markov random fields. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012. LNCS, vol. 7576, pp. 1\u201316. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-33715-4_1"},{"key":"20_CR8","doi-asserted-by":"crossref","unstructured":"Bhattacharyya, A., Schiele, B., Fritz, M.: Accurate and diverse sampling of sequences based on a \u201cbest of many\u201d sample objective. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8485\u20138493 (2018)","DOI":"10.1109\/CVPR.2018.00885"},{"key":"20_CR9","doi-asserted-by":"crossref","unstructured":"Butepage, J., Black, M.J., Kragic, D., Kjellstrom, H.: Deep representation learning for human motion prediction and classification. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 6158\u20136166 (2017)","DOI":"10.1109\/CVPR.2017.173"},{"key":"20_CR10","doi-asserted-by":"crossref","unstructured":"Chao, Y.W., Yang, J., Price, B., Cohen, S., Deng, J.: Forecasting human dynamics from static images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 548\u2013556 (2017)","DOI":"10.1109\/CVPR.2017.388"},{"key":"20_CR11","unstructured":"Che, T., Li, Y., Jacob, A.P., Bengio, Y., Li, W.: Mode regularized generative adversarial networks. arXiv preprint arXiv:1612.02136 (2016)"},{"key":"20_CR12","unstructured":"Chen, X., Duan, Y., Houthooft, R., Schulman, J., Sutskever, I., Abbeel, P.: InfoGAN: interpretable representation learning by information maximizing generative adversarial nets. In: Advances in Neural Information Processing Systems, pp. 2172\u20132180 (2016)"},{"key":"20_CR13","doi-asserted-by":"crossref","unstructured":"Chiu, H.k., Adeli, E., Wang, B., Huang, D.A., Niebles, J.C.: Action-agnostic human pose forecasting. In: 2019 IEEE Winter Conference on Applications of Computer Vision (WACV), pp. 1423\u20131432. IEEE (2019)","DOI":"10.1109\/WACV.2019.00156"},{"key":"20_CR14","unstructured":"Dilokthanakul, N., et al.: Deep unsupervised clustering with Gaussian mixture variational autoencoders. arXiv preprint arXiv:1611.02648 (2016)"},{"key":"20_CR15","unstructured":"Elfeki, M., Couprie, C., Riviere, M., Elhoseiny, M.: GDPP: learning diverse generations using determinantal point process. arXiv preprint arXiv:1812.00068 (2018)"},{"key":"20_CR16","doi-asserted-by":"crossref","unstructured":"Fragkiadaki, K., Levine, S., Felsen, P., Malik, J.: Recurrent network models for human dynamics. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 4346\u20134354 (2015)","DOI":"10.1109\/ICCV.2015.494"},{"key":"20_CR17","doi-asserted-by":"crossref","unstructured":"Ghosh, P., Song, J., Aksan, E., Hilliges, O.: Learning human motion models for long-term predictions. In: 2017 International Conference on 3D Vision (3DV), pp. 458\u2013466. IEEE (2017)","DOI":"10.1109\/3DV.2017.00059"},{"key":"20_CR18","unstructured":"Gillenwater, J.A., Kulesza, A., Fox, E., Taskar, B.: Expectation-maximization for learning determinantal point processes. In: Advances in Neural Information Processing Systems, pp. 3149\u20133157 (2014)"},{"key":"20_CR19","unstructured":"Gong, B., Chao, W.L., Grauman, K., Sha, F.: Diverse sequential subset selection for supervised video summarization. In: Advances in Neural Information Processing Systems, pp. 2069\u20132077 (2014)"},{"key":"20_CR20","unstructured":"Goodfellow, I., et al.: Generative adversarial nets. In: Advances in Neural Information Processing Systems, pp. 2672\u20132680 (2014)"},{"key":"20_CR21","doi-asserted-by":"crossref","unstructured":"Gopalakrishnan, A., Mali, A., Kifer, D., Giles, L., Ororbia, A.G.: A neural temporal model for human motion prediction. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 12116\u201312125 (2019)","DOI":"10.1109\/CVPR.2019.01239"},{"key":"20_CR22","unstructured":"Gu, Q., Li, Z., Han, J.: Generalized fisher score for feature selection. arXiv preprint arXiv:1202.3725 (2012)"},{"key":"20_CR23","doi-asserted-by":"crossref","unstructured":"Guan, J., Yuan, Y., Kitani, K.M., Rhinehart, N.: Generative hybrid representations for activity forecasting with no-regret learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (2020)","DOI":"10.1109\/CVPR42600.2020.00025"},{"key":"20_CR24","unstructured":"Gulrajani, I., Ahmed, F., Arjovsky, M., Dumoulin, V., Courville, A.C.: Improved training of wasserstein gans. In: Advances in Neural Information Processing Systems, pp. 5767\u20135777 (2017)"},{"key":"20_CR25","doi-asserted-by":"crossref","unstructured":"Gupta, A., Johnson, J., Fei-Fei, L., Savarese, S., Alahi, A.: Social GAN: socially acceptable trajectories with generative adversarial networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2255\u20132264 (2018)","DOI":"10.1109\/CVPR.2018.00240"},{"key":"20_CR26","doi-asserted-by":"crossref","unstructured":"Gurumurthy, S., Kiran Sarvadevabhatla, R., Venkatesh Babu, R.: DeliGAN: generative adversarial networks for diverse and limited data. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 166\u2013174 (2017)","DOI":"10.1109\/CVPR.2017.525"},{"key":"20_CR27","unstructured":"Guzman-Rivera, A., Batra, D., Kohli, P.: Multiple choice learning: learning to produce multiple structured outputs. In: Advances in Neural Information Processing Systems, pp. 1799\u20131807 (2012)"},{"key":"20_CR28","unstructured":"He, J., Spokoyny, D., Neubig, G., Berg-Kirkpatrick, T.: Lagging inference networks and posterior collapse in variational autoencoders. arXiv preprint arXiv:1901.05534 (2019)"},{"issue":"5","key":"20_CR29","first-page":"6","volume":"2","author":"I Higgins","year":"2017","unstructured":"Higgins, I., et al.: beta-VAE: learning basic visual concepts with a constrained variational framework. ICLR 2(5), 6 (2017)","journal-title":"ICLR"},{"key":"20_CR30","doi-asserted-by":"crossref","unstructured":"Hsiao, W.L., Grauman, K.: Creating capsule wardrobes from fashion images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7161\u20137170 (2018)","DOI":"10.1109\/CVPR.2018.00748"},{"key":"20_CR31","doi-asserted-by":"crossref","unstructured":"Huang, D.A., Ma, M., Ma, W.C., Kitani, K.M.: How do we use our hands? discovering a diverse set of common grasps. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 666\u2013675 (2015)","DOI":"10.1109\/CVPR.2015.7298666"},{"key":"20_CR32","doi-asserted-by":"crossref","unstructured":"Ionescu, C., Papava, D., Olaru, V., Sminchisescu, C.: Human3.6M: large scale datasets and predictive methods for 3D human sensing in natural environments. IEEE Trans. Pattern Anal. Mach. Intell. 36(7), 1325\u20131339 (2013)","DOI":"10.1109\/TPAMI.2013.248"},{"key":"20_CR33","doi-asserted-by":"crossref","unstructured":"Jain, A., Zamir, A.R., Savarese, S., Saxena, A.: Structural-RNN: deep learning on spatio-temporal graphs. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5308\u20135317 (2016)","DOI":"10.1109\/CVPR.2016.573"},{"issue":"2","key":"20_CR34","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1023\/A:1007665907178","volume":"37","author":"MI Jordan","year":"1999","unstructured":"Jordan, M.I., Ghahramani, Z., Jaakkola, T.S., Saul, L.K.: An introduction to variational methods for graphical models. Mach. Learn. 37(2), 183\u2013233 (1999)","journal-title":"Mach. Learn."},{"key":"20_CR35","unstructured":"Kim, Y., Wiseman, S., Miller, A.C., Sontag, D., Rush, A.M.: Semi-amortized variational autoencoders. arXiv preprint arXiv:1802.02550 (2018)"},{"key":"20_CR36","unstructured":"Kingma, D.P., Welling, M.: Auto-encoding variational bayes. arXiv preprint arXiv:1312.6114 (2013)"},{"key":"20_CR37","doi-asserted-by":"crossref","unstructured":"Koppula, H.S., Saxena, A.: Anticipating human activities for reactive robotic response. In: IROS, Tokyo, p. 2071 (2013)","DOI":"10.1109\/IROS.2013.6696634"},{"key":"20_CR38","unstructured":"Kulesza, A., Taskar, B.: k-dpps: Fixed-size determinantal point processes. In: Proceedings of the 28th International Conference on Machine Learning (ICML 2011), pp. 1193\u20131200 (2011)"},{"key":"20_CR39","doi-asserted-by":"crossref","unstructured":"Kulesza, A., Taskar, B., et al.: Determinantal point processes for machine learning. Found. Trends\u00ae Mach. Learn. 5(2\u20133), 123\u2013286 (2012)","DOI":"10.1561\/2200000044"},{"key":"20_CR40","doi-asserted-by":"crossref","unstructured":"Kundu, J.N., Gor, M., Babu, R.V.: BIHMP-GAN: bidirectional 3D human motion prediction GAN. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 33, pp. 8553\u20138560 (2019)","DOI":"10.1609\/aaai.v33i01.33018553"},{"key":"20_CR41","doi-asserted-by":"crossref","unstructured":"Lee, N., Choi, W., Vernaza, P., Choy, C.B., Torr, P.H., Chandraker, M.: Desire: distant future prediction in dynamic scenes with interacting agents. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 336\u2013345 (2017)","DOI":"10.1109\/CVPR.2017.233"},{"key":"20_CR42","unstructured":"Lee, S., Prakash, S.P.S., Cogswell, M., Ranjan, V., Crandall, D., Batra, D.: Stochastic multiple choice learning for training diverse deep ensembles. In: Advances in Neural Information Processing Systems, pp. 2119\u20132127 (2016)"},{"key":"20_CR43","unstructured":"Li, Z., Zhou, Y., Xiao, S., He, C., Huang, Z., Li, H.: Auto-conditioned recurrent networks for extended complex human motion synthesis. arXiv preprint arXiv:1707.05363 (2017)"},{"key":"20_CR44","unstructured":"Lin, X., Amer, M.R.: Human motion modeling using DVGANs. arXiv preprint arXiv:1804.10652 (2018)"},{"key":"20_CR45","unstructured":"Lin, Z., Khetan, A., Fanti, G., Oh, S.: PACGAN: the power of two samples in generative adversarial networks. In: Advances in Neural Information Processing Systems, pp. 1498\u20131507 (2018)"},{"key":"20_CR46","unstructured":"Liu, X., Gao, J., Celikyilmaz, A., Carin, L., et al.: Cyclical annealing schedule: a simple approach to mitigating KL vanishing. arXiv preprint arXiv:1903.10145 (2019)"},{"key":"20_CR47","doi-asserted-by":"crossref","unstructured":"Luvizon, D.C., Picard, D., Tabia, H.: 2D\/3D pose estimation and action recognition using multitask deep learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5137\u20135146 (2018)","DOI":"10.1109\/CVPR.2018.00539"},{"issue":"1","key":"20_CR48","doi-asserted-by":"publisher","first-page":"83","DOI":"10.2307\/1425855","volume":"7","author":"O Macchi","year":"1975","unstructured":"Macchi, O.: The coincidence approach to stochastic point processes. Adv. Appl. Probab. 7(1), 83\u2013122 (1975)","journal-title":"Adv. Appl. Probab."},{"key":"20_CR49","doi-asserted-by":"crossref","unstructured":"Mao, W., Liu, M., Salzmann, M., Li, H.: Learning trajectory dependencies for human motion prediction. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 9489\u20139497 (2019)","DOI":"10.1109\/ICCV.2019.00958"},{"key":"20_CR50","doi-asserted-by":"crossref","unstructured":"Martinez, J., Black, M.J., Romero, J.: On human motion prediction using recurrent neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2891\u20132900 (2017)","DOI":"10.1109\/CVPR.2017.497"},{"key":"20_CR51","doi-asserted-by":"crossref","unstructured":"Martinez, J., Hossain, R., Romero, J., Little, J.J.: A simple yet effective baseline for 3D human pose estimation. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2640\u20132649 (2017)","DOI":"10.1109\/ICCV.2017.288"},{"issue":"2","key":"20_CR52","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1023\/A:1008990218483","volume":"8","author":"D Nilsson","year":"1998","unstructured":"Nilsson, D.: An efficient algorithm for finding the m most probable configurations in probabilistic expert systems. Stat. Comput. 8(2), 159\u2013173 (1998)","journal-title":"Stat. Comput."},{"issue":"1","key":"20_CR53","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1109\/TIV.2016.2578706","volume":"1","author":"B Paden","year":"2016","unstructured":"Paden, B., \u010c\u00e1p, M., Yong, S.Z., Yershov, D., Frazzoli, E.: A survey of motion planning and control techniques for self-driving urban vehicles. IEEE Trans. Intell. Veh. 1(1), 33\u201355 (2016)","journal-title":"IEEE Trans. Intell. Veh."},{"key":"20_CR54","doi-asserted-by":"crossref","unstructured":"Pavllo, D., Feichtenhofer, C., Grangier, D., Auli, M.: 3D human pose estimation in video with temporal convolutions and semi-supervised training. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7753\u20137762 (2019)","DOI":"10.1109\/CVPR.2019.00794"},{"key":"20_CR55","unstructured":"Pavllo, D., Grangier, D., Auli, M.: QuaterNet: a quaternion-based recurrent model for human motion. arXiv preprint arXiv:1805.06485 (2018)"},{"key":"20_CR56","unstructured":"Rezende, D.J., Mohamed, S.: Variational inference with normalizing flows. arXiv preprint arXiv:1505.05770 (2015)"},{"key":"20_CR57","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"794","DOI":"10.1007\/978-3-030-01261-8_47","volume-title":"Computer Vision \u2013 ECCV 2018","author":"N Rhinehart","year":"2018","unstructured":"Rhinehart, N., Kitani, K.M., Vernaza, P.: r2p2: a reparameterized pushforward policy for diverse, precise generative path forecasting. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11217, pp. 794\u2013811. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01261-8_47"},{"issue":"1","key":"20_CR58","doi-asserted-by":"publisher","first-page":"40","DOI":"10.1109\/18.481776","volume":"42","author":"JJ Rissanen","year":"1996","unstructured":"Rissanen, J.J.: Fisher information and stochastic complexity. IEEE Trans. Inf. Theory 42(1), 40\u201347 (1996)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"20_CR59","unstructured":"Ruiz, A.H., Gall, J., Moreno-Noguer, F.: Human motion prediction via spatio-temporal inpainting. arXiv preprint arXiv:1812.05478 (2018)"},{"issue":"3","key":"20_CR60","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1016\/0888-613X(94)90031-0","volume":"11","author":"B Seroussi","year":"1994","unstructured":"Seroussi, B., Golmard, J.L.: An algorithm directly finding the k most probable configurations in Bayesian networks. Int. J. Approx. Reason. 11(3), 205\u2013233 (1994)","journal-title":"Int. J. Approx. Reason."},{"issue":"1\u20132","key":"20_CR61","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1007\/s11263-009-0273-6","volume":"87","author":"L Sigal","year":"2010","unstructured":"Sigal, L., Balan, A.O., Black, M.J.: HUMANEVA: synchronized video and motion capture dataset and baseline algorithm for evaluation of articulated human motion. Int. J. Comput. Vis. 87(1\u20132), 4 (2010)","journal-title":"Int. J. Comput. Vis."},{"issue":"8","key":"20_CR62","doi-asserted-by":"publisher","first-page":"2023","DOI":"10.1109\/TPAMI.2017.2743707","volume":"40","author":"J Sourati","year":"2017","unstructured":"Sourati, J., Akcakaya, M., Erdogmus, D., Leen, T.K., Dy, J.G.: A probabilistic active learning algorithm based on fisher information ratio. IEEE Trans. Pattern Anal. Mach. Intell. 40(8), 2023\u20132029 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"20_CR63","unstructured":"Srivastava, A., Valkov, L., Russell, C., Gutmann, M.U., Sutton, C.: VeeGAN: reducing mode collapse in GANs using implicit variational learning. In: Advances in Neural Information Processing Systems, pp. 3308\u20133318 (2017)"},{"key":"20_CR64","unstructured":"Tolstikhin, I., Bousquet, O., Gelly, S., Schoelkopf, B.: Wasserstein auto-encoders. arXiv preprint arXiv 1711, 01558 (2017)"},{"key":"20_CR65","doi-asserted-by":"crossref","unstructured":"Troje, N.F.: Decomposing biological motion: a framework for analysis and synthesis of human gait patterns. J. Vis. 2(5), 2 (2002)","DOI":"10.1167\/2.5.2"},{"key":"20_CR66","doi-asserted-by":"crossref","unstructured":"Walker, J., Marino, K., Gupta, A., Hebert, M.: The pose knows: video forecasting by generating pose futures. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 3332\u20133341 (2017)","DOI":"10.1109\/ICCV.2017.361"},{"key":"20_CR67","doi-asserted-by":"crossref","unstructured":"Wang, B., Adeli, E., Chiu, H.k., Huang, D.A., Niebles, J.C.: Imitation learning for human pose prediction. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 7124\u20137133 (2019)","DOI":"10.1109\/ICCV.2019.00722"},{"key":"20_CR68","doi-asserted-by":"crossref","unstructured":"Weng, X., Yuan, Y., Kitani, K.: Joint 3d tracking and forecasting with graph neural network and diversity sampling. arXiv:2003.07847 (2020)","DOI":"10.1109\/LRA.2021.3068925"},{"key":"20_CR69","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"276","DOI":"10.1007\/978-3-030-01228-1_17","volume-title":"Computer Vision \u2013 ECCV 2018","author":"X Yan","year":"2018","unstructured":"Yan, X., et al.: MT-VAE: learning motion transformations to generate multimodal human dynamics. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11209, pp. 276\u2013293. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01228-1_17"},{"key":"20_CR70","unstructured":"Yang, D., Hong, S., Jang, Y., Zhao, T., Lee, H.: Diversity-sensitive conditional generative adversarial networks. arXiv preprint arXiv:1901.09024 (2019)"},{"key":"20_CR71","doi-asserted-by":"crossref","unstructured":"Yang, W., Ouyang, W., Wang, X., Ren, J., Li, H., Wang, X.: 3D human pose estimation in the wild by adversarial learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5255\u20135264 (2018)","DOI":"10.1109\/CVPR.2018.00551"},{"key":"20_CR72","unstructured":"Yuan, Y., Kitani, K.: Diverse trajectory forecasting with determinantal point processes. arXiv preprint arXiv:1907.04967 (2019)"},{"key":"20_CR73","doi-asserted-by":"crossref","unstructured":"Yuan, Y., Kitani, K.: Ego-pose estimation and forecasting as real-time PD control. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 10082\u201310092 (2019)","DOI":"10.1109\/ICCV.2019.01018"},{"key":"20_CR74","unstructured":"Yuan, Y., Kitani, K.: Residual force control for agile human behavior imitation and extended motion synthesis. arXiv preprint arXiv:2006.07364 (2020)"},{"key":"20_CR75","doi-asserted-by":"crossref","unstructured":"Zhang, J.Y., Felsen, P., Kanazawa, A., Malik, J.: Predicting 3D human dynamics from video. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 7114\u20137123 (2019)","DOI":"10.1109\/ICCV.2019.00721"},{"key":"20_CR76","unstructured":"Zhao, S., Song, J., Ermon, S.: InfoVAE: information maximizing variational autoencoders. arXiv preprint arXiv:1706.02262 (2017)"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2020"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-58545-7_20","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,4]],"date-time":"2024-11-04T01:09:18Z","timestamp":1730682558000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-58545-7_20"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"ISBN":["9783030585440","9783030585457"],"references-count":76,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-58545-7_20","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"5 November 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Glasgow","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"United Kingdom","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2020","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 August 2020","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 August 2020","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2020.eu\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"OpenReview","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5025","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1360","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"27% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"7","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held virtually due to the COVID-19 pandemic. From the ECCV Workshops 249 full papers, 18 short papers, and 21 further contributions were published out of a total of 467 submissions.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}