{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,28]],"date-time":"2025-10-28T10:53:32Z","timestamp":1761648812473,"version":"3.40.3"},"publisher-location":"Cham","reference-count":50,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030585761"},{"type":"electronic","value":"9783030585778"}],"license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-58577-8_2","type":"book-chapter","created":{"date-parts":[[2020,9,23]],"date-time":"2020-09-23T14:04:27Z","timestamp":1600869867000},"page":"18-34","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":31,"title":["Structure-Aware Human-Action Generation"],"prefix":"10.1007","author":[{"given":"Ping","family":"Yu","sequence":"first","affiliation":[]},{"given":"Yang","family":"Zhao","sequence":"additional","affiliation":[]},{"given":"Chunyuan","family":"Li","sequence":"additional","affiliation":[]},{"given":"Junsong","family":"Yuan","sequence":"additional","affiliation":[]},{"given":"Changyou","family":"Chen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,9,24]]},"reference":[{"key":"2_CR1","unstructured":"Bahdanau, D., Cho, K., Bengio, Y.: Neural machine translation by jointly learning to align and translate. arXiv preprint arXiv:1409.0473 (2014)"},{"key":"2_CR2","doi-asserted-by":"crossref","unstructured":"Barsoum, E., Kender, J., Liu, Z.: HP-GAN: probabilistic 3D human motion prediction via GAN (2017). https:\/\/arxiv.org\/abs\/1711.09561","DOI":"10.1109\/CVPRW.2018.00191"},{"key":"2_CR3","doi-asserted-by":"crossref","unstructured":"Barsoum, E., Kender, J., Liu, Z.: HP-GAN: probabilistic 3D human motion prediction via GAN. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, pp. 1418\u20131427 (2018)","DOI":"10.1109\/CVPRW.2018.00191"},{"issue":"1","key":"2_CR4","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1007\/s11263-009-0248-7","volume":"85","author":"A Bissacco","year":"2009","unstructured":"Bissacco, A., Soatto, S.: Hybrid dynamical models of human motion for the recognition of human gaits. Int. J. Comput. Vis. 85(1), 101\u2013114 (2009). https:\/\/doi.org\/10.1007\/s11263-009-0248-7","journal-title":"Int. J. Comput. Vis."},{"key":"2_CR5","unstructured":"Brock, A., Donahue, J., Simonyan, K.: Large scale GAN training for high fidelity natural image synthesis. arXiv preprint arXiv:1809.11096 (2018)"},{"key":"2_CR6","unstructured":"Bruna, J., Zaremba, W., Szlam, A., LeCun, Y.: Spectral networks and locally connected networks on graphs. arXiv preprint arXiv:1312.6203 (2013)"},{"key":"2_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"374","DOI":"10.1007\/978-3-030-01216-8_23","volume-title":"Computer Vision \u2013 ECCV 2018","author":"H Cai","year":"2018","unstructured":"Cai, H., Bai, C., Tai, Y.-W., Tang, C.-K.: Deep Video Generation, Prediction and Completion of Human Action Sequences. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11206, pp. 374\u2013390. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01216-8_23"},{"key":"2_CR8","unstructured":"Chen, X., Mishra, N., Rohaninejad, M., Abbeel, P.: PixelSNAIL: an improved autoregressive generative model. arXiv preprint arXiv:1712.09763 (2017)"},{"key":"2_CR9","unstructured":"Clark, A., Donahue, J., Simonyan, K.: Efficient video generation on complex datasets. arXiv preprint arXiv:1907.06571 (2019)"},{"key":"2_CR10","unstructured":"Du, Y., Wang, W., Wang, L.: Hierarchical recurrent neural network for skeleton based action recognition. In: CVPR (2015)"},{"key":"2_CR11","unstructured":"Goodfellow, I., et al.: Generative adversarial nets. In: Advances in Neural Information Processing Systems, pp. 2672\u20132680 (2014)"},{"key":"2_CR12","unstructured":"Gretton, A., Borgwardt, K.M., Rasch, M.J., Sch\u00f6lkopf, B., Smola, A.: A kernel two-sample test. J. Mach. Learn. Res. 13(Mar), 723\u2013773 (2012)"},{"key":"2_CR13","doi-asserted-by":"crossref","unstructured":"Habibie, I., Holden, D., Schwarz, J., Yearsley, J., Komura, T., et al.: A recurrent variational autoencoder for human motion synthesis (2017)","DOI":"10.5244\/C.31.119"},{"key":"2_CR14","unstructured":"Han, J., Liu, Q.: Stein variational gradient descent without gradient. arXiv preprint arXiv:1806.02775 (2018)"},{"key":"2_CR15","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"2_CR16","doi-asserted-by":"crossref","unstructured":"Ionescu, C., Papava, D., Olaru, V., Sminchisescu, C.: Human 3.6m: large scale datasets and predictive methods for 3D human sensing in natural environments. IEEE Trans. Pattern Anal. Mach. Intell. 36(7), 1325\u20131339 (2013)","DOI":"10.1109\/TPAMI.2013.248"},{"key":"2_CR17","doi-asserted-by":"crossref","unstructured":"Ke, Q., Bennamoun, M., An, S., Sohel, F., Boussaid, F.: A new representation of skeleton sequences for 3D action recognition. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.486"},{"key":"2_CR18","unstructured":"Kiasari, M.A., Moirangthem, D.S., Lee, M.: Human action generation with generative adversarial networks. arXiv preprint arXiv:1805.10416 (2018)"},{"key":"2_CR19","doi-asserted-by":"crossref","unstructured":"Kim, T.S., Reiter, A.: Interpretable 3D human action analysis with temporal convolutional networks. In: BNMW CVPR (2017)","DOI":"10.1109\/CVPRW.2017.207"},{"key":"2_CR20","unstructured":"Kingma, D.P., Welling, M.: Auto-encoding variational bayes. arXiv preprint arXiv:1312.6114 (2013)"},{"key":"2_CR21","unstructured":"Kipf, T.N., Welling, M.: Semi-supervised classification with graph convolutional networks. arXiv preprint arXiv:1609.02907 (2016)"},{"key":"2_CR22","unstructured":"Li, C., et al.: Alice: towards understanding adversarial learning for joint distribution matching. In: Advances in Neural Information Processing Systems, pp. 5495\u20135503 (2017)"},{"key":"2_CR23","unstructured":"van der Maaten, L., Hinton, G.: Visualizing data using t-SNE. J. Mach. Learn. Res. 9(Nov), 2579\u20132605 (2008)"},{"key":"2_CR24","doi-asserted-by":"crossref","unstructured":"Martinez, J., Black, M.J., Romero, J.: On human motion prediction using recurrent neural networks. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.497"},{"key":"2_CR25","unstructured":"Mirza, M., Osindero, S.: Conditional generative adversarial nets. arXiv preprint arXiv:1411.1784 (2014)"},{"key":"2_CR26","unstructured":"Niepert, M., Ahmed, M., Kutzkov, K.: Learning convolutional neural networks for graphs. In: International Conference on Machine Learning, pp. 2014\u20132023 (2016)"},{"key":"2_CR27","doi-asserted-by":"crossref","unstructured":"Oh, S.M., Rehg, J.M., Balch, T., Dellaert, F.: Learning and inference in parametric switching linear dynamic systems. In: Tenth IEEE International Conference on Computer Vision, ICCV 2005 Volume 1, vol. 2, pp. 1161\u20131168. IEEE (2005)","DOI":"10.1109\/ICCV.2005.135"},{"key":"2_CR28","unstructured":"Pavlovic, V., Rehg, J.M., MacCormick, J.: Learning switching linear models of human motion. In: Advances in Neural Information Processing Systems, pp. 981\u2013987 (2001)"},{"key":"2_CR29","doi-asserted-by":"crossref","unstructured":"Shahroudy, A., Liu, J., Ng, T.T., Wang, G.: NTU RGB+ D: a large scale dataset for 3D human activity analysis. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1010\u20131019 (2016)","DOI":"10.1109\/CVPR.2016.115"},{"key":"2_CR30","unstructured":"Taylor, G.W., Hinton, G.E., Roweis, S.T.: Two distributed-state models for generating high-dimensional time series. J. Mach. Learn. Res. 12(Mar), 1025\u20131068 (2011)"},{"key":"2_CR31","doi-asserted-by":"crossref","unstructured":"Tulyakov, S., Liu, M.Y., Yang, X., Kautz, J.: MoCoGAN: decomposing motion and content for video generation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1526\u20131535 (2018)","DOI":"10.1109\/CVPR.2018.00165"},{"key":"2_CR32","doi-asserted-by":"crossref","unstructured":"Urtasun, R., Fleet, D.J., Geiger, A., Popovi\u0107, J., Darrell, T.J., Lawrence, N.D.: Topologically-constrained latent variable models. In: Proceedings of the 25th International Conference on Machine Learning, pp. 1080\u20131087 (2008)","DOI":"10.1145\/1390156.1390292"},{"key":"2_CR33","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, pp. 5998\u20136008 (2017)"},{"key":"2_CR34","doi-asserted-by":"crossref","unstructured":"Walker, J., Marino, K., Gupta, A., Hebert, M.: The pose knows: video forecasting by generating pose futures. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 3332\u20133341 (2017)","DOI":"10.1109\/ICCV.2017.361"},{"key":"2_CR35","doi-asserted-by":"crossref","unstructured":"Wang, J.M., Fleet, D.J., Hertzmann, A.: Optimizing walking controllers. In: ACM SIGGRAPH Asia 2009 Papers, pp. 1\u20138 (2009)","DOI":"10.1145\/1661412.1618514"},{"issue":"4","key":"2_CR36","first-page":"1","volume":"29","author":"JM Wang","year":"2010","unstructured":"Wang, J.M., Fleet, D.J., Hertzmann, A.: Optimizing walking controllers for uncertain inputs and environments. ACM Trans. Graph. (TOG) 29(4), 1\u20138 (2010)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"2_CR37","unstructured":"Wang, T.C., et al.: Video-to-video synthesis. In: NeurIPS (2018)"},{"key":"2_CR38","doi-asserted-by":"crossref","unstructured":"Wang, X., Girshick, R., Gupta, A., He, K.: Non-local neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7794\u20137803 (2018)","DOI":"10.1109\/CVPR.2018.00813"},{"key":"2_CR39","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"823","DOI":"10.1007\/978-3-030-01225-0_48","volume-title":"Computer Vision \u2013 ECCV 2018","author":"L-Y Gui","year":"2018","unstructured":"Gui, L.-Y., Wang, Y.-X., Liang, X., Moura, J.M.F.: Adversarial Geometry-Aware Human Motion Prediction. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11208, pp. 823\u2013842. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01225-0_48"},{"key":"2_CR40","unstructured":"Wang, Z., et al.: Learning diverse stochastic human-action generators by learning smooth latent transitions. arXiv preprint arXiv:1912.10150 (2019)"},{"key":"2_CR41","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2019.2938520","volume-title":"Combining recurrent neural networks and adversarial training for human motion synthesis and control","author":"Z Wang","year":"2019","unstructured":"Wang, Z., Chai, J., Xia, S.: Combining recurrent neural networks and adversarial training for human motion synthesis and control. IEEE Trans. Vis. Comput, Graph (2019)"},{"key":"2_CR42","unstructured":"Wichers, N., Villegas, R., Erhan, D., Lee, H.: Hierarchical long-term video prediction without supervision. arXiv preprint arXiv:1806.04768 (2018)"},{"key":"2_CR43","unstructured":"Xu, K., Li, C., Tian, Y., Sonobe, T., Kawarabayashi, K., Jegelka, S.: Representation learning on graphs with jumping knowledge networks. arXiv preprint arXiv:1806.03536 (2018)"},{"key":"2_CR44","doi-asserted-by":"crossref","unstructured":"Yan, S., Xiong, Y., Lin, D.: Spatial temporal graph convolutional networks for skeleton-based action recognition. In: Thirty-Second AAAI Conference on Artificial Intelligence (2018)","DOI":"10.1609\/aaai.v32i1.12328"},{"key":"2_CR45","doi-asserted-by":"crossref","unstructured":"Yan, Y., Xu, J., Ni, B., Zhang, W., Yang, X.: Skeleton-aided articulated motion generation. In: Proceedings of the 25th ACM International Conference on Multimedia, pp. 199\u2013207 (2017)","DOI":"10.1145\/3123266.3123277"},{"key":"2_CR46","unstructured":"Zhang, H., Goodfellow, I., Metaxas, D., Odena, A.: Self-attention generative adversarial networks. In: International Conference on Machine Learning, pp. 7354\u20137363 (2019)"},{"key":"2_CR47","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Qi, P., Manning, C.D.: Graph convolution over pruned dependency trees improves relation extraction. arXiv preprint arXiv:1809.10185 (2018)","DOI":"10.18653\/v1\/D18-1244"},{"key":"2_CR48","unstructured":"Zhao, Y., Li, C., Yu, P., Gao, J., Chen, C.: Feature quantization improves GAN training. In: ICML (2020)"},{"key":"2_CR49","first-page":"5893","volume":"33","author":"Y Zhao","year":"2019","unstructured":"Zhao, Y., Zhang, J., Chen, C.: Self-adversarially learned Bayesian sampling. Proc. AAAI Conf. Artif. Intell. 33, 5893\u20135900 (2019)","journal-title":"Proc. AAAI Conf. Artif. Intell."},{"key":"2_CR50","unstructured":"Zhou, J., et al.: Graph neural networks: a review of methods and applications. arXiv preprint arXiv:1812.08434 (2018)"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2020"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-58577-8_2","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,23]],"date-time":"2024-09-23T00:02:37Z","timestamp":1727049757000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-58577-8_2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"ISBN":["9783030585761","9783030585778"],"references-count":50,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-58577-8_2","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"24 September 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Glasgow","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"United Kingdom","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2020","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 August 2020","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 August 2020","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2020.eu\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"OpenReview","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5025","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1360","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"27% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"7","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held virtually due to the COVID-19 pandemic.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}