{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,22]],"date-time":"2026-01-22T10:23:03Z","timestamp":1769077383340,"version":"3.49.0"},"reference-count":37,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,5,29]],"date-time":"2023-05-29T00:00:00Z","timestamp":1685318400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,5,29]],"date-time":"2023-05-29T00:00:00Z","timestamp":1685318400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,5,29]]},"DOI":"10.1109\/icra48891.2023.10160722","type":"proceedings-article","created":{"date-parts":[[2023,7,4]],"date-time":"2023-07-04T17:20:56Z","timestamp":1688491256000},"page":"9837-9843","source":"Crossref","is-referenced-by-count":21,"title":["Can We Use Diffusion Probabilistic Models for 3D Motion Prediction?"],"prefix":"10.1109","author":[{"given":"Hyemin","family":"Ahn","sequence":"first","affiliation":[{"name":"Artificial Intelligence Graduate School (AIGS), Ulsan National Institute of Science and Technology (UNIST),Ulsan,Korea"}]},{"given":"Esteve Valls","family":"Mascaro","sequence":"additional","affiliation":[{"name":"Autonomous Systems, Technische Universit\u00e4t Wien (TU Wien),Vienna,Austria"}]},{"given":"Dongheui","family":"Lee","sequence":"additional","affiliation":[{"name":"Autonomous Systems, Technische Universit\u00e4t Wien (TU Wien),Vienna,Austria"}]}],"member":"263","reference":[{"key":"ref13","first-page":"9489","article-title":"Learning trajectory dependencies for human motion prediction","author":"mao","year":"2019","journal-title":"International Conference on Computer Vision (ICCV)"},{"key":"ref35","article-title":"Motiondiffuse: Text-driven human motion generation with diffusion 
model","author":"zhang","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.573"},{"key":"ref34","article-title":"Flame: Free-form language-based motion synthesis & editing","author":"kim","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref15","article-title":"Robust human motion forecasting using transformer-based model","author":"valls mascaro","year":"2022","journal-title":"International Conference on Intelligent Robots and Systems (IROS)"},{"key":"ref37","article-title":"Progressive distillation for fast sampling of diffusion models","author":"salimans","year":"2021","journal-title":"International Conference on Learning Representations"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/3DV53792.2021.00066"},{"key":"ref36","article-title":"Planning with diffusion for flexible behavior synthesis","author":"janner","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref31","first-page":"8599","article-title":"Grad-tts: A diffusion probabilistic model for text-to-speech","author":"popov","year":"2021","journal-title":"International Conference on Machine Learning"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3422622"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.494"},{"key":"ref33","article-title":"Video diffusion models","author":"ho","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.497"},{"key":"ref32","article-title":"Diffsound: Discrete diffusion model for text-to-sound generation","author":"yang","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00553"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-014-0735-3"},{"key":"ref17","first-page":"265","article-title":"Mt-vae: Learning motion transformations to generate multimodal human 
dynamics","author":"yan","year":"2018","journal-title":"European Conference on Computer Vision (ECCV)"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2018.00191"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01306"},{"key":"ref18","first-page":"346","article-title":"Dlow: Diversifying latent flows for diverse human motion prediction","author":"yuan","year":"0","journal-title":"European Conference on Computer Vision (ECCV)"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01114"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3528233.3530757"},{"key":"ref26","article-title":"Empirical evaluation of gated recurrent neural networks on sequence modeling","author":"chung","year":"2014","journal-title":"ArXiv Preprint"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref20","first-page":"6840","article-title":"Denoising diffusion probabilistic models","volume":"33","author":"ho","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref22","article-title":"Photorealistic text-to-image diffusion models with deep language understanding","author":"saharia","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref21","first-page":"24804","article-title":"Csdi: Conditional score-based diffusion models for probabilistic time series imputation","volume":"34","author":"tashiro","year":"2021","journal-title":"Advances in Neural Information Processing Systems (NeurIPS)"},{"key":"ref28","article-title":"Attention is all you need","volume":"30","author":"vaswani","year":"2017","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58568-6_28"},{"key":"ref29","article-title":"Auto-encoding variational bayes","author":"kingma","year":"2013","journal-title":"ArXiv 
Preprint"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00554"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/2816795.2818013"},{"key":"ref9","article-title":"Humaneva: Synchronized video and motion capture dataset for evaluation of articulated human motion","volume":"120","author":"sigal","year":"2006","journal-title":"Brown University TR"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9341083"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00636"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.248"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460651"}],"event":{"name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","location":"London, United Kingdom","start":{"date-parts":[[2023,5,29]]},"end":{"date-parts":[[2023,6,2]]}},"container-title":["2023 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10160211\/10160212\/10160722.pdf?arnumber=10160722","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,24]],"date-time":"2023-07-24T17:37:21Z","timestamp":1690220241000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10160722\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,29]]},"references-count":37,"URL":"https:\/\/doi.org\/10.1109\/icra48891.2023.10160722","relation":{},"subject":[],"published":{"date-parts":[[2023,5,29]]}}}