{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T02:35:33Z","timestamp":1730255733161,"version":"3.28.0"},"reference-count":40,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,5,1]],"date-time":"2020-05-01T00:00:00Z","timestamp":1588291200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,5]]},"DOI":"10.1109\/icra40945.2020.9196839","type":"proceedings-article","created":{"date-parts":[[2020,9,15]],"date-time":"2020-09-15T17:25:46Z","timestamp":1600190746000},"page":"8316-8322","source":"Crossref","is-referenced-by-count":4,"title":["Action-conditioned Benchmarking of Robotic Video Prediction Models: a Comparative Study"],"prefix":"10.1109","author":[{"given":"Manuel Serra","family":"Nunes","sequence":"first","affiliation":[]},{"given":"Atabak","family":"Dehban","sequence":"additional","affiliation":[]},{"given":"Plinio","family":"Moreno","sequence":"additional","affiliation":[]},{"given":"Jose","family":"Santos-Victor","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","article-title":"Videoflow: A conditional flow-based model for stochastic video generation","author":"kumar","year":"2020","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref38","article-title":"Visual foresight: Model-based deep reinforcement learning for vision-based robotic control","author":"ebert","year":"2018","journal-title":"arXiv preprint arXiv 1812 02588"},{"key":"ref33","article-title":"Towards accurate generative models of video: A new metric & challenges","author":"unterthiner","year":"2018","journal-title":"arXiv preprint arXiv 1812 01717"},{"key":"ref32","first-page":"4268","article-title":"Temporal coherency based criteria for predicting video frames using deep multi-stage generative adversarial networks","author":"bhattacharjee","year":"2017","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00068"},{"key":"ref30","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1016\/S0923-5965(03)00076-6","article-title":"Video quality assessment based on structural distortion measurement","volume":"19","author":"wang","year":"2004","journal-title":"Signal Processing Image Communication"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00770"},{"article-title":"Self-supervised visual planning with temporal skip connections","year":"2017","author":"ebert","key":"ref36"},{"key":"ref35","doi-asserted-by":"crossref","DOI":"10.23915\/distill.00010","article-title":"The building blocks of interpretability","author":"olah","year":"2018","journal-title":"Distillation"},{"article-title":"Inceptionism: Going deeper into neural networks","year":"2015","author":"mordvintsev","key":"ref34"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989324"},{"key":"ref40","first-page":"1171","article-title":"Scheduled sampling for sequence prediction with recurrent neural networks","author":"bengio","year":"2015","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref11","article-title":"Robonet: Large-scale multi-robot learning","author":"dasari","year":"2019","journal-title":"arXiv preprint arXiv 1910 11215"},{"key":"ref12","first-page":"802","article-title":"Convolutional lstm network: A machine learning approach for precipitation nowcasting","author":"xingjian","year":"2015","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.77"},{"key":"ref14","volume":"1","author":"james","year":"1890","journal-title":"The Principles of Psychology"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.tics.2014.06.011"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1038\/4580"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1038\/nrn3112"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/DEVLRN.2014.6982995"},{"key":"ref19","first-page":"91","article-title":"Visual dynamics: Probabilistic future frame synthesis via cross convolutional networks","author":"xue","year":"2016","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TBC.2008.2000733"},{"key":"ref4","article-title":"Deep multi-scale video prediction beyond mean square error","author":"mathieu","year":"2015","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref27","article-title":"Stochastic video generation with a learned prior","author":"denton","year":"2018","journal-title":"International Conference on Machine Learning (ICML)"},{"key":"ref3","first-page":"843","article-title":"Unsupervised learning of video representations using lstms","author":"srivastava","year":"2015","journal-title":"International Conference on Machine Learning (ICML)"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/s10339-007-0167-x"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/s11235-010-9351-x"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1098\/rstb.2005.1622"},{"article-title":"Openai gym","year":"2016","author":"brockman","key":"ref8"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1162\/NECO_a_00699"},{"key":"ref2","first-page":"568","article-title":"Two-stream convolutional networks for action recognition in videos","author":"simonyan","year":"2014","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref9","article-title":"Recurrent world models facilitate policy evolution","author":"ha","year":"2018","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref1","article-title":"Unsupervised learning of object keypoints for perception and control","author":"kulkarni","year":"2019","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref20","first-page":"667","article-title":"Dynamic filter networks","author":"jia","year":"2016","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref22","article-title":"Stochastic adversarial video prediction","author":"lee","year":"2018","journal-title":"arXiv preprint arXiv 1804 01523"},{"key":"ref21","article-title":"Stochastic variational video prediction","author":"babaeizadeh","year":"2017","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref24","first-page":"2863","article-title":"Action-conditional video prediction using deep networks in atari games","author":"oh","year":"2015","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref23","article-title":"Decomposing motion and content for natural video sequence prediction","author":"villegas","year":"2017","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref26","first-page":"64","article-title":"Unsupervised learning for physical interaction through video prediction","author":"finn","year":"2016","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref25","article-title":"Deep predictive coding networks for video prediction and unsupervised learning","author":"lotter","year":"2016","journal-title":"International Conference on Learning Representations (ICLR)"}],"event":{"name":"2020 IEEE International Conference on Robotics and Automation (ICRA)","start":{"date-parts":[[2020,5,31]]},"location":"Paris, France","end":{"date-parts":[[2020,8,31]]}},"container-title":["2020 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9187508\/9196508\/09196839.pdf?arnumber=9196839","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T20:27:25Z","timestamp":1656361645000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9196839\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,5]]},"references-count":40,"URL":"https:\/\/doi.org\/10.1109\/icra40945.2020.9196839","relation":{},"subject":[],"published":{"date-parts":[[2020,5]]}}}