{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T16:40:07Z","timestamp":1777653607832,"version":"3.51.4"},"reference-count":27,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,10,16]],"date-time":"2022-10-16T00:00:00Z","timestamp":1665878400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,10,16]],"date-time":"2022-10-16T00:00:00Z","timestamp":1665878400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,10,16]]},"DOI":"10.1109\/icip46576.2022.9897982","type":"proceedings-article","created":{"date-parts":[[2022,11,3]],"date-time":"2022-11-03T21:27:24Z","timestamp":1667510844000},"page":"3943-3947","source":"Crossref","is-referenced-by-count":11,"title":["HARP: Autoregressive Latent Video Prediction with High-Fidelity Image Generator"],"prefix":"10.1109","author":[{"given":"Younggyo","family":"Seo","sequence":"first","affiliation":[{"name":"KAIST University of California,Berkeley"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kimin","family":"Lee","sequence":"additional","affiliation":[{"name":"KAIST University of California,Berkeley"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fangchen","family":"Liu","sequence":"additional","affiliation":[{"name":"KAIST University of California,Berkeley"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Stephen","family":"James","sequence":"additional","affiliation":[{"name":"KAIST University of California,Berkeley"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Pieter","family":"Abbeel","sequence":"additional","affiliation":[{"name":"KAIST University of California,Berkeley"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Qt-opt: Scalable deep reinforcement learning for vision-based robotic manipulation","author":"Kalashnikov","year":"2018","journal-title":"CoRL"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.376"},{"key":"ref3","article-title":"Unsupervised learning for physical interaction through video prediction","author":"Finn","year":"2016","journal-title":"NeurIPS"},{"key":"ref4","article-title":"Stochastic variational video prediction","author":"Babaeizadeh","year":"2018","journal-title":"ICLR"},{"key":"ref5","article-title":"Stochastic video generation with a learned prior","author":"Denton","year":"2018","journal-title":"ICML"},{"key":"ref6","article-title":"Stochastic adversarial video prediction","author":"Lee","year":"2018"},{"key":"ref7","article-title":"Scaling autoregressive video models","author":"Weissenborn","year":"2020","journal-title":"ICLR"},{"key":"ref8","article-title":"Fitvid: Overfitting in pixel-level video prediction","author":"Babaeizadeh","year":"2021"},{"key":"ref9","article-title":"High fidelity video prediction with large stochastic recurrent neural networks","author":"Villegas","year":"2019","journal-title":"NeurIPS"},{"key":"ref10","article-title":"Adversarial video generation on complex datasets","author":"Clark","year":"2019"},{"key":"ref11","article-title":"Transformation-based adversarial video prediction on large-scale data","author":"Luc","year":"2020"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.5220\/0010241801010112"},{"key":"ref13","article-title":"Videogpt: Video generation using vq-vae and transformers","author":"Yan","year":"2021"},{"key":"ref14","article-title":"Neural discrete representation learning","author":"van den Oord","year":"2017","journal-title":"NeurIPS"},{"key":"ref15","article-title":"Generative pretraining from pixels","author":"Chen","year":"2020","journal-title":"ICML"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01268"},{"key":"ref17","article-title":"Meta-world: A benchmark and evaluation for multitask and meta reinforcement learning","author":"Yu","year":"2020","journal-title":"CoRL"},{"key":"ref18","article-title":"Robonet: Large-scale multi-robot learning","author":"Dasari","year":"2019","journal-title":"CoRL"},{"key":"ref19","article-title":"A short note about kinetics-600","author":"Carreira","year":"2018"},{"key":"ref20","article-title":"Self-supervised visual planning with temporal skip connections","author":"Ebert","year":"2017","journal-title":"CoRL"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1177\/0278364913491297"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00068"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.632"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1082"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00235"},{"key":"ref26","article-title":"Towards accurate generative models of video: A new metric & challenges","author":"Unterthiner","year":"2018"},{"key":"ref27","article-title":"A good image generator is what you need for highresolution video synthesis","author":"Tian","year":"2021","journal-title":"ICLR"}],"event":{"name":"2022 IEEE International Conference on Image Processing (ICIP)","location":"Bordeaux, France","start":{"date-parts":[[2022,10,16]]},"end":{"date-parts":[[2022,10,19]]}},"container-title":["2022 IEEE International Conference on Image Processing (ICIP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9897158\/9897159\/09897982.pdf?arnumber=9897982","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,22]],"date-time":"2024-01-22T21:10:09Z","timestamp":1705957809000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9897982\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,10,16]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/icip46576.2022.9897982","relation":{},"subject":[],"published":{"date-parts":[[2022,10,16]]}}}