{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T03:40:21Z","timestamp":1771645221250,"version":"3.50.1"},"reference-count":17,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,7,15]],"date-time":"2024-07-15T00:00:00Z","timestamp":1721001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,7,15]],"date-time":"2024-07-15T00:00:00Z","timestamp":1721001600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100006190","name":"Research and Development","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006190","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100006190","name":"Research and Development","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006190","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,7,15]]},"DOI":"10.1109\/icme57554.2024.10687529","type":"proceedings-article","created":{"date-parts":[[2024,9,30]],"date-time":"2024-09-30T17:24:16Z","timestamp":1727717056000},"page":"1-6","source":"Crossref","is-referenced-by-count":3,"title":["InstructVid2Vid: Controllable Video Editing with Natural Language Instructions"],"prefix":"10.1109","author":[{"given":"Bosheng","family":"Qin","sequence":"first","affiliation":[{"name":"Zhejiang University,College of Computer Science and Technology"}]},{"given":"Juncheng","family":"Li","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Computer Science and Technology"}]},{"given":"Siliang","family":"Tang","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Computer Science and Technology"}]},{"given":"Tat-Seng","family":"Chua","sequence":"additional","affiliation":[{"name":"National University of Singapore,School of Computing"}]},{"given":"Yueting","family":"Zhuang","sequence":"additional","affiliation":[{"name":"Zhejiang University,College of Computer Science and Technology"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52729.2023.01764"},{"key":"ref2","article-title":"Dreamix: Video diffusion models are general video editors","author":"Molad","year":"2023"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52733.2024.00821"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/iccv51070.2023.00701"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01460"},{"key":"ref6","first-page":"12888","article-title":"Blip: Bootstrapping language-image pre-training for unified vision-language understanding and generation","volume-title":"Proceedings of the 39th International Conference on Machine Learning, ser. Series BLIP: Bootstrapping Language-Image Pre-training for Unified Vision-Language Understanding and Generation","volume":"162","author":"Li"},{"key":"ref7","article-title":"Zero-shot video editing using off-the-shelf image diffusion models","author":"Wang","year":"2023"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01460"},{"key":"ref9","article-title":"Edit-a-video: Single video editing with object-aware consistency","author":"Shin","year":"2023"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19784-0_41"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.02121"},{"key":"ref12","article-title":"Denoising diffusion implicit models","volume-title":"International Conference on Learning Representations","author":"Song"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/0004-3702(81)90024-2"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.image.2003.09.001"},{"key":"ref16","first-page":"6629","article-title":"Gans trained by a two time-scale update rule converge to a local nash equilibrium","volume-title":"Proceedings of the 31st International Conference on Neural Information Processing Systems, ser. Series GANs trained by a two time-scale update rule converge to a local nash equilibrium","author":"Heusel"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.308"}],"event":{"name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","location":"Niagara Falls, ON, Canada","start":{"date-parts":[[2024,7,15]]},"end":{"date-parts":[[2024,7,19]]}},"container-title":["2024 IEEE International Conference on Multimedia and Expo (ICME)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10685847\/10687354\/10687529.pdf?arnumber=10687529","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,1]],"date-time":"2024-10-01T06:13:38Z","timestamp":1727763218000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10687529\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,15]]},"references-count":17,"URL":"https:\/\/doi.org\/10.1109\/icme57554.2024.10687529","relation":{},"subject":[],"published":{"date-parts":[[2024,7,15]]}}}