{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T10:02:16Z","timestamp":1777888936826,"version":"3.51.4"},"reference-count":43,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62176043,U22A2097"],"award-info":[{"award-number":["62176043,U22A2097"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/iccv51701.2025.02110","type":"proceedings-article","created":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T19:45:49Z","timestamp":1777491949000},"page":"22728-22737","source":"Crossref","is-referenced-by-count":0,"title":["Borrowing Eyes for the Blind Spot: Overcoming Data Scarcity in Malicious Video Detection Via Cross-Domain Retrieval Augmentation"],"prefix":"10.1109","author":[{"given":"Rongpei","family":"Hong","sequence":"first","affiliation":[{"name":"University of Electronic Science and Technology of China,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jian","family":"Lang","sequence":"additional","affiliation":[{"name":"University of Electronic Science and Technology of China,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ting","family":"Zhong","sequence":"additional","affiliation":[{"name":"University of Electronic Science and Technology of China,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fan","family":"Zhou","sequence":"additional","affiliation":[{"name":"University of Electronic Science and Technology of China,China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00676"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/NILES63360.2024.10753192"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-021-09975-1"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2102.05095"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612426"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3680663"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/p19-1239"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/3459637.3482212"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1609\/icwsm.v17i1.22209"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.24818\/ida-ql\/2019.5"},{"key":"ref12","article-title":"An Image is Worth 16\u00d716 Words: Transformers for Image Recognition at Scale","volume-title":"International Conference on Learning Representations (ICLR)","author":"Dosovitskiy","year":"2021"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00630"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72627-9_19"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3696410.3714559"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.223"},{"key":"ref17","article-title":"The Hateful Memes Challenge: Detecting Hate Speech in Multimodal Memes","volume-title":"Conference on Neural Information Processing Systems (NeurIPS)","author":"Kiela","year":"2020"},{"key":"ref18","first-page":"5583","article-title":"Vilt: Vision-and-Language Transformer Without Convolution or Region Supervision","volume-title":"International Conference on Machine Learning (ICML)","author":"Kim","year":"2021"},{"key":"ref19","article-title":"Videopoet: A Large Language Model for Zero-Shot Video Generation","volume-title":"International Conference on Machine Learning (ICML)","author":"Kondratyuk","year":"2024"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3696410.3714560"},{"key":"ref21","article-title":"Llava-OneVision: Easy Visual Task Transfer","volume":"abs\/2408.03326","author":"Li","year":"2024","journal-title":"arXiv"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/icme59968.2025.11209008"},{"key":"ref23","article-title":"Sora: A Review on Background, Technology, Limitations, and Opportunities of Large Vision Models","volume":"abs\/2402.17177","author":"Liu","year":"2024","journal-title":"arXiv"},{"key":"ref24","article-title":"Decoupled Weight Decay Regularization","volume-title":"International Conference on Learning Representations (ICLR)","author":"Loshchilov","year":"2019"},{"key":"ref25","first-page":"2579","article-title":"Visualizing Data using t-SNE","volume":"9","author":"Maaten","year":"2008","journal-title":"Journal of Machine Learning Research"},{"key":"ref26","article-title":"r\/Fakeddit: A New Multimodal Benchmark Dataset for Fine-grained Fake News Detection","volume":"abs\/1911.03854","author":"Nakamura","year":"2019","journal-title":"arXiv"},{"key":"ref27","article-title":"St-Adapter: Parameter-Efficient Image-to-Video Transfer Learning","volume-title":"Conference on Neural Information Processing Systems (NeurIPS)","author":"Pan","year":"2022"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1108\/OIR-03-2018-0101"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i12.26689"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-acl.756"},{"key":"ref31","first-page":"8748","article-title":"Learning Transferable Visual Models From Natural Language Supervision","volume-title":"International Conference on Machine Learning (ICML)","author":"Radford","year":"2021"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/BigData52589.2021.9671928"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1089\/big.2020.0062"},{"key":"ref34","first-page":"568","article-title":"Two-Stream Convolutional Networks for Action Recognition in Videos","volume-title":"Conference on Neural Information Processing Systems (NeurIPS)","author":"Simonyan","year":"2014"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3681521"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/3696410.3714534"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46484-8_2"},{"key":"ref38","article-title":"Qwen2-VL: Enhancing Vision-Language Model\u2019s Perception of the World at Any Resolution","volume":"abs\/2409.12191","author":"Wang","year":"2024","journal-title":"arXiv"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00701"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58577-8_20"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548255"},{"key":"ref42","article-title":"Recapture: Generative Video Camera Controls for User-Provided Videos using Masked Video Fine-Tuning","author":"Zhang","year":"2024","journal-title":"arXiv"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01751"}],"event":{"name":"2025 IEEE\/CVF International Conference on Computer Vision (ICCV)","location":"Honolulu, HI, USA","start":{"date-parts":[[2025,10,19]]},"end":{"date-parts":[[2025,10,25]]}},"container-title":["2025 IEEE\/CVF International Conference on Computer Vision (ICCV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11443115\/11443287\/11445694.pdf?arnumber=11445694","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T05:02:58Z","timestamp":1777611778000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11445694\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":43,"URL":"https:\/\/doi.org\/10.1109\/iccv51701.2025.02110","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}