{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T10:02:42Z","timestamp":1777888962801,"version":"3.51.4"},"reference-count":97,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001665","name":"French National Research Agency","doi-asserted-by":"publisher","award":["ANR-24-CE23-4369"],"award-info":[{"award-number":["ANR-24-CE23-4369"]}],"id":[{"id":"10.13039\/501100001665","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/iccv51701.2025.01680","type":"proceedings-article","created":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T19:45:49Z","timestamp":1777491949000},"page":"18078-18089","source":"Crossref","is-referenced-by-count":0,"title":["Ask and Remember: A Questions-Only Replay Strategy for Continual Visual Question Answering"],"prefix":"10.1109","author":[{"given":"Imad Eddine","family":"Marouf","sequence":"first","affiliation":[{"name":"T\u00e9l\u00e9com-Paris, Institut Polytechnique de Paris,LTCI,France"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Enzo","family":"Tartaglione","sequence":"additional","affiliation":[{"name":"T\u00e9l\u00e9com-Paris, Institut Polytechnique de Paris,LTCI,France"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"St\u00e9phane","family":"Lathuili\u00e8re","sequence":"additional","affiliation":[{"name":"T\u00e9l\u00e9com-Paris, Institut 
Polytechnique de Paris,LTCI,France"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Joost","family":"van de Weijer","sequence":"additional","affiliation":[{"name":"Universitat Aut\u00f3noma de Barcelona,Spain"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","author":"Agrawal","year":"2024","journal-title":"Pixtral 12b"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01219-9_9"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW60793.2023.00309"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.279"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.279"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01252-6_33"},{"key":"ref7","article-title":"Efficient lifelong learning with agem","author":"Chaudhry","year":"2018","journal-title":"arXiv preprint"},{"key":"ref8","article-title":"Continual learning with tiny episodic memories","volume":"abs\/1902.10486","author":"Chaudhry","year":"2019","journal-title":"CoRR"},{"key":"ref9","author":"Chaudhry","year":"2019","journal-title":"On tiny episodic memories in continual learning"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01034"},{"key":"ref11","author":"Cho","year":"2021","journal-title":"Unifying vision-and-language tasks via text generation"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/WACV61041.2025.00550"},{"key":"ref13","article-title":"Ratt: Recurrent attention to transient tasks for continual image captioning","author":"Del 
Chiaro","year":"2020","journal-title":"NeurIPS"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00528"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CSF57540.2023.00027"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58565-5_6"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00907"},{"key":"ref18","article-title":"Memory efficient continual learning with transformers","author":"Ermis","year":"2022","journal-title":"NeurIPS"},{"key":"ref19","article-title":"Vision language transformers: A survey","author":"Fields","year":"2023","journal-title":"arXiv preprint"},{"key":"ref20","article-title":"Sharpness-aware minimization for efficiently improving generalization","author":"Foret","year":"2020","journal-title":"arXiv preprint"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01055"},{"key":"ref22","article-title":"General Data Protection Regulation GDPR. General data protection regulation","year":"2016","journal-title":"Regulation (EU) 2016\/679 of the European Parliament and of the Council of 27 April 2016 on the protection of natural persons with regard to the processing of personal data and on the free movement of such data, and repealing Directive 95\/46\/EC"},{"key":"ref23","author":"Ghosh","year":"2024","journal-title":"Exploring the frontier of vision-language models: A survey of current methodologies and future directions"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1190\/1.9781560804048.ch13"},{"key":"ref25","volume-title":"Deep 
Learning","author":"Goodfellow","year":"2016"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.52202\/075280-0288"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1350"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1350"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00685"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.4140\/TCP.n.2015.249"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00092"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.01826"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.215"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01560"},{"key":"ref35","article-title":"Measuring compositional generalization: A comprehensive method on realistic data","author":"Keysers","year":"2019","journal-title":"arXiv preprint"},{"key":"ref36","article-title":"Adam: A method for stochastic optimization","author":"Kingma","year":"2015","journal-title":"ICLR"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1611835114"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1611835114"},{"key":"ref39","article-title":"Deep weight factorization: Sparse learning through the lens of artificial symmetries","author":"Kolb","year":"2025","journal-title":"ICLR"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-016-0981-7"},{"key":"ref41","first-page":"4568","article-title":"Mitigating the diminishing effect of elastic weight consolidation","volume-title":"Proceedings of the 29th International Conference on Computational Linguistics","author":"Kruengkrai"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1017\/S0140525X16001837"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00725"},{"key":"ref44","article-title":"BLIP-2: bootstrapping language-image pre-training with frozen image encoders and 
large language models","author":"Li","year":"2023","journal-title":"ICML"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02522"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2773081"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2773081"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/3547299"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.52202\/075280-1516"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1145\/3560815"},{"key":"ref52","article-title":"Gradient episodic memory for continual learning","author":"Lopez-Paz","year":"2017","journal-title":"NeurIPS"},{"key":"ref53","author":"Lopez-Paz","year":"2022","journal-title":"Gradient episodic memory for continual learning"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00718"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW53098.2021.00398"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-73209-6_18"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1037\/0033-295X.102.3.419"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1016\/s0079-7421(08)60536-8"},{"key":"ref59","article-title":"An empirical investigation of the role of pre-training in lifelong learning","author":"Mehta","year":"2021","journal-title":"arXiv preprint"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/iccvw60793.2023.00301"},{"key":"ref61","article-title":"Task formulation matters when learning continually: A case study in visual question answering","author":"Nikandrou","year":"2022","journal-title":"arXiv preprint"},{"key":"ref62","article-title":"Pytorch: An imperative style, high-performance deep learning 
library","author":"Paszke","year":"2019","journal-title":"NeurIPS"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00427"},{"key":"ref64","author":"Raffel","year":"2020","journal-title":"Exploring the limits of transfer learning with a unified text-to-text transformer"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/WACV56688.2023.00121"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.587"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2016.2577031"},{"key":"ref68","article-title":"Task-recency bias strikes back: Adapting covariances in exemplar-free class incremental learning","author":"Rype\u015b\u0107","year":"2025","journal-title":"NeurIPS"},{"key":"ref69","article-title":"Gradient projection memory for continual learning","author":"Saha","year":"2021","journal-title":"ICLR"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20074-8_9"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01291"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01146"},{"key":"ref73","article-title":"Climb: A continual learning benchmark for vision-and-language tasks","author":"Srinivasan","year":"2022","journal-title":"NeurIPS"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1186\/s42400-024-00213-z"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1580"},{"key":"ref76","author":"Vyas","year":"2021","journal-title":"Learning soft labels via meta learning"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01620"},{"key":"ref78","article-title":"S-prompts learning with pre-trained transformers: An occam\u2019s razor for domain incremental 
learning","author":"Wang","year":"2022","journal-title":"NeurIPS"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-acl.74"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00027"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19809-0_36"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00024"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00264"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00558"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00965"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20059-5_3"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01970"},{"key":"ref88","article-title":"Zero-shot video question answering via frozen bidirectional language models","author":"Yang","year":"2022","journal-title":"NeurIPS"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00518"},{"key":"ref90","article-title":"Self-chained image-language model for video localization and question answering","author":"Yu","year":"2023","journal-title":"arXiv preprint"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1145\/3389685"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1145\/3386263.3407599"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02270"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00344"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01831"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.255"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52733.2024.02223"}],"event":{"name":"2025 IEEE\/CVF International Conference on Computer Vision (ICCV)","location":"Honolulu, HI, 
USA","start":{"date-parts":[[2025,10,19]]},"end":{"date-parts":[[2025,10,25]]}},"container-title":["2025 IEEE\/CVF International Conference on Computer Vision (ICCV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11443115\/11443287\/11446056.pdf?arnumber=11446056","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T05:03:48Z","timestamp":1777611828000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11446056\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":97,"URL":"https:\/\/doi.org\/10.1109\/iccv51701.2025.01680","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}