{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,21]],"date-time":"2026-01-21T22:02:57Z","timestamp":1769032977792,"version":"3.49.0"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T00:00:00Z","timestamp":1761091200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T00:00:00Z","timestamp":1761091200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100003759","name":"Universidad Polit\u00e9cnica de Madrid (Programa Propio I+D+i)","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003759","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,22]]},"DOI":"10.1109\/cbmi66578.2025.11339266","type":"proceedings-article","created":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T20:38:56Z","timestamp":1768941536000},"page":"1-7","source":"Crossref","is-referenced-by-count":0,"title":["Exploring the Effect of Size, Architecture and Fine-Tuning Hyperparameters on Large Visual-Language Model Adaptation for Video Memorability Prediction"],"prefix":"10.1109","author":[{"given":"David","family":"Luna-Garc\u00eda","sequence":"first","affiliation":[{"name":"Universidad Polit&#x00E9;cnica de Madrid,THAU Group, IPTC,Madrid,Spain"}]},{"given":"Iv\u00e1n","family":"Mart\u00edn-Fern\u00e1ndez","sequence":"additional","affiliation":[{"name":"Universidad Polit&#x00E9;cnica de Madrid,THAU Group, IPTC,Madrid,Spain"}]},{"given":"Sergio","family":"Esteban-Romero","sequence":"additional","affiliation":[{"name":"Universidad Polit&#x00E9;cnica de Madrid,THAU Group, IPTC,Madrid,Spain"}]},{"given":"Manuel","family":"Gil-Mart\u00edn","sequence":"additional","affiliation":[{"name":"Universidad Polit&#x00E9;cnica de Madrid,THAU Group, IPTC,Madrid,Spain"}]},{"given":"Fernando","family":"Fern\u00e1ndez-Mart\u00ednez","sequence":"additional","affiliation":[{"name":"Universidad Polit&#x00E9;cnica de Madrid,THAU Group, IPTC,Madrid,Spain"}]}],"member":"263","reference":[{"key":"ref1","volume-title":"Long-Term Ad Memorability: Understanding & Generating Memorable Ads","author":"Harini","year":"2023"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/3617233.3617260"},{"key":"ref3","volume-title":"Multimodal memorability: Modeling effects of semantics and decay on video memorability","author":"Newman","year":"2023"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.670"},{"key":"ref5","doi-asserted-by":"crossref","DOI":"10.1007\/s44267-024-00050-1","volume-title":"Effectiveness Assessment of Recent Large Vision-Language Models","author":"Jiang","year":"2024"},{"key":"ref6","volume-title":"LoRA: Low-Rank Adaptation of Large Language Models","author":"Hu","year":"2021"},{"key":"ref7","volume-title":"Qwen- VL: A Versatile Vision-Language Model for Understanding, Localization, Text Reading, and Beyond","author":"Bai","year":"2023"},{"key":"ref8","volume-title":"Qwen2.5-VL Technical Report","author":"Bai","year":"2025"},{"issue":"6","key":"ref9","doi-asserted-by":"crossref","DOI":"10.3390\/s25061661","article-title":"Parameter-Efficient Adaptation of Large Vision-Language Models for Video Memorability Prediction","volume":"25","author":"Mart\u00edn-Fernandez","year":"2025","journal-title":"Sensors"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"104714","DOI":"10.1016\/j.cognition.2021.104714","article-title":"Visual memorability in the absence of semantic content","volume":"212","author":"Lin","year":"2021","journal-title":"Cognition"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1038\/s41562-020-0901-2"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.21236\/ADA554133"},{"key":"ref13","volume-title":"The Illustrated Transformer","author":"Alammar","year":"2018"},{"key":"ref14","volume-title":"Low-rank adaptation (LoRA) for fine-tuning large models"},{"key":"ref15","article-title":"THAU-UPM at EmoSPeech-IberLEF2024: Efficient Adaptation of Mono-modal and Multi-modal Large Language Models for Automatic Speech Emotion Recognition","volume-title":"Proceedings of the Iberian Languages Evaluation Fo-rum (IberLEF 2024), Co-Located with the 40th Conference of the Span-ish Society for Natural Language Processing (SEPLN 2024)","author":"Esteban-Romero"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.3390\/sym17081349"},{"key":"ref17","first-page":"10088","article-title":"QLoRA: Efficient Finetuning of Quantized LLMs","volume-title":"Proceedings of the Ad-vances in Neural Information Processing Systems, New Orleans, LA, USA","volume":"36","author":"Dettmers","year":"2023"},{"key":"ref18","article-title":"Overview of The MediaEval 2023 Predicting Video Memorability Task","volume-title":"Proceedings of the MediaEval \u201923: Multimedia Evaluation Workshop","author":"Constantin"},{"key":"ref19","volume-title":"arXiv preprint","author":"Chen","year":"2023"},{"key":"ref20","volume-title":"Video-LLaMA: An Instruction-tuned Audio- Visual Language Model for Video Understanding","author":"Zhang","year":"2023"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3206025.3206056"},{"key":"ref22","volume-title":"Magerit v3: Documentacion del sistema","author":"de Supercomputacion","year":"2025"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00033"},{"key":"ref24","article-title":"Something-Anything: Disentangling the effect of semantic content for video transformers","volume-title":"Proceedings of the 36th Conference on Neural Information Processing Systems (NeurIPS 2022) Datasets and Benchmarks Track","author":"Huber"}],"event":{"name":"2025 International Conference on Content-Based Multimedia Indexing (CBMI)","location":"Dublin, Ireland","start":{"date-parts":[[2025,10,22]]},"end":{"date-parts":[[2025,10,24]]}},"container-title":["2025 International Conference on Content-Based Multimedia Indexing (CBMI)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11339229\/11339242\/11339266.pdf?arnumber=11339266","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,21]],"date-time":"2026-01-21T07:11:18Z","timestamp":1768979478000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11339266\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,22]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/cbmi66578.2025.11339266","relation":{},"subject":[],"published":{"date-parts":[[2025,10,22]]}}}