{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,20]],"date-time":"2026-02-20T18:55:36Z","timestamp":1771613736345,"version":"3.50.1"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,8,31]],"date-time":"2025-08-31T00:00:00Z","timestamp":1756598400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,8,31]],"date-time":"2025-08-31T00:00:00Z","timestamp":1756598400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,8,31]]},"DOI":"10.1109\/mlsp62443.2025.11204231","type":"proceedings-article","created":{"date-parts":[[2025,10,24]],"date-time":"2025-10-24T17:15:52Z","timestamp":1761326152000},"page":"1-5","source":"Crossref","is-referenced-by-count":2,"title":["Colflor: Towards Bert-Size Vision-Language Document Retrieval Models"],"prefix":"10.1109","author":[{"given":"Ahmed","family":"Masry","sequence":"first","affiliation":[{"name":"York University,Department of Electrical Engineering and Computer Science,Toronto,Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Enamul","family":"Hoque","sequence":"additional","affiliation":[{"name":"York University,Department of Electrical Engineering and Computer Science,Toronto,Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","author":"Mitra","year":"2019","journal-title":"An updated duet model for passage re-ranking"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/3397271.3401075"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1410"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.eacl-main.148"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00225"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/wacv51458.2022.00264"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-acl.177"},{"key":"ref8","author":"Faysse","year":"2024","journal-title":"Colpali: Efficient document retrieval with vision language models"},{"key":"ref9","author":"Beyer","year":"2024","journal-title":"Paligemma: A versatile 3b vlm for transfer"},{"key":"ref10","author":"Wang","year":"2024","journal-title":"Qwen2-vl: Enhancing vision-language model\u2019s perception of the world at any resolution"},{"key":"ref11","author":"Liu","year":"2023","journal-title":"Visual instruction tuning"},{"key":"ref12","author":"Chen","year":"2025","journal-title":"Expanding performance boundaries of opensource multimodal models with model, data, and testtime scaling"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52733.2024.00461"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20053-3_5"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"ref16","author":"Radford","year":"2021","journal-title":"Learning transferable visual models from natural language supervision"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548422"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.775"},{"key":"ref19","year":"2024","journal-title":"Introducing the next generation of claude"},{"key":"ref20","author":"Koukounas","year":"2024","journal-title":"Jina clip: Your clip model is also your text retriever"},{"key":"ref21","author":"Nussbaum","year":"2024","journal-title":"Nomic embed vision: Expanding the latent space"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/iccv51070.2023.01100"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/iccv51070.2023.01100"},{"key":"ref24","author":"Team","year":"2025","journal-title":"Nomic embed multimodal: Interleaved text, image, and screenshots for visual document retrieval"}],"event":{"name":"2025 IEEE 35th International Workshop on Machine Learning for Signal Processing (MLSP)","location":"Istanbul, Turkiye","start":{"date-parts":[[2025,8,31]]},"end":{"date-parts":[[2025,9,3]]}},"container-title":["2025 IEEE 35th International Workshop on Machine Learning for Signal Processing (MLSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11204201\/11204202\/11204231.pdf?arnumber=11204231","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T18:37:09Z","timestamp":1762367829000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11204231\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,31]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/mlsp62443.2025.11204231","relation":{},"subject":[],"published":{"date-parts":[[2025,8,31]]}}}