{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T19:49:35Z","timestamp":1776887375425,"version":"3.51.2"},"reference-count":43,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:00:00Z","timestamp":1743897600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:00:00Z","timestamp":1743897600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,4,6]]},"DOI":"10.1109\/icassp49660.2025.10888395","type":"proceedings-article","created":{"date-parts":[[2025,3,12]],"date-time":"2025-03-12T17:15:02Z","timestamp":1741799702000},"page":"1-5","source":"Crossref","is-referenced-by-count":8,"title":["Enhancing Remote Sensing Vision-Language Models for Zero-Shot Scene Classification"],"prefix":"10.1109","author":[{"given":"Karim","family":"El Khoury","sequence":"first","affiliation":[{"name":"UCLouvain,Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Maxime","family":"Zanella","sequence":"additional","affiliation":[{"name":"UCLouvain,Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Beno\u00eet","family":"G\u00e9rin","sequence":"additional","affiliation":[{"name":"UCLouvain,Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tiffanie","family":"Godelaine","sequence":"additional","affiliation":[{"name":"UCLouvain,Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Beno\u00eet","family":"Macq","sequence":"additional","affiliation":[{"name":"UCLouvain,Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sa\u00efd","family":"Mahmoudi","sequence":"additional","affiliation":[{"name":"UMons,Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christophe","family":"De Vleeschouwer","sequence":"additional","affiliation":[{"name":"UCLouvain,Belgium"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ismail","family":"Ben Ayed","sequence":"additional","affiliation":[{"name":"&#x00C9;TS Montreal,Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Land-cover change detection using paired openstreetmap data and optical highresolution imagery via object-guided transformer","author":"Chen","year":"2023"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2020.111716"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.tplants.2018.11.007"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3330886"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/s13753-023-00526-6"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP51287.2024.10647448"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58598-3_10"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46478-7_5"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.3390\/rs12030405"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.3390\/app10248931"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2024.3390838"},{"key":"ref12","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Proc. 38th Int. Conf. Mach. Learn","volume":"139","author":"Radford"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2024.3449154"},{"key":"ref14","article-title":"Towards helpful and honest remote sensing large vision language model","author":"Pang","year":"2024"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i6.28393"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72904-1_26"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/MGRS.2024.3383473"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/72.788640"},{"key":"ref19","first-page":"200","article-title":"Transductive inference for text classification using support vector machines","volume-title":"ICML","volume":"99","author":"Joachims"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02722"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-73471-7_16"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1056\/aioa2400640"},{"key":"ref23","article-title":"Does clip benefit visual question answering in the medical domain as much as it does in the general domain?","author":"Eslami","year":"2021"},{"key":"ref24","article-title":"Skysensegpt: A fine-grained instruction tuning dataset and model for remote sensing vision-language understanding","author":"Luo","year":"2024"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/tgrs.2024.3409624"},{"key":"ref26","article-title":"Remote sensing vision-language foundation models without annotations via ground remote alignment","volume-title":"ICLR","author":"Mall"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2025.03.028"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.3390\/rs16091477"},{"key":"ref29","article-title":"A baseline for few-shot image classification","volume-title":"ICLR","author":"Dhillon"},{"key":"ref30","first-page":"2445","article-title":"Information maximization for fewshot learning","volume-title":"Adv. Neural Inf. Process. Syst","volume":"33","author":"Boudiaf"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_43"},{"key":"ref32","article-title":"Laplacian regularized few-shot learning","volume-title":"ICML","author":"Ziko"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-73471-7_16"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2017.2685945"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/IGARSS.2018.8519248"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2020.09.020"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2018.2864987"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2018.01.004"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2017.2675998"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1117\/1.JRS.10.035004"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.3390\/s20061594"},{"key":"ref42","article-title":"Structural high-resolution satellite image indexing","volume":"38","author":"Xia","year":"2010","journal-title":"Int. Arch. Photogramm. Remote Sens. Spatial Inf. Sci."},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02245"}],"event":{"name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Hyderabad, India","start":{"date-parts":[[2025,4,6]]},"end":{"date-parts":[[2025,4,11]]}},"container-title":["ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10887540\/10887541\/10888395.pdf?arnumber=10888395","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T05:22:07Z","timestamp":1774416127000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10888395\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,6]]},"references-count":43,"URL":"https:\/\/doi.org\/10.1109\/icassp49660.2025.10888395","relation":{},"subject":[],"published":{"date-parts":[[2025,4,6]]}}}