{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,25]],"date-time":"2026-02-25T21:03:08Z","timestamp":1772053388224,"version":"3.50.1"},"reference-count":17,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,11,21]],"date-time":"2023-11-21T00:00:00Z","timestamp":1700524800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,11,21]],"date-time":"2023-11-21T00:00:00Z","timestamp":1700524800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,11,21]]},"DOI":"10.1109\/snams60348.2023.10375440","type":"proceedings-article","created":{"date-parts":[[2024,1,2]],"date-time":"2024-01-02T20:36:22Z","timestamp":1704227782000},"page":"1-5","source":"Crossref","is-referenced-by-count":5,"title":["Pushing Boundaries: Exploring Zero Shot Object Classification with Large Multimodal Models"],"prefix":"10.1109","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9717-3252","authenticated-orcid":false,"given":"Ashhadul","family":"Islam","sequence":"first","affiliation":[{"name":"College of Science and Engineering, Hamad Bin Khalifa University,Doha,Qatar"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5145-1990","authenticated-orcid":false,"given":"Md. Rafiul","family":"Biswas","sequence":"additional","affiliation":[{"name":"College of Science and Engineering, Hamad Bin Khalifa University,Doha,Qatar"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1521-5568","authenticated-orcid":false,"given":"Wajdi","family":"Zaghouani","sequence":"additional","affiliation":[{"name":"College of Humanities and Social Sciences, Hamad Bin Khalifa University,Doha,Qatar"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2336-0490","authenticated-orcid":false,"given":"Samir Brahim","family":"Belhaouari","sequence":"additional","affiliation":[{"name":"College of Science and Engineering, Hamad Bin Khalifa University,Doha,Qatar"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7389-3274","authenticated-orcid":false,"given":"Zubair","family":"Shah","sequence":"additional","affiliation":[{"name":"College of Science and Engineering, Hamad Bin Khalifa University,Doha,Qatar"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jacr.2023.07.010"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.2196\/48659"},{"key":"ref3","author":"Lee","year":"2023","journal-title":"Building multimodal ai chatbots"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.bspc.2023.105292"},{"key":"ref5","author":"Bagdasaryan","year":"2023","journal-title":"Abusing images and sounds for indirect instruction injection in multimodal llms"},{"key":"ref6","author":"Liu","year":"2023","journal-title":"Visual instruction tuning"},{"key":"ref7","author":"Radford","year":"2021","journal-title":"Learning transferable visual models from natural language supervision"},{"key":"ref8","author":"Taori","year":"2023","journal-title":"Stanford alpaca: An instruction-following llama model"},{"key":"ref9","author":"Liu","year":"2023","journal-title":"Improved baselines with visual instruction tuning"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00686"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2211477"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1017\/9789048505456.015"},{"key":"ref13","author":"Melody","journal-title":"Hymenoptera Data"},{"key":"ref14","author":"Ahsan","year":"2022","journal-title":"Image data collection and implementation of deep learning-based model in detecting monkeypox disease using modified vgg16"},{"key":"ref15","author":"Ahsan","year":"2022","journal-title":"Monkeypox image data collection"},{"key":"ref16","article-title":"Autistic Children Facial Image Data Set","volume-title":"G.","year":"2023"},{"key":"ref17","article-title":"GitHub - haotian-liu\/LLaVA: [NeurIPS23 Oral] Visual Instruction Tuning: LLaVA (Large Language-and-Vision Assistant) built towards GPT-4V level capabilities.","journal-title":"Haotian-Liu"}],"event":{"name":"2023 Tenth International Conference on Social Networks Analysis, Management and Security (SNAMS)","location":"Abu Dhabi, United Arab Emirates","start":{"date-parts":[[2023,11,21]]},"end":{"date-parts":[[2023,11,24]]}},"container-title":["2023 Tenth International Conference on Social Networks Analysis, Management and Security (SNAMS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10375374\/10375393\/10375440.pdf?arnumber=10375440","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,12]],"date-time":"2024-01-12T22:26:01Z","timestamp":1705098361000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10375440\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,11,21]]},"references-count":17,"URL":"https:\/\/doi.org\/10.1109\/snams60348.2023.10375440","relation":{},"subject":[],"published":{"date-parts":[[2023,11,21]]}}}