{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T20:44:26Z","timestamp":1776977066745,"version":"3.51.4"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2026,2,24]],"date-time":"2026-02-24T00:00:00Z","timestamp":1771891200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,2,24]],"date-time":"2026-02-24T00:00:00Z","timestamp":1771891200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026,2,24]]},"DOI":"10.1109\/icaiic68212.2026.11454372","type":"proceedings-article","created":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T19:50:24Z","timestamp":1774986624000},"page":"1517-1522","source":"Crossref","is-referenced-by-count":0,"title":["Enhancing Large Vision\u2013Language Models for Multimodal Defect Detection via SFT\u2013GRPO Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Hung Viet","family":"Nguyen","sequence":"first","affiliation":[{"name":"INJE University,Department of Digital Anti-Aging Healthcare,Kimhae,Rep. of Korea,50834"}]},{"given":"Hyojin","family":"Park","sequence":"additional","affiliation":[{"name":"Kyungnam University,Gyeongnam Intelligence Innovation Center (GIIC),Changwon,Rep. of Korea,51767"}]},{"given":"Namhyun","family":"Yoo","sequence":"additional","affiliation":[{"name":"Kyungnam University,Department of Computer Engineering,Changwon,Rep. of Korea,51767"}]},{"given":"Jinhong","family":"Yang","sequence":"additional","affiliation":[{"name":"INJE University,Department of Medical IT,Kimhae,Rep. of Korea,50834"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1108\/tqm-11-2023-0361"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/s10796-022-10252-x"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-97-6790-8_5"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/access.2024.3425166"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.3390\/mi14030570"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.71465\/ajipe.3405"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.119623"},{"key":"ref9","article-title":"LLaVA-NeXT: Improved reasoning, OCR, and world knowledge","author":"Lee","year":"2025","journal-title":"LLaVA"},{"key":"ref10","article-title":"Gemma 3 Technical Report","volume-title":"CoRR","volume":"abs\/2503.19786","author":"Kamath","year":"2025"},{"key":"ref11","author":"Bai","year":"2025","journal-title":"Qwen2.5-VL Technical Report"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1145\/3696410.3714764"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i3.27963"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1088\/1742-6596\/2897\/1\/012050"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.3390\/electronics14142748"},{"key":"ref16","first-page":"2052","article-title":"ReConPatch: Contrastive Patch Representation Learning for Industrial Anomaly Detection","volume-title":"presented at the Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, 2024","author":"Hyun","year":"2025"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/smc54092.2024.10831766"},{"key":"ref18","first-page":"20405","article-title":"Dinomaly: The Less Is More Philosophy in Multi-Class Unsupervised Anomaly Detection","volume-title":"presented at the Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2025","author":"Guo","year":"2025"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/access.2025.3525567"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01580"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72761-0_4"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01878"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1115\/DETC2025-168875"},{"key":"ref24","first-page":"4097","article-title":"Detect, Classify, Act: Categorizing Industrial Anomalies with MultiModal Large Language Models","volume-title":"presented at the Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2025","author":"Mokhtar","year":"2025"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v39i4.32433"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.01897"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/tase.2025.3591656"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/icdm65498.2025.00097"},{"key":"ref29","article-title":"AnomalyR 1","author":"Chao","year":"2025","journal-title":"A GRPO-based End-to-end MLLM for Industrial Anomaly Detection"},{"key":"ref30","article-title":"LADReasoner","author":"Li","year":"2025","journal-title":"Tiny Multimodal Models are Good Reasoners for Logical Anomaly Detection"},{"key":"ref31","article-title":"AIHub","volume-title":"LNG Tank Quality Inspection Image Data.","year":"2025"},{"key":"ref32","volume-title":"Unsloth","author":"Han","year":"(2023)"}],"event":{"name":"2026 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)","location":"Tokyo, Japan","start":{"date-parts":[[2026,2,24]]},"end":{"date-parts":[[2026,2,27]]}},"container-title":["2026 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11454127\/11454137\/11454372.pdf?arnumber=11454372","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,23]],"date-time":"2026-04-23T19:56:09Z","timestamp":1776974169000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11454372\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,2,24]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/icaiic68212.2026.11454372","relation":{},"subject":[],"published":{"date-parts":[[2026,2,24]]}}}