{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,11]],"date-time":"2026-02-11T21:29:02Z","timestamp":1770845342121,"version":"3.50.1"},"reference-count":33,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,5]],"date-time":"2025-10-05T00:00:00Z","timestamp":1759622400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,5]],"date-time":"2025-10-05T00:00:00Z","timestamp":1759622400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,5]]},"DOI":"10.1109\/smc58881.2025.11343602","type":"proceedings-article","created":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T20:54:44Z","timestamp":1769633684000},"page":"1550-1555","source":"Crossref","is-referenced-by-count":0,"title":["Few-Shot Fine-Grained Image Classification via Vision Transformer"],"prefix":"10.1109","author":[{"given":"Yongqi","family":"Liu","sequence":"first","affiliation":[{"name":"Chongqing University,College of Computer Science,Chongqing,China,400044"}]},{"given":"Tong","family":"Xiao","sequence":"additional","affiliation":[{"name":"Tsinghua University,Department of Computer Science and Technology,Beijing,China,100084"}]},{"given":"Zeao","family":"Chen","sequence":"additional","affiliation":[{"name":"Chongqing University,College of Computer Science,Chongqing,China,400044"}]},{"given":"Chen","family":"Zhou","sequence":"additional","affiliation":[{"name":"Chongqing University,College of Computer Science,Chongqing,China,400044"}]},{"given":"Zhi-Jie","family":"Wang","sequence":"additional","affiliation":[{"name":"Chongqing University,College of Computer Science,Chongqing,China,400044"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3485133"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.9"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3582688"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298775"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00977"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2023.3236636"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2020.3043128"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i5.28208"},{"key":"ref9","article-title":"Deep meta-learning: Learning to learn in the concept space","volume":"abs\/1802.03596","author":"Zhou","year":"2018","journal-title":"CoRR"},{"key":"ref10","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2021","journal-title":"ICLR"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_17"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01887"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00676"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i1.19967"},{"key":"ref15","first-page":"4077","article-title":"Prototypical networks for few-shot learning","author":"Snell","year":"2017","journal-title":"NIPS"},{"key":"ref16","first-page":"1126","article-title":"Model-agnostic meta-learning for fast adaptation of deep networks","author":"Finn","year":"2017","journal-title":"ICML"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3230709"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2019.2921876"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.170"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01216-8_38"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6822"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2024.3405713"},{"key":"ref23","first-page":"3057","article-title":"Meta-reinforced synthetic data for one-shot fine-grained visual recognition","author":"Tsutsui","year":"2019","journal-title":"NeurIPS"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3680593"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.110158"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.110967"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i3.25383"},{"key":"ref28","article-title":"Adaptformer: Adapting vision transformers for scalable visual recognition","author":"Chen","year":"2022","journal-title":"NIPS"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107404"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00886"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475532"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.110485"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.110736"}],"event":{"name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","location":"Vienna, Austria","start":{"date-parts":[[2025,10,5]]},"end":{"date-parts":[[2025,10,8]]}},"container-title":["2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11342430\/11342431\/11343602.pdf?arnumber=11343602","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,11]],"date-time":"2026-02-11T20:50:31Z","timestamp":1770843031000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11343602\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,5]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/smc58881.2025.11343602","relation":{},"subject":[],"published":{"date-parts":[[2025,10,5]]}}}