{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T06:25:04Z","timestamp":1774419904707,"version":"3.50.1"},"reference-count":48,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:00:00Z","timestamp":1743897600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:00:00Z","timestamp":1743897600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,4,6]]},"DOI":"10.1109\/icassp49660.2025.10889269","type":"proceedings-article","created":{"date-parts":[[2025,3,12]],"date-time":"2025-03-12T17:15:19Z","timestamp":1741799719000},"page":"1-5","source":"Crossref","is-referenced-by-count":0,"title":["KARST: Multi-Kernel Kronecker Adaptation with Re-Scaling Transmission for Visual Classification"],"prefix":"10.1109","author":[{"given":"Yue","family":"Zhu","sequence":"first","affiliation":[{"name":"Dalian University of Technology,Dalian,China"}]},{"given":"Haiwen","family":"Diao","sequence":"additional","affiliation":[{"name":"Dalian University of Technology,Dalian,China"}]},{"given":"Shang","family":"Gao","sequence":"additional","affiliation":[{"name":"Dalian University of Technology,Dalian,China"}]},{"given":"Long","family":"Chen","sequence":"additional","affiliation":[{"name":"The Hong Kong University of Science and Technology,Hong Kong,China"}]},{"given":"Huchuan","family":"Lu","sequence":"additional","affiliation":[{"name":"Dalian University of Technology,Dalian,China"}]}],"member":"263","reference":[{"key":"ref1","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2021","journal-title":"ICLR"},{"key":"ref2","article-title":"Llama: Open and efficient foundation language models","author":"Touvron","year":"2023"},{"key":"ref3","article-title":"Unveiling encoder-free vision-language models","author":"Diao","year":"2024"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i2.16209"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02714"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72784-9_5"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-short.1"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19827-4_41"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2024.3485498"},{"key":"ref10","article-title":"Lora: Low-rank adaptation of large language models","author":"Hu","year":"2022","journal-title":"ICLR"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i1.25187"},{"key":"ref12","first-page":"1022","article-title":"Compacter: Efficient low-rank hypercomplex adapter layers","author":"Mahabadi","year":"2021","journal-title":"NeurIPS"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-85747-8_4"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/cvprw63382.2024.00804"},{"key":"ref15","article-title":"One-for-all: Generalized lora for parameter-efficient fine-tuning","author":"Chavan","year":"2023"},{"key":"ref16","article-title":"Multilora: Democratizing lora for better multi-task learning","author":"Wang","year":"2023"},{"key":"ref17","article-title":"Lora+: Efficient low rank adaptation of large models","author":"Hayou","year":"2024"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-short.107"},{"key":"ref19","article-title":"A large-scale study of representation learning with the visual task adaptation benchmark","author":"Zhai","year":"2019"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2006.79"},{"key":"ref21","article-title":"Learning multiple layers of features from tiny images","author":"Krizhevsky","year":"2009"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.461"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICVGIP.2008.47"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248092"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5539970"},{"issue":"2","key":"ref26","first-page":"4","article-title":"Reading digits in natural images with unsupervised feature learning","volume-title":"NIPS workshop on deep learning and unsupervised feature learning","volume":"2011","author":"Netzer"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2017.2675998"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/JSTARS.2019.2918242"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-00934-2_24"},{"key":"ref30","article-title":"Kaggle diabetic retinopathy detection","author":"Kaggle","year":"2015"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.215"},{"key":"ref32","article-title":"dsprites: Disentanglement testing sprites dataset","author":"Matthey","year":"2017"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2004.1315150"},{"key":"ref34","article-title":"Deepmind lab","author":"Beattie","year":"2016"},{"key":"ref35","first-page":"1","article-title":"Vision meets robotics: The kitti dataset. the international journal of robotics research","author":"Geiger","journal-title":"Int. J. Rob. Res"},{"key":"ref36","article-title":"Fine-grained visual classification of aircraft","author":"Maji","year":"2013"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10599-4_29"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW.2013.77"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.42"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2024.3435939"},{"key":"ref41","first-page":"5389","article-title":"Do imagenet classifiers generalize to imagenet?","volume-title":"International conference on machine learning.","author":"Recht","year":"2019"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref43","article-title":"LST: ladder side-tuning for parameter and memory efficient transfer learning","author":"Sung","year":"2022","journal-title":"NeurIPS"},{"key":"ref44","article-title":"Adapt-former: Adapting vision transformers for scalable visual recognition","author":"Chen","year":"2022","journal-title":"NeurIPS"},{"key":"ref45","article-title":"Scaling & shifting your features: A new baseline for efficient model tuning","author":"Lian","year":"2022","journal-title":"NeurIPS"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i11.29096"},{"key":"ref47","article-title":"Heat: Head-level parameter efficient adaptation of vision transformers with taylor-expansion importance scores","author":"Zhong","year":"2024"},{"key":"ref48","article-title":"Sparse-tuning: Adapting vision transformers with efficient fine-tuning and inference","author":"Liu","year":"2024"}],"event":{"name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Hyderabad, India","start":{"date-parts":[[2025,4,6]]},"end":{"date-parts":[[2025,4,11]]}},"container-title":["ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10887540\/10887541\/10889269.pdf?arnumber=10889269","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T05:25:20Z","timestamp":1774416320000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10889269\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,6]]},"references-count":48,"URL":"https:\/\/doi.org\/10.1109\/icassp49660.2025.10889269","relation":{},"subject":[],"published":{"date-parts":[[2025,4,6]]}}}