{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,10]],"date-time":"2026-03-10T05:16:04Z","timestamp":1773119764775,"version":"3.50.1"},"reference-count":91,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2024,3,18]],"date-time":"2024-03-18T00:00:00Z","timestamp":1710720000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,3,18]],"date-time":"2024-03-18T00:00:00Z","timestamp":1710720000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2024,9]]},"DOI":"10.1007\/s11263-024-02036-4","type":"journal-article","created":{"date-parts":[[2024,3,18]],"date-time":"2024-03-18T12:02:05Z","timestamp":1710763325000},"page":"3375-3407","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":12,"title":["Vision-Language Alignment Learning Under Affinity and Divergence Principles for Few-Shot Out-of-Distribution Generalization"],"prefix":"10.1007","volume":"132","author":[{"given":"Lin","family":"Zhu","sequence":"first","affiliation":[]},{"given":"Weihan","family":"Yin","sequence":"additional","affiliation":[]},{"given":"Yiyao","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Fan","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Zhaoyu","family":"Zeng","sequence":"additional","affiliation":[]},{"given":"Qinying","family":"Gu","sequence":"additional","affiliation":[]},{"given":"Xinbing","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Chenghu","family":"Zhou","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3129-3953","authenticated-orcid":false,"given":"Nanyang","family":"Ye","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,3,18]]},"reference":[{"key":"2036_CR1","unstructured":"Adebayo, J., Gilmer, J., Muelly, M., Goodfellow, I., Hardt, M., & Kim, B. (2018). Sanity checks for saliency maps. arXiv:1810.03292v3"},{"key":"2036_CR2","unstructured":"Ahuja, K., Shanmugam, K., Varshney, K., & Dhurandhar, A. (2020). Invariant risk minimization games. In International Conference on Machine Learning, pp. 145\u2013155. PMLR."},{"key":"2036_CR3","doi-asserted-by":"crossref","unstructured":"Akuzawa, K., Iwasawa, Y., & Matsuo, Y. (2019). Adversarial invariant feature learning with accuracy constraint for domain generalization. In Joint European Conference on Machine Learning and Knowledge Discovery in Databases, pp. 315\u2013331. Springer.","DOI":"10.1007\/978-3-030-46147-8_19"},{"key":"2036_CR4","unstructured":"Arjovsky, M., Bottou, L., Gulrajani, I., & Lopez-Paz, D. (2019). Invariant risk minimization. arXiv:1907.02893."},{"key":"2036_CR5","first-page":"8265","volume":"35","author":"D Arpit","year":"2022","unstructured":"Arpit, D., Wang, H., Zhou, Y., & Xiong, C. (2022). Ensemble of averages: Improving model selection and boosting performance in domain generalization. Advances in Neural Information Processing Systems, 35, 8265\u20138277.","journal-title":"Advances in Neural Information Processing Systems"},{"issue":"61","key":"2036_CR6","first-page":"1803","volume":"11","author":"D Baehrens","year":"2010","unstructured":"Baehrens, D., Schroeter, T., Harmeling, S., Kawanabe, M., Hansen, K., & M\u00fcller, K.-R. (2010). How to explain individual classification decisions. Journal of Machine Learning Research, 11(61), 1803\u20131831.","journal-title":"Journal of Machine Learning Research"},{"key":"2036_CR7","unstructured":"Bahng, H., Chun, S., Yun, S., Choo, J., & Oh, S. J. (2020). Learning de-biased representations with biased representations. In: International Conference on Machine Learning, pp. 528\u2013539. PMLR."},{"key":"2036_CR8","doi-asserted-by":"publisher","first-page":"6705","DOI":"10.1609\/aaai.v35i8.16829","volume":"35","author":"H Bai","year":"2021","unstructured":"Bai, H., Sun, R., Hong, L., Zhou, F., Ye, N., Ye, H.-J., Chan, S.-H.G., & Li, Z. (2021). Decaug: Out-of-distribution generalization via decomposed feature representation and semantic augmentation. In Proceedings of the AAAI Conference on Artificial Intelligence, 35, 6705\u20136713.","journal-title":"In Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"2036_CR9","unstructured":"Barbu, A., Mayo, D., Alverio, J., Luo, W., Wang, C., Gutfreund, D., Tenenbaum, J., & Katz, B. (2019). Objectnet: A large-scale bias-controlled dataset for pushing the limits of object recognition models. In NeurIPS."},{"key":"2036_CR10","unstructured":"Beery, S., Agarwal, A., Cole, E., & Birodkar, V. (2021). The iwildcam 2021 competition dataset. arXiv:2105.03494."},{"issue":"1","key":"2036_CR11","first-page":"46","volume":"22","author":"G Blanchard","year":"2021","unstructured":"Blanchard, G., Deshmukh, A. A., Dogan, \u00dc., Lee, G., & Scott, C. (2021). Domain generalization by marginal transfer learning. The Journal of Machine Learning Research, 22(1), 46\u2013100.","journal-title":"The Journal of Machine Learning Research"},{"key":"2036_CR12","unstructured":"Chen, Z., Duan, Y., Wang, W., He, J., Lu, T., Dai, J., & Qiao, Y. (2022). Vision transformer adapter for dense predictions. arXiv:2205.08534."},{"key":"2036_CR13","unstructured":"Chen, T., Kornblith, S., Norouzi, M., & Hinton, G. (2020). A simple framework for contrastive learning of visual representations. In International Conference on Machine Learning, pp. 1597\u20131607. PMLR."},{"key":"2036_CR14","unstructured":"Chen, H., Tao, R., Zhang, H., Wang, Y., Ye, W., Wang, J., Hu, G., & Savvides, M. (2022). Conv-adapter: Exploring parameter efficient transfer learning for convnets. arXiv:2208.07463."},{"key":"2036_CR15","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.-J., Li, K., & Fei-Fei, L. (2009). Imagenet: A large-scale hierarchical image database. In 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"2036_CR16","unstructured":"Donahue, J., Jia, Y., Vinyals, O., Hoffman, J., Zhang, N., Tzeng, E., & Darrell, T. (2014) Decaf: A deep convolutional activation feature for generic visual recognition. In: Xing, E. P., Jebara, T. (eds.) Proceedings of the 31st International Conference on Machine Learning. Proceedings of Machine Learning Research, vol. 32, pp. 647\u2013655. PMLR"},{"key":"2036_CR17","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X., Unterthiner, T., Dehghani, M., Minderer, M., Heigold, G., & Gelly, S., et\u00a0al. (2020). An image is worth 16x16 words: Transformers for image recognition at scale. arXiv:2010.11929"},{"key":"2036_CR18","unstructured":"Dou, Q., Coelho\u00a0de Castro, D., Kamnitsas, K., & Glocker, B. (2019). Domain generalization via model-agnostic learning of semantic features. arXiv:1910.13580v1"},{"key":"2036_CR19","doi-asserted-by":"crossref","unstructured":"Du, Y., Xu, J., Xiong, H., Qiu, Q., Zhen, X., Snoek, C. G., & Shao, L. (2020). Learning to learn with variational information bottleneck for domain generalization. In Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part X 16, pp. 200\u2013216. Springer.","DOI":"10.1007\/978-3-030-58607-2_12"},{"key":"2036_CR20","unstructured":"Du, Y., Zhen, X., Shao, L., & Snoek, C. G. (2021). Metanorm: Learning to normalize few-shot batches across domains. In International Conference on Learning Representations."},{"key":"2036_CR21","doi-asserted-by":"crossref","unstructured":"Fan, Z., Ma, Y., Li, Z., & Sun, J. (2021). Generalized few-shot object detection without forgetting. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4527\u20134536.","DOI":"10.1109\/CVPR46437.2021.00450"},{"key":"2036_CR22","unstructured":"Finn, C., Abbeel, P., & Levine, S. (2017). Model-agnostic meta-learning for fast adaptation of deep networks. In International Conference on Machine Learning, pp. 1126\u20131135. PMLR."},{"key":"2036_CR23","doi-asserted-by":"crossref","unstructured":"Gao, T., Fisch, A., & Chen, D. (2020). Making pre-trained language models better few-shot learners. arXiv:2012.15723.","DOI":"10.18653\/v1\/2021.acl-long.295"},{"key":"2036_CR24","unstructured":"Gao, P., Geng, S., Zhang, R., Ma, T., Fang, R., Zhang, Y., Li, H., & Qiao, Y. (2021). Clip-adapter: Better vision-language models with feature adapters. arXiv:2110.04544."},{"key":"2036_CR25","doi-asserted-by":"crossref","unstructured":"Goyal, S., Kumar, A., Garg, S., Kolter, Z., & Raghunathan, A. (2023). Finetune like you pretrain: Improved finetuning of zero-shot vision models. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 19338\u201319347.","DOI":"10.1109\/CVPR52729.2023.01853"},{"key":"2036_CR26","unstructured":"Gulrajani, I., & Lopez-Paz, D. (2020). In search of lost domain generalization. arXiv:2007.01434."},{"key":"2036_CR27","unstructured":"Hao, T., Chen, H., Guo, Y., & Ding, G. (2023). Consolidator: Mergable adapter with group connections for vision transformer. In International Conference on Learning Representations."},{"key":"2036_CR28","doi-asserted-by":"crossref","unstructured":"Hendrycks, D., Basart, S., Mu, N., Kadavath, S., Wang, F., Dorundo, E., Desai, R., Zhu, T., Parajuli, S., & Guo, M., et\u00a0al. (2021). The many faces of robustness: A critical analysis of out-of-distribution generalization. In Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 8340\u20138349.","DOI":"10.1109\/ICCV48922.2021.00823"},{"key":"2036_CR29","doi-asserted-by":"crossref","unstructured":"Hendrycks, D., Zhao, K., Basart, S., Steinhardt, J., & Song, D. (2021). Natural adversarial examples. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 15262\u201315271.","DOI":"10.1109\/CVPR46437.2021.01501"},{"key":"2036_CR30","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2020.107383","volume":"110","author":"Y He","year":"2021","unstructured":"He, Y., Shen, Z., & Cui, P. (2021). Towards non-iid image classification: A dataset and baselines. Pattern Recognition, 110, 107383.","journal-title":"Pattern Recognition"},{"key":"2036_CR31","unstructured":"Houlsby, N., Giurgiu, A., Jastrzebski, S., Morrone, B., De\u00a0Laroussilhe, Q., Gesmundo, A., Attariyan, M., & Gelly, S. (2019). Parameter-efficient transfer learning for nlp. In International Conference on Machine Learning, pp. 2790\u20132799. PMLR."},{"key":"2036_CR32","doi-asserted-by":"crossref","unstructured":"Huang, L., Niu, G., Liu, J., Xiao, X., & Wu, H. (2022). Du-vlg: Unifying vision-and-language generation via dual sequence-to-sequence pre-training. arXiv:2203.09052.","DOI":"10.18653\/v1\/2022.findings-acl.201"},{"key":"2036_CR33","doi-asserted-by":"crossref","unstructured":"Huang, Z., Wang, H., Huang, D., Lee, Y. J., & Xing, E. P. (2022). The two dimensions of worst-case training and their integrated effect for out-of-domain generalization. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9631\u20139641.","DOI":"10.1109\/CVPR52688.2022.00941"},{"key":"2036_CR34","doi-asserted-by":"crossref","unstructured":"Huang, Z., Wang, H., Xing, E.P., & Huang, D. (2020). Self-challenging improves cross-domain generalization. arXiv:2007.02454.","DOI":"10.1007\/978-3-030-58536-5_8"},{"key":"2036_CR35","doi-asserted-by":"crossref","unstructured":"Immer, A., Hennigen, L.T., Fortuin, V., & Cotterell, R. (2021). Probing as quantifying inductive bias. arXiv:2110.08388.","DOI":"10.18653\/v1\/2022.acl-long.129"},{"key":"2036_CR36","doi-asserted-by":"crossref","unstructured":"Jain, A., Guo, M., Srinivasan, K., Chen, T., Kudugunta, S., Jia, C., Yang, Y., & Baldridge, J. (2021). Mural: Multimodal, multitask retrieval across languages. arXiv:2109.05125.","DOI":"10.18653\/v1\/2021.findings-emnlp.293"},{"key":"2036_CR37","doi-asserted-by":"crossref","unstructured":"Jia, M., Tang, L., Chen, B.-C., Cardie, C., Belongie, S., Hariharan, B., & Lim, S.-N. (2022). Visual prompt tuning. In Computer Vision\u2013ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proceedings, Part XXXIII, pp. 709\u2013727. Springer.","DOI":"10.1007\/978-3-031-19827-4_41"},{"key":"2036_CR38","unstructured":"Jia, C., Yang, Y., Xia, Y., Chen, Y.-T., Parekh, Z., Pham, H., Le, Q., Sung, Y.-H., Li, Z., & Duerig, T. (2021). Scaling up visual and vision-language representation learning with noisy text supervision. In International Conference on Machine Learning, pp. 4904\u20134916. PMLR."},{"issue":"1","key":"2036_CR39","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1007\/s11263-023-01858-y","volume":"132","author":"J Jiang","year":"2023","unstructured":"Jiang, J., Liu, Z., & Zheng, N. (2023). Correlation information bottleneck: Towards adapting pretrained multimodal models for robust visual question answering. International Journal of Computer Vision, 132(1), 185\u2013207.","journal-title":"International Journal of Computer Vision"},{"key":"2036_CR40","doi-asserted-by":"crossref","unstructured":"Khandelwal, P., & Yushkevich, P. (2020). Domain generalizer: A few-shot meta learning framework for domain generalization in medical imaging. In Domain Adaptation and Representation Transfer, and Distributed and Collaborative Learning: Second MICCAI Workshop, DART 2020, and First MICCAI Workshop, DCL 2020, Held in Conjunction with MICCAI 2020, Lima, Peru, October 4\u20138, 2020, Proceedings 2, pp. 73\u201384. Springer.","DOI":"10.1007\/978-3-030-60548-3_8"},{"key":"2036_CR41","unstructured":"Kirichenko, P., Izmailov, P., & Wilson, A. G. (2022). Last layer re-training is sufficient for robustness to spurious correlations. arXiv:2204.02937."},{"key":"2036_CR42","unstructured":"Koh, P.W., Sagawa, S., Marklund, H., Xie, S.M., Zhang, M., Balsubramani, A., Hu, W., Yasunaga, M., Phillips, R.L., & Gao, I. (2021). Wilds: A benchmark of in-the-wild distribution shifts. In International conference on machine learning, pp. 5637\u20135664"},{"issue":"6","key":"2036_CR43","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky, A., Sutskever, I., & Hinton, G. E. (2017). Imagenet classification with deep convolutional neural networks. Communications of the ACM, 60(6), 84\u201390.","journal-title":"Communications of the ACM"},{"key":"2036_CR44","unstructured":"Krueger, D., Caballero, E., Jacobsen, J.-H., Zhang, A., Binas, J., Zhang, D., Le\u00a0Priol, R., & Courville, A. (2021). Out-of-distribution generalization via risk extrapolation (rex). In International Conference on Machine Learning, pp. 5815\u20135826. PMLR."},{"key":"2036_CR45","unstructured":"Kumar, A., Raghunathan, A., Jones, R., Ma, T., & Liang, P. (2022). Fine-tuning can distort pretrained features and underperform out-of-distribution. arXiv:2202.10054."},{"key":"2036_CR46","unstructured":"Lee, Y., Chen, A. S., Tajwar, F., Kumar, A., Yao, H., Liang, P., & Finn, C. (2022). Surgical fine-tuning improves adaptation to distribution shifts. arXiv:2210.11466."},{"key":"2036_CR47","unstructured":"Li, Y., Liang, F., Zhao, L., Cui, Y., Ouyang, W., Shao, J., Yu, F., & Yan, J. (2021). Supervision exists everywhere: A data efficient contrastive language-image pre-training paradigm. In International Conference on Learning Representations."},{"key":"2036_CR48","doi-asserted-by":"crossref","unstructured":"Li, D., Yang, Y., Song, Y.-Z., & Hospedales, T. M. (2017). Deeper, broader and artier domain generalization. In Proceedings of the IEEE International Conference on Computer Vision, pp. 5542\u20135550.","DOI":"10.1109\/ICCV.2017.591"},{"key":"2036_CR49","doi-asserted-by":"crossref","unstructured":"Li, D., Yang, Y., Song, Y.-Z., & Hospedales, T. (2018). Learning to generalize: Meta-learning for domain generalization. In Proceedings of the AAAI Conference on Artificial Intelligence, vol. 32.","DOI":"10.1609\/aaai.v32i1.11596"},{"key":"2036_CR50","doi-asserted-by":"crossref","unstructured":"Li, X., Yin, X., Li, C., Zhang, P., Hu, X., Zhang, L., Wang, L., Hu, H., Dong, L., & Wei, F., et\u00a0al. (2020). Oscar: Object-semantics aligned pre-training for vision-language tasks. In European Conference on Computer Vision, pp. 121\u2013137. Springer.","DOI":"10.1007\/978-3-030-58577-8_8"},{"key":"2036_CR51","doi-asserted-by":"crossref","unstructured":"Lin, Y., Dong, H., Wang, H., & Zhang, T. (2022). Bayesian invariant risk minimization. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16021\u201316030.","DOI":"10.1109\/CVPR52688.2022.01555"},{"key":"2036_CR52","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., Hu, H., Wei, Y., Zhang, Z., Lin, S., & Guo, B. (2021). Swin transformer: Hierarchical vision transformer using shifted windows. In Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 10012\u201310022.","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"2036_CR53","unstructured":"Lu, C., Wu, Y., Hern\u00e1ndez-Lobato, J. M., & Sch\u00f6lkopf, B. (2021). Invariant causal representation learning for out-of-distribution generalization. In International Conference on Learning Representations."},{"key":"2036_CR54","doi-asserted-by":"crossref","unstructured":"Mancini, M., Akata, Z., Ricci, E., & Caputo, B. (2020). Towards recognizing unseen categories in unseen domains. In European Conference on Computer Vision, pp. 466\u2013483. Springer.","DOI":"10.1007\/978-3-030-58592-1_28"},{"key":"2036_CR55","doi-asserted-by":"publisher","first-page":"10051","DOI":"10.1609\/aaai.v36i9.21244","volume":"36","author":"Y Ming","year":"2022","unstructured":"Ming, Y., Yin, H., & Li, Y. (2022). On the impact of spurious correlation for out-of-distribution detection. In Proceedings of the AAAI Conference on Artificial Intelligence, 36, 10051\u201310059.","journal-title":"In Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"2036_CR56","unstructured":"Muandet, K., Balduzzi, D., & Sch\u00f6lkopf, B. (2013). Domain generalization via invariant feature representation. In International Conference on Machine Learning, pp. 10\u201318. PMLR."},{"key":"2036_CR57","unstructured":"Nakamura, A., & Harada, T. (2019). Revisiting fine-tuning for few-shot learning. arXiv:1910.00216."},{"key":"2036_CR58","unstructured":"Nichol, A., Achiam, J., & Schulman, J. (2018). On first-order meta-learning algorithms. arXiv:1803.02999."},{"key":"2036_CR59","unstructured":"Pantazis, O., Brostow, G., Jones, K., & Mac\u00a0Aodha, O. (2022) Svl-adapter: Self-supervised adapter for vision-language pretrained models. arXiv:2210.03794."},{"key":"2036_CR60","unstructured":"Peng, D., & Pan, S. J. (2022). Learning gradient-based mixup towards flatter minima for domain generalization. arXiv:2209.14742."},{"key":"2036_CR61","unstructured":"Radford, A., Kim, J. W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., & Clark, J., et\u00a0al. (2021). Learning transferable visual models from natural language supervision. In International Conference on Machine Learning, pp. 8748\u20138763. PMLR."},{"key":"2036_CR62","unstructured":"Radford, A., Kim, J. W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., & Clark, J., et\u00a0al. (2021). Learning transferable visual models from natural language supervision. In International Conference on Machine Learning, pp. 8748\u20138763. PMLR."},{"key":"2036_CR63","unstructured":"Rame, A., Dancette, C., & Cord, M. (2022). Fishr: Invariant gradient variances for out-of-distribution generalization. In International Conference on Machine Learning, pp. 18347\u201318377. PMLR."},{"key":"2036_CR64","unstructured":"Recht, B., Roelofs, R., Schmidt, L., & Shankar, V. (2019). Do imagenet classifiers generalize to imagenet? In International Conference on Machine Learning, pp. 5389\u20135400. PMLR."},{"issue":"1","key":"2036_CR65","first-page":"1309","volume":"19","author":"M Rojas-Carulla","year":"2018","unstructured":"Rojas-Carulla, M., Sch\u00f6lkopf, B., Turner, R., & Peters, J. (2018). Invariant models for causal transfer learning. The Journal of Machine Learning Research, 19(1), 1309\u20131342.","journal-title":"The Journal of Machine Learning Research"},{"key":"2036_CR66","doi-asserted-by":"crossref","unstructured":"Sato, T., Shen, J., Wang, N., Jia, Y.J., Lin, X., & Chen, Q. A. (2020). Security of deep learning based lane keeping system under physical-world adversarial attack. arXiv:2003.01782.","DOI":"10.14722\/autosec.2021.23026"},{"key":"2036_CR67","doi-asserted-by":"publisher","first-page":"5692","DOI":"10.1609\/aaai.v34i04.6024","volume":"34","author":"Z Shen","year":"2020","unstructured":"Shen, Z., Cui, P., Zhang, T., & Kunag, K. (2020). Stable learning via sample reweighting. In Proceedings of the AAAI Conference on Artificial Intelligence, 34, 5692\u20135699.","journal-title":"In Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"2036_CR68","unstructured":"Simonyan, K., & Zisserman, A. (2014). Very deep convolutional networks for large-scale image recognition. arXiv:1409.1556."},{"key":"2036_CR69","unstructured":"Simonyan, K., Vedaldi, A., & Zisserman, A. (2013). Deep inside convolutional networks: Visualising image classification models and saliency maps. arXiv:1312.6034."},{"key":"2036_CR70","first-page":"24791","volume":"34","author":"P Stojanov","year":"2021","unstructured":"Stojanov, P., Li, Z., Gong, M., Cai, R., Carbonell, J., & Zhang, K. (2021). Domain adaptation with invariant representation learning: What transformations to learn? Advances in Neural Information Processing Systems, 34, 24791\u201324803.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2036_CR71","doi-asserted-by":"crossref","unstructured":"Sung, Y.-L., Cho, J., & Bansal, M. (2022). Vl-adapter: Parameter-efficient transfer learning for vision-and-language tasks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5227\u20135237.","DOI":"10.1109\/CVPR52688.2022.00516"},{"key":"2036_CR72","doi-asserted-by":"crossref","unstructured":"Torralba, A. (2011). Eaa: Unbiased look at dataset bias. In IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1521\u20131528.","DOI":"10.1109\/CVPR.2011.5995347"},{"key":"2036_CR73","unstructured":"Tseng, H.-Y., Lee, H.-Y., Huang, J.-B., & Yang, M.-H. (2020). Cross-domain few-shot classification via learned feature-wise transformation. arXiv:2001.08735."},{"key":"2036_CR74","unstructured":"Wang, H., Ge, S., Lipton, Z., & Xing, E. P. (2019). Learning robust global representations by penalizing local predictive power. arXiv:1905.13549v2"},{"issue":"8","key":"2036_CR75","first-page":"8052","volume":"35","author":"J Wang","year":"2022","unstructured":"Wang, J., Lan, C., Liu, C., Ouyang, Y., Qin, T., Lu, W., Chen, Y., Zeng, W., & Yu, P. (2022). Generalizing to unseen domains: A survey on domain generalization. IEEE Transactions on Knowledge and Data Engineering, 35(8), 8052\u20138072.","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"key":"2036_CR76","unstructured":"Weber, M.G., Li, L., Wang, B., Zhao, Z., Li, B., & Zhang, C. (2022). Certifying out-of-domain generalization for blackbox functions. In Conference on Machine Learning, pp. 23527\u201323548. PMLR."},{"key":"2036_CR77","unstructured":"Wortsman, M., Gururangan, S., Li, S., Farhadi, A., Schmidt, L., Rabbat, M., & Morcos, A. S. (2022). Lo-fi: distributed fine-tuning without communication. arXiv:2210.11948"},{"key":"2036_CR78","unstructured":"Wortsman, M., Ilharco, G., Gadre, S. Y., Roelofs, R., Gontijo-Lopes, R., Morcos, A. S., Namkoong, H., Farhadi, A., Carmon, Y., & Kornblith, S., et\u00a0al. (2022). Model soups: Averaging weights of multiple fine-tuned models improves accuracy without increasing inference time. In International Conference on Machine Learning, pp. 23965\u201323998. PMLR."},{"key":"2036_CR79","doi-asserted-by":"crossref","unstructured":"Wortsman, M., Ilharco, G., Kim, J. W., Li, M., Kornblith, S., Roelofs, R., Lopes, R. G., Hajishirzi, H., Farhadi, A., & Namkoong, H., et\u00a0al. (2022). Robust fine-tuning of zero-shot models. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7959\u20137971.","DOI":"10.1109\/CVPR52688.2022.00780"},{"key":"2036_CR80","doi-asserted-by":"crossref","unstructured":"Wu, C.-E., Tian, Y., Yu, H., Wang, H., Morgado, P., Hu, Y. H., & Yang, L. (2023). Why is prompt tuning for vision-language models robust to noisy labels? In Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 15488\u201315497.","DOI":"10.1109\/ICCV51070.2023.01420"},{"key":"2036_CR81","first-page":"33041","volume":"35","author":"J Wu","year":"2022","unstructured":"Wu, J., Zou, D., Braverman, V., Gu, Q., & Kakade, S. (2022). The power and limitation of pretraining-finetuning for linear regression under covariate shift. Advances in Neural Information Processing Systems, 35, 33041\u201333053.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2036_CR82","unstructured":"Xing, Y., Wu, Q., Cheng, D., Zhang, S., Liang, G., & Zhang, Y. (2022). Class-aware visual prompt tuning for vision-language pre-trained model. arXiv:2208.08340."},{"key":"2036_CR83","unstructured":"Ye, N., Li, K., Hong, L., Bai, H., Chen, Y., Zhou, F., & Li, Z. (2021). Ood-bench: Benchmarking and understanding out-of-distribution generalization datasets and algorithms. arXiv:2106.03721 1(3), 5."},{"key":"2036_CR84","unstructured":"You, K., Liu, Y., Wang, J., & Long, M. (2021). Logme: Practical assessment of pre-trained models for transfer learning. In International Conference on Machine Learning, pp. 12133\u201312143. PMLR."},{"key":"2036_CR85","unstructured":"Zhang, R., Fang, R., Gao, P., Zhang, W., Li, K., Dai, J., Qiao, Y., & Li, H. (2021). Tip-adapter: Training-free clip-adapter for better vision-language modeling. arXiv:2111.03930."},{"key":"2036_CR86","unstructured":"Zhang, X., Iwasawa, Y., Matsuo, Y., & Gu, S. S. (2021). Amortized prompt: Guide clip to domain transfer learning. arXiv:2111.12853."},{"key":"2036_CR87","doi-asserted-by":"crossref","unstructured":"Zhang, P., Li, X., Hu, X., Yang, J., Zhang, L., Wang, L., Choi, Y., & Gao, J. (2021). Vinvl: Revisiting visual representations in vision-language models. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5579\u20135588.","DOI":"10.1109\/CVPR46437.2021.00553"},{"issue":"1","key":"2036_CR88","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1214\/aos\/1079120130","volume":"32","author":"T Zhang","year":"2004","unstructured":"Zhang, T. (2004). Statistical behavior and consistency of classification methods based on convex risk minimization. The Annals of Statistics, 32(1), 56\u201385.","journal-title":"The Annals of Statistics"},{"key":"2036_CR89","first-page":"10957","volume":"34","author":"G Zhang","year":"2021","unstructured":"Zhang, G., Zhao, H., Yu, Y., & Poupart, P. (2021). Quantifying and improving transferability in domain generalization. Advances in Neural Information Processing Systems, 34, 10957\u201310970.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2036_CR90","unstructured":"Zhou, K., Yang, J., Loy, C. C., & Liu, Z. (2021). Learning to prompt for vision-language models. arXiv:2109.01134."},{"key":"2036_CR91","doi-asserted-by":"crossref","unstructured":"Zhou, K., Yang, J., Loy, C.C., & Liu, Z. (2022). Conditional prompt learning for vision-language models. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR).","DOI":"10.1109\/CVPR52688.2022.01631"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-024-02036-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-024-02036-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-024-02036-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,27]],"date-time":"2024-08-27T07:21:37Z","timestamp":1724743297000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-024-02036-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,18]]},"references-count":91,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2024,9]]}},"alternative-id":["2036"],"URL":"https:\/\/doi.org\/10.1007\/s11263-024-02036-4","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,3,18]]},"assertion":[{"value":"4 April 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 February 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 March 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}