{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T15:21:34Z","timestamp":1778080894251,"version":"3.51.4"},"reference-count":64,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2025,6,15]],"date-time":"2025-06-15T00:00:00Z","timestamp":1749945600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,6,15]],"date-time":"2025-06-15T00:00:00Z","timestamp":1749945600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100004826","name":"Natural Science Foundation of Beijing Municipality","doi-asserted-by":"publisher","award":["No. L247029"],"award-info":[{"award-number":["No. L247029"]}],"id":[{"id":"10.13039\/501100004826","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["No. 62371009"],"award-info":[{"award-number":["No. 62371009"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2025,9]]},"DOI":"10.1007\/s11263-025-02497-1","type":"journal-article","created":{"date-parts":[[2025,6,15]],"date-time":"2025-06-15T13:27:24Z","timestamp":1749994044000},"page":"6513-6534","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Multi-modal Prompt Alignment with Fine-grained LLM Knowledge for Unsupervised Domain Adaptation"],"prefix":"10.1007","volume":"133","author":[{"given":"Bowei","family":"Xing","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9785-0727","authenticated-orcid":false,"given":"Xianghua","family":"Ying","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ruibin","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ruohao","family":"Guo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,6,15]]},"reference":[{"key":"2497_CR1","doi-asserted-by":"crossref","unstructured":"Bai, S., Zhang, M., Zhou, W., Huang, S., Luan, Z., Wang, D., & Chen, B. (2024). Prompt-based distribution alignment for unsupervised domain adaptation. In: Proceedings of the AAAI Conference on Artificial Intelligence, pp 729\u2013737","DOI":"10.1609\/aaai.v38i2.27830"},{"key":"2497_CR2","unstructured":"Baktash, J.A., & Dawodi, M. (2023). Gpt-4: A review on advancements and opportunities in natural language processing. arXiv preprint arXiv:2305.03195"},{"key":"2497_CR3","unstructured":"Chen, G., Yao, W., Song, X., Li, X., Rao, Y., & Zhang, K. (2022). Plot: Prompt learning with optimal transport for vision-language models. In: The Eleventh International Conference on Learning Representations"},{"key":"2497_CR4","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X., Unterthiner, T., Dehghani, M., Minderer, M., Heigold, G., Gelly, S., et\u00a0al. (2021). An image is worth 16x16 words: Transformers for image recognition at scale. In: International Conference on Learning Representations"},{"key":"2497_CR5","doi-asserted-by":"crossref","unstructured":"Du, Y., Wei, F., Zhang, Z., Shi, M., Gao, Y., & Li, G. (2022). Learning to prompt for open-vocabulary object detection with vision-language model. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 14084\u201314093","DOI":"10.1109\/CVPR52688.2022.01369"},{"key":"2497_CR6","doi-asserted-by":"crossref","unstructured":"Du, Z., Li, X., Li, F., Lu, K., Zhu, L., & Li, J. (2024). Domain-agnostic mutual prompting for unsupervised domain adaptation. arXiv preprint arXiv:2403.02899","DOI":"10.1109\/CVPR52733.2024.02206"},{"key":"2497_CR7","unstructured":"Ganin, Y., & Lempitsky, V. (2015a). Unsupervised domain adaptation by backpropagation. In: International conference on machine learning, PMLR, pp 1180\u20131189"},{"key":"2497_CR8","unstructured":"Ganin, Y., & Lempitsky, V. (2015b). Unsupervised domain adaptation by backpropagation. In: International conference on machine learning, PMLR, pp 1180\u20131189"},{"issue":"59","key":"2497_CR9","first-page":"1","volume":"17","author":"Y Ganin","year":"2016","unstructured":"Ganin, Y., Ustinova, E., Ajakan, H., Germain, P., Larochelle, H., Laviolette, F., March, M., & Lempitsky, V. (2016). Domain-adversarial training of neural networks. Journal of machine learning research, 17(59), 1\u201335.","journal-title":"Journal of machine learning research"},{"issue":"2","key":"2497_CR10","doi-asserted-by":"publisher","first-page":"581","DOI":"10.1007\/s11263-023-01891-x","volume":"132","author":"P Gao","year":"2024","unstructured":"Gao, P., Geng, S., Zhang, R., Ma, T., Fang, R., Zhang, Y., Li, H., & Qiao, Y. (2024). Clip-adapter: Better vision-language models with feature adapters. International Journal of Computer Vision, 132(2), 581\u2013595.","journal-title":"International Journal of Computer Vision"},{"key":"2497_CR11","unstructured":"Ge, C., Huang, R., Xie, M., Lai, Z., Song, S., Li, S., & Huang, G. (2023). Domain adaptation via prompt learning. IEEE Transactions on Neural Networks and Learning Systems"},{"key":"2497_CR12","doi-asserted-by":"crossref","unstructured":"Gu, X., Yu, X., Yang, Y., Sun, J., & Xu, Z. (2024). Adversarial reweighting with $$\\alpha $$-power maximization for domain adaptation. International Journal of Computer Vision pp 1\u201324","DOI":"10.1007\/s11263-024-02107-6"},{"key":"2497_CR13","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"2497_CR14","doi-asserted-by":"crossref","unstructured":"Hu, L., Kan, M., Shan, S., & Chen, X. (2020). Unsupervised domain adaptation with hierarchical gradient synchronization. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 4043\u20134052","DOI":"10.1109\/CVPR42600.2020.00410"},{"key":"2497_CR15","unstructured":"Jia, C., Yang, Y., Xia, Y., Chen, Y.T., Parekh, Z., Pham, H., Le, Q., Sung, Y.H., Li, Z., & Duerig, T. (2021). Scaling up visual and vision-language representation learning with noisy text supervision. In: International conference on machine learning, PMLR, pp 4904\u20134916"},{"key":"2497_CR16","doi-asserted-by":"crossref","unstructured":"Jia, M., Tang, L., Chen, B.C., Cardie, C., Belongie, S., Hariharan, B., & Lim, S.N. (2022). Visual prompt tuning. In: European Conference on Computer Vision, Springer, pp 709\u2013727","DOI":"10.1007\/978-3-031-19827-4_41"},{"key":"2497_CR17","doi-asserted-by":"crossref","unstructured":"Kang, G., Jiang, L., Yang, Y., & Hauptmann, A.G. (2019a). Contrastive adaptation network for unsupervised domain adaptation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 4893\u20134902","DOI":"10.1109\/CVPR.2019.00503"},{"key":"2497_CR18","doi-asserted-by":"crossref","unstructured":"Kang, G., Jiang, L., Yang, Y., & Hauptmann, A.G. (2019b). Contrastive adaptation network for unsupervised domain adaptation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 4893\u20134902","DOI":"10.1109\/CVPR.2019.00503"},{"key":"2497_CR19","doi-asserted-by":"crossref","unstructured":"Khattak, M.U., Rasheed, H., Maaz, M., Khan, S., & Khan, F.S. (2023). Maple: Multi-modal prompt learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 19113\u201319122","DOI":"10.1109\/CVPR52729.2023.01832"},{"issue":"11","key":"2497_CR20","doi-asserted-by":"publisher","first-page":"2888","DOI":"10.1007\/s11263-023-01810-0","volume":"131","author":"V Kumar","year":"2023","unstructured":"Kumar, V., Patil, H., Lal, R., & Chakraborty, A. (2023). Improving domain adaptation through class aware frequency transformation. International Journal of Computer Vision, 131(11), 2888\u20132907.","journal-title":"International Journal of Computer Vision"},{"key":"2497_CR21","doi-asserted-by":"crossref","unstructured":"Lai, Z., Vesdapunt, N., Zhou, N., Wu, J., Huynh, C.P., Li, X., Fu, K.K., & Chuah, C.N. (2023). Padclip: Pseudo-labeling with adaptive debiasing in clip for unsupervised domain adaptation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 16155\u201316165","DOI":"10.1109\/ICCV51070.2023.01480"},{"issue":"11","key":"2497_CR22","doi-asserted-by":"publisher","first-page":"3918","DOI":"10.1109\/TPAMI.2020.2991050","volume":"43","author":"J Li","year":"2020","unstructured":"Li, J., Chen, E., Ding, Z., Zhu, L., Lu, K., & Shen, H. T. (2020). Maximum density divergence for domain adaptation. IEEE transactions on pattern analysis and machine intelligence, 43(11), 3918\u20133930.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2497_CR23","doi-asserted-by":"crossref","unstructured":"Liang, F., Wu, B., Dai, X., Li, K., Zhao, Y., Zhang, H., Zhang, P., Vajda, P., & Marculescu, D. (2023). Open-vocabulary semantic segmentation with mask-adapted clip. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 7061\u20137070","DOI":"10.1109\/CVPR52729.2023.00682"},{"key":"2497_CR24","unstructured":"Liang, J., Hu, D., & Feng, J. (2020). Do we really need to access the source data? source hypothesis transfer for unsupervised domain adaptation. In: Proceedings of the International Conference on Machine Learning, pp 6028\u20136039"},{"issue":"11","key":"2497_CR25","first-page":"8602","volume":"44","author":"J Liang","year":"2021","unstructured":"Liang, J., Hu, D., Wang, Y., He, R., & Feng, J. (2021). Source data-absent unsupervised domain adaptation through hypothesis transfer and labeling transfer. IEEE Transactions on Pattern Analysis and Machine Intelligence, 44(11), 8602\u20138617.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2497_CR26","first-page":"22968","volume":"34","author":"H Liu","year":"2021","unstructured":"Liu, H., Wang, J., & Long, M. (2021). Cycle self-training for domain adaptation. Advances in Neural Information Processing Systems, 34, 22968\u201322981.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2497_CR27","unstructured":"Long, M., Cao, Z., Wang, J., Jordan, M.I. (2018). Conditional adversarial domain adaptation. Advances in neural information processing systems 31"},{"key":"2497_CR28","doi-asserted-by":"crossref","unstructured":"Mei, K., Zhu, C., Zou, J., & Zhang, S. (2020). Instance adaptive self-training for unsupervised domain adaptation. In: European Conference on Computer Vision, Springer, pp 415\u2013430","DOI":"10.1007\/978-3-030-58574-7_25"},{"key":"2497_CR29","unstructured":"Menon, S., & Vondrick, C. (2023). Visual classification via description from large language models. In: International Conference on Learning Representations"},{"key":"2497_CR30","doi-asserted-by":"crossref","unstructured":"Minderer, M., Gritsenko, A., Stone, A., Neumann, M., Weissenborn, D., Dosovitskiy, A., Mahendran, A., Arnab, A., Dehghani, M., Shen, Z., et\u00a0al. (2022). Simple open-vocabulary object detection. In: European Conference on Computer Vision, pp 728\u2013755","DOI":"10.1007\/978-3-031-20080-9_42"},{"key":"2497_CR31","doi-asserted-by":"crossref","unstructured":"Naeem, M.F., Khan, M.G.Z.A., Xian, Y., Afzal, M.Z., Stricker, D., Van\u00a0Gool, L., & Tombari, F. (2023). I2mvformer: Large language model generated multi-view document supervision for zero-shot image classification. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 15169\u201315179","DOI":"10.1109\/CVPR52729.2023.01456"},{"key":"2497_CR32","doi-asserted-by":"crossref","unstructured":"Peng, X., Bai, Q., Xia, X., Huang, Z., Saenko, K., & Wang, B. (2019). Moment matching for multi-source domain adaptation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 1406\u20131415","DOI":"10.1109\/ICCV.2019.00149"},{"key":"2497_CR33","doi-asserted-by":"crossref","unstructured":"Pratt, S., Covert, I., Liu, R., & Farhadi, A. (2023). What does a platypus look like? generating customized prompts for zero-shot image classification. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 15691\u201315701","DOI":"10.1109\/ICCV51070.2023.01438"},{"key":"2497_CR34","unstructured":"Radford, A., Narasimhan, K., Salimans, T., Sutskever, I., et\u00a0al. (2018). Improving language understanding by generative pre-training"},{"key":"2497_CR35","unstructured":"Radford, A., Kim, J.W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., Clark, J., et\u00a0al. (2021). Learning transferable visual models from natural language supervision. In: International conference on machine learning, pp 8748\u20138763"},{"key":"2497_CR36","unstructured":"Rangwani, H., Aithal, S.K., Mishra, M., Jain, A., Radhakrishnan, V.B. (2022). A closer look at smoothness in domain adversarial training. In: International conference on machine learning, PMLR, pp 18378\u201318399"},{"key":"2497_CR37","doi-asserted-by":"crossref","unstructured":"Roth, K., Kim, J.M., Koepke, A., Vinyals, O., Schmid, C., & Akata, Z. (2023). Waffling around for performance: Visual classification with random words and broad concepts. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 15746\u201315757","DOI":"10.1109\/ICCV51070.2023.01443"},{"key":"2497_CR38","doi-asserted-by":"crossref","unstructured":"Saenko, K., Kulis, B., Fritz, M., & Darrell, T. (2010). Adapting visual category models to new domains. In: Proceedings of the European Conference on Computer Vision, pp 213\u2013226","DOI":"10.1007\/978-3-642-15561-1_16"},{"key":"2497_CR39","doi-asserted-by":"crossref","unstructured":"Saito, K., Watanabe, K., Ushiku, Y., & Harada, T. (2018). Maximum classifier discrepancy for unsupervised domain adaptation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 3723\u20133732","DOI":"10.1109\/CVPR.2018.00392"},{"key":"2497_CR40","unstructured":"Santurkar, S., Dubois, Y., Taori, R., Liang, P., & Hashimoto, T. (2022). Is a caption worth a thousand images? a controlled study for representation learning. arXiv preprint arXiv:2207.07635"},{"key":"2497_CR41","doi-asserted-by":"crossref","unstructured":"Singha, M., Pal, H., Jha, A., & Banerjee, B. (2023). Ad-clip: Adapting domains in prompt space using clip. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 4355\u20134364","DOI":"10.1109\/ICCVW60793.2023.00470"},{"key":"2497_CR42","first-page":"596","volume":"33","author":"K Sohn","year":"2020","unstructured":"Sohn, K., Berthelot, D., Carlini, N., Zhang, Z., Zhang, H., Raffel, C. A., Cubuk, E. D., Kurakin, A., & Li, C. L. (2020). Fixmatch: Simplifying semi-supervised learning with consistency and confidence. Advances in neural information processing systems, 33, 596\u2013608.","journal-title":"Advances in neural information processing systems"},{"key":"2497_CR43","doi-asserted-by":"crossref","unstructured":"Sun, B., & Saenko, K. (2016). Deep coral: Correlation alignment for deep domain adaptation. In: Computer Vision\u2013ECCV 2016 Workshops: Amsterdam, The Netherlands, October 8-10 and 15-16, 2016, Proceedings, Part III 14, Springer, pp 443\u2013450","DOI":"10.1007\/978-3-319-49409-8_35"},{"key":"2497_CR44","doi-asserted-by":"crossref","unstructured":"Sun, T., Lu, C., Zhang, T., & Ling, H. (2022). Safe self-refinement for transformer-based domain adaptation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 7191\u20137200","DOI":"10.1109\/CVPR52688.2022.00705"},{"key":"2497_CR45","doi-asserted-by":"crossref","unstructured":"Tang, H., Chen, K., & Jia, K. (2020a). Unsupervised domain adaptation via structurally regularized deep clustering. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 8725\u20138735","DOI":"10.1109\/CVPR42600.2020.00875"},{"key":"2497_CR46","doi-asserted-by":"crossref","unstructured":"Tang, H., Chen, K., & Jia, K. (2020b). Unsupervised domain adaptation via structurally regularized deep clustering. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 8725\u20138735","DOI":"10.1109\/CVPR42600.2020.00875"},{"issue":"3","key":"2497_CR47","doi-asserted-by":"publisher","first-page":"654","DOI":"10.1007\/s11263-023-01892-w","volume":"132","author":"S Tang","year":"2024","unstructured":"Tang, S., Chang, A., Zhang, F., Zhu, X., Ye, M., & Zhang, C. (2024). Source-free domain adaptation via target prediction distribution searching. International journal of computer vision, 132(3), 654\u2013672.","journal-title":"International journal of computer vision"},{"key":"2497_CR48","unstructured":"Touvron, H., Cord, M., Douze, M., Massa, F., Sablayrolles, A., & J\u00e9gou, H. (2021). Training data-efficient image transformers & distillation through attention. In: International conference on machine learning, PMLR, pp 10347\u201310357"},{"key":"2497_CR49","doi-asserted-by":"crossref","unstructured":"Tzeng, E., Hoffman, J., Saenko, K., & Darrell, T. (2017). Adversarial discriminative domain adaptation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 7167\u20137176","DOI":"10.1109\/CVPR.2017.316"},{"key":"2497_CR50","unstructured":"Tzeng, E., Hoffman, J., Zhang, N., Saenko, K., & Darrell, T. (2019). Deep domain confusion: Maximizing for domain invariance. arxiv 2014. arXiv preprint arXiv:1412.3474"},{"key":"2497_CR51","doi-asserted-by":"crossref","unstructured":"Venkateswara, H., Eusebio, J., Chakraborty, S., & Panchanathan, S. (2017). Deep hashing network for unsupervised domain adaptation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 5018\u20135027","DOI":"10.1109\/CVPR.2017.572"},{"key":"2497_CR52","doi-asserted-by":"crossref","unstructured":"Vu, T.H., Jain, H., Bucher, M., Cord, M., & P\u00e9rez, P. (2019). Advent: Adversarial entropy minimization for domain adaptation in semantic segmentation. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 2517\u20132526","DOI":"10.1109\/CVPR.2019.00262"},{"key":"2497_CR53","doi-asserted-by":"crossref","unstructured":"Wang, Q., & Breckon, T. (2020). Unsupervised domain adaptation via structured prediction based selective pseudo-labeling. In: Proceedings of the AAAI conference on artificial intelligence, pp 6243\u20136250","DOI":"10.1609\/aaai.v34i04.6091"},{"key":"2497_CR54","first-page":"13834","volume":"34","author":"G Wei","year":"2021","unstructured":"Wei, G., Lan, C., Zeng, W., Zhang, Z., & Chen, Z. (2021). Toalign: Task-oriented alignment for unsupervised domain adaptation. Advances in Neural Information Processing Systems, 34, 13834\u201313846.","journal-title":"Advances in Neural Information Processing Systems"},{"issue":"2","key":"2497_CR55","doi-asserted-by":"publisher","first-page":"392","DOI":"10.1007\/s11263-023-01876-w","volume":"132","author":"W Wu","year":"2024","unstructured":"Wu, W., Sun, Z., Song, Y., Wang, J., & Ouyang, W. (2024). Transferring vision-language models for visual recognition: A classifier perspective. International Journal of Computer Vision, 132(2), 392\u2013409.","journal-title":"International Journal of Computer Vision"},{"issue":"3","key":"2497_CR56","first-page":"3434","volume":"45","author":"H Xia","year":"2022","unstructured":"Xia, H., Jing, T., & Ding, Z. (2022). Maximum structural generation discrepancy for unsupervised domain adaptation. IEEE Transactions on Pattern Analysis and Machine Intelligence, 45(3), 3434\u20133445.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2497_CR57","unstructured":"Xu, T., Chen, W., Pichao, W., Wang, F., Li, H., & Jin, R. (2022). Cdtrans: Cross-domain transformer for unsupervised domain adaptation. In: International Conference on Learning Representations"},{"key":"2497_CR58","doi-asserted-by":"crossref","unstructured":"Yan, H., Ding, Y., Li, P., Wang, Q., Xu, Y., & Zuo, W. (2017). Mind the class weight bias: Weighted maximum mean discrepancy for unsupervised domain adaptation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2272\u20132281","DOI":"10.1109\/CVPR.2017.107"},{"key":"2497_CR59","doi-asserted-by":"crossref","unstructured":"Yang, J., Liu, J., Xu, N., & Huang, J. (2023a). Tvt: Transferable vision transformer for unsupervised domain adaptation. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp 520\u2013530","DOI":"10.1109\/WACV56688.2023.00059"},{"key":"2497_CR60","doi-asserted-by":"crossref","unstructured":"Yang, Y., Panagopoulou, A., Zhou, S., Jin, D., Callison-Burch, C., & Yatskar, M. (2023b). Language in a bottle: Language model guided concept bottlenecks for interpretable image classification. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 19187\u201319197","DOI":"10.1109\/CVPR52729.2023.01839"},{"key":"2497_CR61","unstructured":"Yao, L., Huang, R., Hou, L., Lu, G., Niu, M., Xu, H., Liang, X., Li, Z., Jiang, X., & Xu, C. (2021). Filip: Fine-grained interactive language-image pre-training. arXiv preprint arXiv:2111.07783"},{"key":"2497_CR62","unstructured":"Zhang, Y., Liu, T., Long, M., & Jordan, M. (2019). Bridging theory and algorithm for domain adaptation. In: Proceedings of the International Conference on Machine Learning, pp 7404\u20137413"},{"key":"2497_CR63","doi-asserted-by":"crossref","unstructured":"Zhou, K., Yang, J., Loy, C.C., & Liu, Z. (2022a). Conditional prompt learning for vision-language models. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 16816\u201316825","DOI":"10.1109\/CVPR52688.2022.01631"},{"issue":"9","key":"2497_CR64","doi-asserted-by":"publisher","first-page":"2337","DOI":"10.1007\/s11263-022-01653-1","volume":"130","author":"K Zhou","year":"2022","unstructured":"Zhou, K., Yang, J., Loy, C. C., & Liu, Z. (2022). Learning to prompt for vision-language models. International Journal of Computer Vision, 130(9), 2337\u20132348.","journal-title":"International Journal of Computer Vision"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02497-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02497-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02497-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T07:59:28Z","timestamp":1757404768000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02497-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,15]]},"references-count":64,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2025,9]]}},"alternative-id":["2497"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02497-1","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,6,15]]},"assertion":[{"value":"26 June 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 June 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 June 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}