{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T16:56:57Z","timestamp":1777654617571,"version":"3.51.4"},"reference-count":92,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2025,3,10]],"date-time":"2025-03-10T00:00:00Z","timestamp":1741564800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,3,10]],"date-time":"2025-03-10T00:00:00Z","timestamp":1741564800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key R&D Program of China","doi-asserted-by":"crossref","award":["2022YFC3301000"],"award-info":[{"award-number":["2022YFC3301000"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62172177"],"award-info":[{"award-number":["62172177"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2025,7]]},"DOI":"10.1007\/s11263-025-02394-7","type":"journal-article","created":{"date-parts":[[2025,3,10]],"date-time":"2025-03-10T12:33:32Z","timestamp":1741610012000},"page":"4504-4521","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":13,"title":["Semantics-Conditioned Generative Zero-Shot Learning via Feature Refinement"],"prefix":"10.1007","volume":"133","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9633-3392","authenticated-orcid":false,"given":"Shiming","family":"Chen","sequence":"first","affiliation":[]},{"given":"Ziming","family":"Hong","sequence":"additional","affiliation":[]},{"given":"Xinge","family":"You","sequence":"additional","affiliation":[]},{"given":"Ling","family":"Shao","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,3,10]]},"reference":[{"key":"2394_CR1","doi-asserted-by":"crossref","unstructured":"Akata, Z., Reed, S., Walter, D., Lee, H., & Schiele, B. (2015). Evaluation of output embeddings for fine-grained image classification. In: CVPR, pp 2927\u20132936","DOI":"10.1109\/CVPR.2015.7298911"},{"key":"2394_CR2","doi-asserted-by":"publisher","first-page":"1425","DOI":"10.1109\/TPAMI.2015.2487986","volume":"38","author":"Z Akata","year":"2016","unstructured":"Akata, Z., Perronnin, F., Harchaoui, Z., & Schmid, C. (2016). Label-embedding for image classification. IEEE Transactions on Pattern Analysis and Machine Intelligence, 38, 1425\u20131438.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2394_CR3","doi-asserted-by":"crossref","unstructured":"Arora, G., Verma, V., Mishra, A., & Rai, P. (2018). Generalized zero-shot learning via synthesized examples. In: CVPR, pp 4281\u20134289","DOI":"10.1109\/CVPR.2018.00450"},{"key":"2394_CR4","doi-asserted-by":"publisher","first-page":"115","DOI":"10.1037\/0033-295X.94.2.115","volume":"94","author":"I Biederman","year":"1987","unstructured":"Biederman, I. (1987). Recognition-by-components: A theory of human image understanding. Psychological review, 94, 115\u2013147.","journal-title":"Psychological review"},{"key":"2394_CR5","doi-asserted-by":"crossref","unstructured":"Bucher, M., Herbin, S., & Jurie, F. (2017). Generating visual representations for zero-shot classification. In: ICCV Workshop, pp 2666\u20132673","DOI":"10.1109\/ICCVW.2017.308"},{"key":"2394_CR6","unstructured":"\u00c7etin, S., Baran, O. B., & Cinbis, R. G. (2022) Closed-form sample probing for learning generative models in zero-shot learning. In: ICLR"},{"key":"2394_CR7","doi-asserted-by":"crossref","unstructured":"Chen, S., Hong, Z., Liu, Y., Xie, GS., Sun, B., Li, H., Peng, Q., Lu, K., & You, X. (2022a). Transzero: Attribute-guided transformer for zero-shot learning. In: AAAI","DOI":"10.1609\/aaai.v36i1.19909"},{"key":"2394_CR8","unstructured":"Chen, S., Hou, WQ., Hong, Z., Ding, X., Song, Y., You, X., Liu, T., & Zhang, K. (2023). Evolving semantic prototype improves generative zero-shot learning. In: ICML"},{"key":"2394_CR9","doi-asserted-by":"crossref","unstructured":"Chen, S., Hou, WQ., Khan, SH., & Khan, FS. (2024). Progressive semantic-guided vision transformer for zero-shot learning. In: CVPR","DOI":"10.1109\/CVPR52733.2024.02262"},{"key":"2394_CR10","doi-asserted-by":"crossref","unstructured":"Chen, X., Lan, X., Sun, FC., & Zheng, N. (2020). A boundary based out-of-distribution classifier for generalized zero-shot learning. In: ECCV","DOI":"10.1007\/978-3-030-58586-0_34"},{"key":"2394_CR11","doi-asserted-by":"crossref","unstructured":"Chen, S., Wang, W., Xia, B., Peng, Q., You, X., Zheng, F., & Shao, L. (2021a). Free: Feature refinement for generalized zero-shot learning. In: ICCV","DOI":"10.1109\/ICCV48922.2021.00019"},{"key":"2394_CR12","unstructured":"Chen, S., Xie, GS., Yang\u00a0Liu, Y., Peng, Q., Sun, B., Li, H., You, X., & Shao, L. (2021b), Hsva: Hierarchical semantic-visual adaptation for zero-shot learning. In: NeurIPS"},{"key":"2394_CR13","doi-asserted-by":"crossref","unstructured":"Chen, L., Zhang, H., Xiao, J., Liu, W., & Chang, S. (2018) Zero-shot visual recognition using semantics-preserving adversarial embedding networks. In: CVPR, pp 1043\u20131052","DOI":"10.1109\/CVPR.2018.00115"},{"issue":"11","key":"2394_CR14","first-page":"12844","volume":"45","author":"S Chen","year":"2022","unstructured":"Chen, S., Hong, Z., Hou, W., Xie, G. S., Song, Y., Zhao, J., & Shao, L. (2022). TransZero++: Cross attribute-guided transformer for zero-shot learning. IEEE Transactions on Pattern Analysis and Machine Intelligence, 45(11), 12844\u201312861.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2394_CR15","doi-asserted-by":"publisher","first-page":"4516","DOI":"10.1109\/TNNLS.2022.3155602","volume":"35","author":"S Chen","year":"2022","unstructured":"Chen, S., Hong, Z., Xie, G., Peng, Q., You, X., Ding, W., & Shao, L. (2022). Gndan: Graph navigated dual attention network for zero-shot learning. IEEE Transactions on Neural Networks and Learning Systems, 35, 4516\u20134529.","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"2394_CR16","doi-asserted-by":"crossref","unstructured":"Christensen, A., Mancini, M., Koepke, A. S., Winther, O., & Akata, Z. (2023). Image-free classifier injection for zero-shot classification. In: ICCV","DOI":"10.1109\/ICCV51070.2023.01748"},{"key":"2394_CR17","unstructured":"Cui, J., Li, Z., Yan, Y., Chen, B., & Yuan, L. (2023). Chatlaw: Open-source legal large language model with integrated external knowledge bases. arXiv preprint arXiv:2306.16092"},{"key":"2394_CR18","doi-asserted-by":"crossref","unstructured":"Ding, Z., & Liu, H. (2019) Marginalized latent semantic encoder for zero-shot learning. In: CVPR, pp 6184\u20136192","DOI":"10.1109\/CVPR.2019.00635"},{"key":"2394_CR19","unstructured":"Ding, M., Yang, Z., Hong, W., Zheng, W., Zhou, C., Yin, D., Lin, J., Zou, X., Shao, Z., Yang, H., & Tang, J. (2021). Cogview: Mastering text-to-image generation via transformers. In: NeurIPS"},{"key":"2394_CR20","doi-asserted-by":"crossref","unstructured":"Felix, R., Kumar, BV., Reid, I., Carneiro, G. (2018). Multi-modal cycle-consistent generalized zero-shot learning. In: ECCV","DOI":"10.1007\/978-3-030-01231-1_2"},{"key":"2394_CR21","unstructured":"Frome, A., Corrado, GS., Shlens, J., Bengio, S., Dean, J., Ranzato, M., Mikolov, T. (2013). Devise: A deep visual-semantic embedding model. In: NeurIPS"},{"key":"2394_CR22","unstructured":"Ge, Y., Ren, JJ., Wang, Y., Gallagher, A., Yang, M., Itti, L., Adam, H., Lakshminarayanan, B., Zhao, & J. (2022). Improving zero-shot generalization and robustness of multi-modal models. arXiv preprint arXiv: 2212.01758"},{"key":"2394_CR23","volume-title":"Caltech-256 object category dataset","author":"G Griffin","year":"2007","unstructured":"Griffin, G., Holub, A., & Perona, P. (2007). Caltech-256 object category dataset. California Institute of Technology."},{"key":"2394_CR24","unstructured":"Gu, X., Lin, TY., Kuo, W., Cui, Y. (2021). Open-vocabulary object detection via vision and language knowledge distillation. In: ICLR"},{"key":"2394_CR25","doi-asserted-by":"publisher","first-page":"2606","DOI":"10.1007\/s11263-022-01656-y","volume":"130","author":"Z Han","year":"2022","unstructured":"Han, Z., Fu, Z., Chen, S., & Yang, J. (2022). Semantic contrastive embedding for generalized zero-shot learning. International Journal of Computer Vision, 130, 2606\u20132622.","journal-title":"International Journal of Computer Vision"},{"key":"2394_CR26","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016) Deep residual learning for image recognition. In: CVPR, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"2394_CR27","unstructured":"Hendrycks, D., Lee, K., Mazeika, M. (2019). Using pre-training can improve model robustness and uncertainty. In: ICML"},{"key":"2394_CR28","unstructured":"Ho, J., Jain, A., & Abbeel, P. (2020) Denoising diffusion probabilistic models. In: NeurIPS"},{"key":"2394_CR29","unstructured":"Huynh, DT., & Elhamifar, E. (2020b). Compositional zero-shot learning via fine-grained dense feature composition. In: NeurIPS"},{"key":"2394_CR30","doi-asserted-by":"crossref","unstructured":"Huynh, D., & Elhamifar, E. (2020a). Fine-grained generalized zero-shot learning via dense attribute-based attention. In: CVPR, pp 4482\u20134492","DOI":"10.1109\/CVPR42600.2020.00454"},{"key":"2394_CR31","doi-asserted-by":"crossref","unstructured":"Keshari, R., Singh, R., & Vatsa, M. (2020). Generalized zero-shot learning via over-complete distribution. In: CVPR, pp 13297\u201313305","DOI":"10.1109\/CVPR42600.2020.01331"},{"key":"2394_CR32","doi-asserted-by":"crossref","unstructured":"Kim, S., Jo, D., Lee, D., & Kim, J. (2023), Magvlt: Masked generative vision-and-language transformer. In: CVPR, pp 23338\u201323348","DOI":"10.1109\/CVPR52729.2023.02235"},{"key":"2394_CR33","unstructured":"Kingma, D. P., & Ba, J. (2015) Adam: A method for stochastic optimization. In: ICLR"},{"key":"2394_CR34","unstructured":"Kingma, D. P., & Welling, M. (2014). Auto-encoding variational bayes. In: ICLR"},{"key":"2394_CR35","unstructured":"Kuo, W., Cui, Y., Gu, X., Piergiovanni, A. J., & Angelova, A. (2022) F-vlm: Open-vocabulary object detection upon frozen vision and language models. In: ICLR"},{"key":"2394_CR36","doi-asserted-by":"crossref","unstructured":"Lampert, C. H., Nickisch, H., & Harmeling, S. (2009) Learning to detect unseen object classes by between-class attribute transfer. In: CVPR, pp 951\u2013958","DOI":"10.1109\/CVPR.2009.5206594"},{"key":"2394_CR37","doi-asserted-by":"publisher","first-page":"453","DOI":"10.1109\/TPAMI.2013.140","volume":"36","author":"CH Lampert","year":"2014","unstructured":"Lampert, C. H., Nickisch, H., & Harmeling, S. (2014). Attribute-based classification for zero-shot visual object categorization. IEEE Transactions on Pattern Analysis and Machine Intelligence, 36, 453\u2013465.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2394_CR38","unstructured":"Larochelle, H., Erhan, D., & Bengio, Y. (2008) Zero-data learning of new tasks. In: AAAI, pp 646\u2013651"},{"key":"2394_CR39","unstructured":"Li, H., Chaudhari, P., Yang, H., Lam, M., Ravichandran, A., Bhotika, R., & Soatto, S. (2020) Rethinking the hyperparameters for fine-tuning. In: ICLR"},{"key":"2394_CR40","doi-asserted-by":"crossref","unstructured":"Li, J., Jing, M., Lu, K., Ding, Z., Zhu, L., & Huang, Z. (2019a). Leveraging the invariant side of generative zero-shot learning. In: CVPR, pp 7394\u20137403","DOI":"10.1109\/CVPR.2019.00758"},{"key":"2394_CR41","doi-asserted-by":"crossref","unstructured":"Li, K., Min, MR., & Fu, Y. (2019b). Rethinking zero-shot learning: A conditional visual classification perspective. In: ICCV, pp 3582\u20133591","DOI":"10.1109\/ICCV.2019.00368"},{"key":"2394_CR42","unstructured":"Li, Y., Swersky, K., & Zemel, R. S. (2015). Generative moment matching networks. In: ICML"},{"key":"2394_CR43","doi-asserted-by":"crossref","unstructured":"Li, X., Zhang, Y., Bian, S., Qu, Y., Xie, Y., Shi, Z., & Fan, J. (2023). Vs-boost: Boosting visual-semantic association for generalized zero-shot learning. In: IJCAI","DOI":"10.24963\/ijcai.2023\/123"},{"key":"2394_CR44","doi-asserted-by":"crossref","unstructured":"Liu, Y., Guo, J., Cai, D., & He, X. (2019a). Attribute attention for semantic disambiguation in zero-shot learning. In: ICCV, pp 6697\u20136706","DOI":"10.1109\/ICCV.2019.00680"},{"key":"2394_CR45","unstructured":"Liu, S., Long, M., Wang, J., & Jordan, M. I. (2018) Generalized zero-shot learning with deep calibration network. In: NeurIPS"},{"key":"2394_CR46","doi-asserted-by":"crossref","unstructured":"Liu, Y., Xie, D., Gao, Q., Han, J., Wang, S., & Gao, X. (2019b). Graph and autoencoder based feature extraction for zero-shot learning. In: IJCAI","DOI":"10.24963\/ijcai.2019\/421"},{"key":"2394_CR47","doi-asserted-by":"crossref","unstructured":"Liu, Y., Zhou, L., Bai, X., Huang, Y., Gu, L., Zhou, J., Harada, T. (2021). Goal-oriented gaze estimation for zero-shot learning. In: CVPR","DOI":"10.1109\/CVPR46437.2021.00379"},{"key":"2394_CR48","first-page":"2579","volume":"9","author":"LVD Maaten","year":"2008","unstructured":"Maaten, L. V. D., & Hinton, G. E. (2008). Visualizing data using t-SNE. Journal of Machine Learning Research, 9, 2579\u20132605.","journal-title":"Journal of Machine Learning Research"},{"key":"2394_CR49","doi-asserted-by":"crossref","unstructured":"Min, S., Yao, H., Xie, H., Wang, C., Zha, Z., & Zhang, Y. (2020), Domain-aware visual bias eliminating for generalized zero-shot learning. In: CVPR, pp 12661\u201312670","DOI":"10.1109\/CVPR42600.2020.01268"},{"key":"2394_CR50","doi-asserted-by":"crossref","unstructured":"Mishra, A., Reddy, M. K., Mittal, A., & Murthy, H. (2018). A generative model for zero shot learning using conditional variational autoencoders. In: CVPR Workshop, pp 2269\u20132277","DOI":"10.1109\/CVPRW.2018.00294"},{"key":"2394_CR51","unstructured":"Naeem, M. F., Xian, Y., Gool, L. V., & Tombari, F. (2022). I2dformer: Learning image to document attention for zero-shot image classification. In: NeurIPS"},{"key":"2394_CR52","doi-asserted-by":"crossref","unstructured":"Narayan, S., Gupta, A., Khan, F., Snoek, C. G. M., & Shao, L. (2020). Latent embedding feedback and discriminative features for zero-shot classification. In: ECCV","DOI":"10.1007\/978-3-030-58542-6_29"},{"key":"2394_CR53","unstructured":"Palatucci, M., Pomerleau, D., Hinton, G. E., Mitchell, T. M. (2009). Zero-shot learning with semantic output codes. In: NeurIPS, pp 1410\u20131418"},{"key":"2394_CR54","doi-asserted-by":"crossref","unstructured":"Patterson, G., & Hays, J. (2012). Sun attribute database: Discovering, annotating, and recognizing scene attributes. In: CVPR, pp 2751\u20132758","DOI":"10.1109\/CVPR.2012.6247998"},{"key":"2394_CR55","doi-asserted-by":"crossref","unstructured":"Paul, A., Krishnan, N. C., & Munjal, P. (2019) Semantically aligned bias reducing zero shot learning. In: CVPR, pp 7049\u20137058","DOI":"10.1109\/CVPR.2019.00722"},{"key":"2394_CR56","unstructured":"Peng, B., Galley, M., He, P., Cheng, H., Xie, Y., Hu, Y., Huang, Q., Lid\u00e9n, L., Yu, Z., Chen, W., & Gao, J. (2023) Check your facts and try again: Improving large language models with external knowledge and automated feedback. arXiv preprint arXiv:2302.12813"},{"key":"2394_CR57","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C. D. (2014). Glove: Global vectors for word representation. In: EMNLP","DOI":"10.3115\/v1\/D14-1162"},{"key":"2394_CR58","unstructured":"Qin, Z., Yi, H., Lao, Q., & Li, K. (2023). Medical image understanding with pretrained vision language models: A comprehensive study. In: ICLR"},{"key":"2394_CR59","unstructured":"Radford, A., Kim, J. W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., Clark, J., Krueger, G., & Sutskever, I. (2021). Learning transferable visual models from natural language supervision. In: ICML"},{"key":"2394_CR60","unstructured":"Raghu, M., Zhang, C., Kleinberg, J., & Bengio, S. (2019), Transfusion: Understanding transfer learning for medical imaging. In: NeurIPS"},{"key":"2394_CR61","doi-asserted-by":"crossref","unstructured":"Reed, S., Akata, Z., Lee, H., & Schiele, B. (2016). Learning deep representations of fine-grained visual descriptions. In: CVPR, pp 49\u201358","DOI":"10.1109\/CVPR.2016.13"},{"key":"2394_CR62","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., Krause, J., Satheesh, S., Ma, S., Huang, Z., Karpathy, A., Khosla, A., Bernstein, M. S., Berg, A., & Fei-Fei, L. (2015). Imagenet large scale visual recognition challenge. International Journal of Computer Vision, 115, 211\u2013252.","journal-title":"International Journal of Computer Vision"},{"key":"2394_CR63","doi-asserted-by":"crossref","unstructured":"Saharia, C., Chan, W., Saxena, S., Li, L., Whang, J., Denton, E. L., Ghasemipour, S. K. S., Ayan, B. K., Mahdavi, S. S., Lopes, R. G., Salimans, T., Ho, J., Fleet, D. J., & Norouzi, M. (2022). Photorealistic text-to-image diffusion models with deep language understanding. In: NeurIPS","DOI":"10.1145\/3528233.3530757"},{"key":"2394_CR64","doi-asserted-by":"crossref","unstructured":"Sariyildiz, M. B., & Cinbis, R. G. (2019). Gradient matching generative networks for zero-shot learning. In: CVPR, pp 2163\u20132173","DOI":"10.1109\/CVPR.2019.00227"},{"key":"2394_CR65","doi-asserted-by":"crossref","unstructured":"Sch\u00f6nfeld, E., Ebrahimi, S., Sinha, S., Darrell, T., & Akata, Z. (2019). Generalized zero- and few-shot learning via aligned variational autoencoders. In: CVPR, pp 8239\u20138247","DOI":"10.1109\/CVPR.2019.00844"},{"key":"2394_CR66","doi-asserted-by":"crossref","unstructured":"Schroff, F., Kalenichenko, D., & Philbin, J. (2015) Facenet: A unified embedding for face recognition and clustering. In: CVPR, pp 815\u2013823","DOI":"10.1109\/CVPR.2015.7298682"},{"key":"2394_CR67","unstructured":"Shen, S., Li, C., Hu, X., Xie, Y., Yang, J., Zhang, P., Rohrbach, A., Gan, Z., Wang, L., Yuan, L., Liu, C., Keutzer, K., Darrell, T., & Gao, J. (2022). K-lite: Learning transferable visual models with external knowledge. In: NeurIPS"},{"key":"2394_CR68","doi-asserted-by":"crossref","unstructured":"Shen, Y., Qin, J., & Huang, L. (2020) Invertible zero-shot recognition flows. In: ECCV","DOI":"10.1007\/978-3-030-58517-4_36"},{"key":"2394_CR69","unstructured":"Sohl-Dickstein, J. N., Weiss, E. A., Maheswaranathan, N., & Ganguli, S. (2015). Deep unsupervised learning using nonequilibrium thermodynamics. In: ICML"},{"key":"2394_CR70","doi-asserted-by":"crossref","unstructured":"Torralba, A., & Efros, A. A. (2011) Unbiased look at dataset bias. In: CVPR","DOI":"10.1109\/CVPR.2011.5995347"},{"key":"2394_CR71","doi-asserted-by":"crossref","unstructured":"Tsai, Y. H. H., Huang, L. K., & Salakhutdinov, R. (2017). Learning robust visual-semantic embeddings. In: ICCV, pp 3591\u20133600","DOI":"10.1109\/ICCV.2017.386"},{"key":"2394_CR72","unstructured":"Umapathi, L. K., Pal, A., & Sankarasubbu, M. (2023) Med-halt: Medical domain hallucination test for large language models. arXiv preprint arXiv:2307.15343"},{"key":"2394_CR73","doi-asserted-by":"crossref","unstructured":"Vyas, M. R., Venkateswara, H., & Panchanathan, S. (2020) Leveraging seen and unseen semantic relationships for generative zero-shot learning. In: ECCV","DOI":"10.1007\/978-3-030-58577-8_5"},{"key":"2394_CR74","doi-asserted-by":"publisher","first-page":"356","DOI":"10.1007\/s11263-017-1027-5","volume":"124","author":"Q Wang","year":"2017","unstructured":"Wang, Q., & Chen, K. (2017). Zero-shot visual recognition via bidirectional latent embedding. International Journal of Computer Vision, 124, 356\u2013383.","journal-title":"International Journal of Computer Vision"},{"key":"2394_CR75","unstructured":"Welinder, P., Branson, S., Mita, T., Wah, C., Schroff, F., Belongie, S. J., & Perona, P. (2010). Caltech-ucsd birds 200. Technical Report CNS-TR-2010-001, Caltech,"},{"key":"2394_CR76","doi-asserted-by":"crossref","unstructured":"Wen, Y., Zhang, K., Li, Z., & Qiao, Y. (2016). A discriminative feature learning approach for deep face recognition. In: ECCV","DOI":"10.1007\/978-3-319-46478-7_31"},{"key":"2394_CR77","doi-asserted-by":"crossref","unstructured":"Wu, J., Zhang, T., Zha, Z., Luo, J., Zhang, Y., & Wu, F. (2020) Self-supervised domain-aware generative network for generalized zero-shot learning. In: CVPR, pp 12764\u201312773","DOI":"10.1109\/CVPR42600.2020.01278"},{"key":"2394_CR78","doi-asserted-by":"crossref","unstructured":"Xian, Y., Lorenz, T., Schiele, B., & Akata, Z. (2018) Feature generating networks for zero-shot learning. In: CVPR, pp 5542\u20135551","DOI":"10.1109\/CVPR.2018.00581"},{"key":"2394_CR79","doi-asserted-by":"crossref","unstructured":"Xian, Y., Schiele, B., & Akata, Z. (2017). Zero-shot learning - the good, the bad and the ugly. CVPR pp 3077\u20133086","DOI":"10.1109\/CVPR.2017.328"},{"key":"2394_CR80","doi-asserted-by":"crossref","unstructured":"Xian, Y., Sharma, S., Schiele, B., & Akata, Z. (2019) F-vaegan-d2: A feature generating framework for any-shot learning. In: CVPR, pp 10267\u201310276","DOI":"10.1109\/CVPR.2019.01052"},{"key":"2394_CR81","doi-asserted-by":"crossref","unstructured":"Xie, G. S., Liu, L., Jin, X., Zhu, F., Zhang, Z., Qin, J., Yao, Y., Shao, L. (2019). Attentive region embedding network for zero-shot learning. In: CVPR, pp 9376\u20139385","DOI":"10.1109\/CVPR.2019.00961"},{"key":"2394_CR82","doi-asserted-by":"crossref","unstructured":"Xie, G. S., Liu, L., Jin, X., Zhu, F., Zhang, Z., Yao, Y., Qin, J., & Shao, L. (2020). Region graph embedding network for zero-shot learning. In: ECCV","DOI":"10.1109\/CVPR.2019.00961"},{"issue":"7","key":"2394_CR83","doi-asserted-by":"publisher","first-page":"2903","DOI":"10.1109\/TNNLS.2020.3046924","volume":"33","author":"GS Xie","year":"2021","unstructured":"Xie, G. S., Zhang, Z., Liu, G., Zhu, F., Liu, L., Shao, L., & Li, X. (2021). Generalized zero-shot learning with multiple graph adaptive generative networks. IEEE Transactions on Neural Networks and Learning Systems, 33(7), 2903\u20132915.","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"2394_CR84","unstructured":"Xu, W., Xian, Y., Wang, J., Schiele, B., & Akata, Z. (2020) Attribute prototype network for zero-shot learning. In: NeurIPS"},{"issue":"12","key":"2394_CR85","doi-asserted-by":"publisher","first-page":"9733","DOI":"10.1109\/TPAMI.2021.3127346","volume":"44","author":"C Yan","year":"2021","unstructured":"Yan, C., Chang, X., Li, Z., Ge, Z., Guan, W., Zhu, L., & Zheng, Q. (2021). Zeronas: Differentiable generative adversarial networks search for zero-shot learning. IEEE transactions on pattern analysis and machine intelligence, 44(12), 9733\u20139740.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2394_CR86","unstructured":"Yu, H., & Lee, B. (2019) Zero-shot learning via simultaneous generating and learning. In: NeurIPS"},{"key":"2394_CR87","doi-asserted-by":"crossref","unstructured":"Yu, Y., Ji, Z., Han, J., & Zhang, Z. (2020) Episode-based prototype generating network for zero-shot learning. In: CVPR, pp 14032\u201314041","DOI":"10.1109\/CVPR42600.2020.01405"},{"key":"2394_CR88","doi-asserted-by":"crossref","unstructured":"Yue, Z., Wang, T., Zhang, H., Sun, Q., & Hua, X. (2021) Counterfactual zero-shot and open-set visual recognition. In: CVPR","DOI":"10.1109\/CVPR46437.2021.01515"},{"key":"2394_CR89","unstructured":"Zhang, F., & Shi, G. (2019) Co-representation network for generalized zero-shot learning. In: ICML"},{"key":"2394_CR90","unstructured":"Zhang, S., Pan, L., Zhao, J., & Wang, W. Y. (2023a). Mitigating language model hallucination with interactive question-knowledge alignment. arXiv preprint arXiv:2305.13669"},{"key":"2394_CR91","unstructured":"Zhang, Y., Zhou, D., Hooi, B., Wang, K., & Feng, J. (2023b). Expanding small-scale datasets with guided imagination. In: NeurIPS"},{"key":"2394_CR92","unstructured":"Zhu, Y., Xie, J., Tang, Z., Peng, X., & Elgammal, A. (2019) Semantic-guided multi-attention localization for zero-shot learning. In: NeurIPS"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02394-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02394-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02394-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,7]],"date-time":"2025-06-07T06:00:05Z","timestamp":1749276005000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02394-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,3,10]]},"references-count":92,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2025,7]]}},"alternative-id":["2394"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02394-7","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,3,10]]},"assertion":[{"value":"15 January 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 February 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"10 March 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}