{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,18]],"date-time":"2026-06-18T15:47:24Z","timestamp":1781797644342,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":79,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T00:00:00Z","timestamp":1730073600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"National Key Research and Devel- opment Program of China","award":["1"],"award-info":[{"award-number":["1"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,28]]},"DOI":"10.1145\/3664647.3681629","type":"proceedings-article","created":{"date-parts":[[2024,10,26]],"date-time":"2024-10-26T06:59:49Z","timestamp":1729925989000},"page":"5181-5190","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":10,"title":["CREST: Cross-modal Resonance through Evidential Deep Learning for Enhanced Zero-Shot Learning"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0661-712X","authenticated-orcid":false,"given":"Haojian","family":"Huang","sequence":"first","affiliation":[{"name":"TeleAI &amp; The University of Hong Kong, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-0356-4054","authenticated-orcid":false,"given":"Xiaozhennn","family":"Qiao","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China &amp; TeleAI, Hefei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9991-6892","authenticated-orcid":false,"given":"Zhuo","family":"Chen","sequence":"additional","affiliation":[{"name":"Zhejiang University, Hangzhou, Zhejiang, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-1666-2037","authenticated-orcid":false,"given":"Haodong","family":"Chen","sequence":"additional","affiliation":[{"name":"Northwestern Polytechnical University, Xi'an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-6444-0453","authenticated-orcid":false,"given":"Bingyu","family":"Li","sequence":"additional","affiliation":[{"name":"University of Science and Technology of China &amp; TeleAI, Hefei, Anhui, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4224-9811","authenticated-orcid":false,"given":"Zhe","family":"Sun","sequence":"additional","affiliation":[{"name":"Northwestern Polytechnical University &amp; TeleAI, Xi'an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4634-3802","authenticated-orcid":false,"given":"Mulin","family":"Chen","sequence":"additional","affiliation":[{"name":"Northwest Polytechnical University Xi'an &amp; TeleAI, Xi'an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0019-4197","authenticated-orcid":false,"given":"Xuelong","family":"Li","sequence":"additional","affiliation":[{"name":"TeleAI, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2024,10,28]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Label-embedding for image classification","author":"Akata Zeynep","year":"2015","unstructured":"Zeynep Akata, Florent Perronnin, Zaid Harchaoui, and Cordelia Schmid. 2015. Label-embedding for image classification. IEEE transactions on pattern analysis and machine intelligence 38, 7 (2015), 1425--1438."},{"key":"e_1_3_2_1_2_1","first-page":"19352","article-title":"Fine-grained zero-shot learning with dna as side information","volume":"34","author":"Badirli Sarkhan","year":"2021","unstructured":"Sarkhan Badirli, Zeynep Akata, George Mohler, Christine Picard, and Mehmet M Dundar. 2021. Fine-grained zero-shot learning with dna as side information. Advances in Neural Information Processing Systems 34 (2021), 19352--19362.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_3_1","unstructured":"Wentao Bao Qi Yu and Yu Kong. 2021. Evidential Deep Learning for Open Set Action Recognition. arXiv:2107.10161 [cs.CV]"},{"key":"e_1_3_2_1_4_1","volume-title":"Ethical issues in advanced artificial intelligence. Machine Ethics and Robot Ethics","author":"Bostrom Nick","year":"2020","unstructured":"Nick Bostrom. 2020. Ethical issues in advanced artificial intelligence. Machine Ethics and Robot Ethics (2020), 69--75."},{"key":"e_1_3_2_1_5_1","volume-title":"Zeroshot semantic segmentation. Advances in Neural Information Processing Systems 32","author":"Bucher Maxime","year":"2019","unstructured":"Maxime Bucher, Tuan-Hung Vu, Matthieu Cord, and Patrick P\u00e9rez. 2019. Zeroshot semantic segmentation. Advances in Neural Information Processing Systems 32 (2019)."},{"key":"e_1_3_2_1_6_1","volume-title":"FineCLIPER: Multi-modal Fine-grained CLIP for Dynamic Facial Expression Recognition with AdaptERs. arXiv preprint arXiv:2407.02157","author":"Chen Haodong","year":"2024","unstructured":"Haodong Chen, Haojian Huang, Junhao Dong, Mingzhe Zheng, and Dian Shao. 2024. FineCLIPER: Multi-modal Fine-grained CLIP for Dynamic Facial Expression Recognition with AdaptERs. arXiv preprint arXiv:2407.02157 (2024)."},{"key":"e_1_3_2_1_7_1","volume-title":"GaussianVTON: 3D Human Virtual Try-ON via Multi-Stage Gaussian Splatting Editing with Image Prompting. arXiv preprint arXiv:2405.07472","author":"Chen Haodong","year":"2024","unstructured":"Haodong Chen, Yongle Huang, Haojian Huang, Xiangsheng Ge, and Dian Shao. 2024. GaussianVTON: 3D Human Virtual Try-ON via Multi-Stage Gaussian Splatting Editing with Image Prompting. arXiv preprint arXiv:2405.07472 (2024)."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"crossref","unstructured":"Jiaoyan Chen Yuxia Geng Zhuo Chen Jeff Z. Pan Yuan He Wen Zhang Ian Horrocks and Huajun Chen. 2022. Zero-shot and Few-shot Learning with Knowledge Graphs: A Comprehensive Survey. arXiv:2112.10006 [cs.LG]","DOI":"10.1109\/JPROC.2023.3279374"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","unstructured":"Shiming Chen Ziming Hong Wenjin Hou Guo-Sen Xie Yibing Song Jian Zhao Xinge You Shuicheng Yan and Ling Shao. 2022. TransZero: Cross Attributeguided Transformer for Zero-Shot Learning. (2022).","DOI":"10.1109\/TPAMI.2022.3229526"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i1.19909"},{"key":"e_1_3_2_1_11_1","volume-title":"MSDN: Mutually Semantic Distillation Network for Zero-Shot Learning. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition ( CVPR ).","author":"Chen Shiming","year":"2022","unstructured":"Shiming Chen, Ziming Hong, Guo-Sen Xie, Wenhan Yang, Qinmu Peng, Kai Wang, Jian Zhao, and Xinge You. 2022. MSDN: Mutually Semantic Distillation Network for Zero-Shot Learning. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition ( CVPR )."},{"key":"e_1_3_2_1_12_1","volume-title":"International Conference on Machine Learning. PMLR, 4611--4622","author":"Chen Shiming","year":"2023","unstructured":"Shiming Chen, Wenjin Hou, Ziming Hong, Xiaohan Ding, Yibing Song, Xinge You, Tongliang Liu, and Kun Zhang. 2023. Evolving semantic prototype improves generative zero-shot learning. In International Conference on Machine Learning. PMLR, 4611--4622."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00019"},{"key":"e_1_3_2_1_14_1","first-page":"16622","article-title":"Hsva: Hierarchical semantic-visual adaptation for zeroshot learning","volume":"34","author":"Chen Shiming","year":"2021","unstructured":"Shiming Chen, Guosen Xie, Yang Liu, Qinmu Peng, Baigui Sun, Hao Li, Xinge You, and Ling Shao. 2021. Hsva: Hierarchical semantic-visual adaptation for zeroshot learning. Advances in Neural Information Processing Systems 34 (2021), 16622--16634.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_15_1","volume-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR).","author":"Chen Xin","year":"2023","unstructured":"Xin Chen and Li Wang. 2023. Next-Generation Variational Autoencoders for Zero-Shot Learning. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)."},{"key":"e_1_3_2_1_16_1","volume-title":"ISWC 2021, Virtual Event, October 24--28, 2021, Proceedings 20","author":"Chen Zhuo","year":"2021","unstructured":"Zhuo Chen, Jiaoyan Chen, Yuxia Geng, Jeff Z Pan, Zonggang Yuan, and Huajun Chen. 2021. Zero-shot visual question answering using knowledge graph. In The SemanticWeb--ISWC 2021: 20th International SemanticWeb Conference, ISWC 2021, Virtual Event, October 24--28, 2021, Proceedings 20. Springer, 146--162."},{"key":"e_1_3_2_1_17_1","volume-title":"DUET: Cross-Modal Semantic Grounding for Contrastive Zero-Shot Learning","author":"Chen Zhuo","year":"2023","unstructured":"Zhuo Chen, Yufeng Huang, Jiaoyan Chen, Yuxia Geng, Wen Zhang, Yin Fang, Jeff Z. Pan, and Huajun Chen. 2023. DUET: Cross-Modal Semantic Grounding for Contrastive Zero-Shot Learning. In AAAI. AAAI Press, 405--413."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00859"},{"key":"e_1_3_2_1_19_1","volume-title":"Adaptive and Generative Zero-Shot Learning. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=ahAUv8TI2Mz","author":"Chou Yu-Ying","year":"2021","unstructured":"Yu-Ying Chou, Hsuan-Tien Lin, and Tyng-Luh Liu. 2021. Adaptive and Generative Zero-Shot Learning. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=ahAUv8TI2Mz"},{"key":"e_1_3_2_1_20_1","volume-title":"Proceedings of the IEEE International Conference on Computer Vision (ICCV).","author":"Davis Emily","year":"2023","unstructured":"Emily Davis and Nathan Roberts. 2023. Refining Zero-Shot Learning with Attribute-Guided Attention Mechanisms. In Proceedings of the IEEE International Conference on Computer Vision (ICCV)."},{"key":"e_1_3_2_1_21_1","volume-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 11583--11592","author":"Ding Jian","year":"2022","unstructured":"Jian Ding, Nan Xue, Gui-Song Xia, and Dengxin Dai. 2022. Decoupling zeroshot semantic segmentation. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 11583--11592."},{"key":"e_1_3_2_1_22_1","volume-title":"Devise: A deep visual-semantic embedding model. Advances in neural information processing systems 26","author":"Frome Andrea","year":"2013","unstructured":"Andrea Frome, Greg S Corrado, Jon Shlens, Samy Bengio, Jeff Dean, Marc-Aurelio Ranzato, and Tomas Mikolov. 2013. Devise: A deep visual-semantic embedding model. Advances in neural information processing systems 26 (2013)."},{"key":"e_1_3_2_1_23_1","volume-title":"Zeroshot learning on semantic class prototype graph","author":"Fu Zhenyong","year":"2017","unstructured":"Zhenyong Fu, Tao Xiang, Elyor Kodirov, and Shaogang Gong. 2017. Zeroshot learning on semantic class prototype graph. IEEE transactions on pattern analysis and machine intelligence 40, 8 (2017), 2009--2022."},{"key":"e_1_3_2_1_24_1","volume-title":"Weinberger","author":"Guo Chuan","year":"2017","unstructured":"Chuan Guo, Geoff Pleiss, Yu Sun, and Kilian Q. Weinberger. 2017. On Calibration of Modern Neural Networks. arXiv:1706.04599 [cs.LG]"},{"key":"e_1_3_2_1_25_1","unstructured":"Ankit Gupta and Prashant Sharma. 2022. Diverse Feature Synthesis with GANs for Generalized Zero-Shot Learning. In Artificial Intelligence and Statistics (AISTATS)."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00240"},{"key":"e_1_3_2_1_27_1","unstructured":"Zongbo Han Changqing Zhang Huazhu Fu and Joey Tianyi Zhou. 2021. Trusted Multi-View Classification. arXiv:2102.02051 [cs.LG]"},{"key":"e_1_3_2_1_28_1","unstructured":"Zongbo Han Changqing Zhang Huazhu Fu and Joey Tianyi Zhou. 2022. Trusted Multi-View Classification with Dynamic Evidential Fusion. arXiv:2204.11423 [cs.LG]"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_1_30_1","volume-title":"International Conference on Machine Learning. PMLR, 9118--9147","author":"Huang Wenlong","year":"2022","unstructured":"Wenlong Huang, Pieter Abbeel, Deepak Pathak, and Igor Mordatch. 2022. Language models as zero-shot planners: Extracting actionable knowledge for embodied agents. In International Conference on Machine Learning. PMLR, 9118--9147."},{"key":"e_1_3_2_1_31_1","first-page":"19849","article-title":"Compositional zero-shot learning via finegrained dense feature composition","volume":"33","author":"Huynh Dat","year":"2020","unstructured":"Dat Huynh and Ehsan Elhamifar. 2020. Compositional zero-shot learning via finegrained dense feature composition. Advances in Neural Information Processing Systems 33 (2020), 19849--19860.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00454"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00094"},{"key":"e_1_3_2_1_34_1","volume-title":"Subjective Logic","author":"J\u00f8sang Audun","unstructured":"Audun J\u00f8sang. 2016. Subjective Logic. Vol. 3. Springer."},{"key":"e_1_3_2_1_35_1","volume-title":"Machel Reid, Yutaka Matsuo, and Yusuke Iwasawa.","author":"Kojima Takeshi","year":"2022","unstructured":"Takeshi Kojima, Shixiang Shane Gu, Machel Reid, Yutaka Matsuo, and Yusuke Iwasawa. 2022. Large language models are zero-shot reasoners. Advances in neural information processing systems 35 (2022), 22199--22213."},{"key":"e_1_3_2_1_36_1","volume-title":"Proceedings of the ACM Conference on Knowledge Discovery and Data Mining (KDD).","author":"Kumar Vikram","year":"2022","unstructured":"Vikram Kumar and Manish Jain. 2022. Bi-Directional Attention: Bridging Semantic Gaps in Zero-Shot Learning. In Proceedings of the ACM Conference on Knowledge Discovery and Data Mining (KDD)."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206594"},{"key":"e_1_3_2_1_38_1","volume-title":"Attributebased classification for zero-shot visual object categorization","author":"Lampert Christoph H","year":"2013","unstructured":"Christoph H Lampert, Hannes Nickisch, and Stefan Harmeling. 2013. Attributebased classification for zero-shot visual object categorization. IEEE transactions on pattern analysis and machine intelligence 36, 3 (2013), 453--465."},{"key":"e_1_3_2_1_39_1","first-page":"3","article-title":"Zero-data learning of new tasks","volume":"1","author":"Larochelle Hugo","year":"2008","unstructured":"Hugo Larochelle, Dumitru Erhan, and Yoshua Bengio. 2008. Zero-data learning of new tasks.. In AAAI, Vol. 1. 3.","journal-title":"AAAI"},{"key":"e_1_3_2_1_40_1","volume-title":"Enhanced Cross-Modal Embedding Alignment for Robust Zero-Shot Object Recognition. In European Conference on Computer Vision (ECCV).","author":"Lee Hyun","year":"2022","unstructured":"Hyun Lee and Young Kim. 2022. Enhanced Cross-Modal Embedding Alignment for Robust Zero-Shot Object Recognition. In European Conference on Computer Vision (ECCV)."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00779"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i7.20724"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00680"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00379"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"crossref","unstructured":"Shaobo Min Hantao Yao Hongtao Xie Chaoqun Wang Zheng-Jun Zha and Yongdong Zhang. 2020. Domain-aware Visual Bias Eliminating for Generalized Zero-Shot Learning. arXiv:2003.13261 [cs.CV]","DOI":"10.1109\/CVPR42600.2020.01268"},{"key":"e_1_3_2_1_46_1","volume-title":"Proceedings, Part XXII 16","author":"Narayan Sanath","year":"2020","unstructured":"Sanath Narayan, Akshita Gupta, Fahad Shahbaz Khan, Cees GM Snoek, and Ling Shao. 2020. Latent embedding feedback and discriminative features for zeroshot classification. In Computer Vision--ECCV 2020: 16th European Conference, Glasgow, UK, August 23--28, 2020, Proceedings, Part XXII 16. Springer, 479--495."},{"key":"e_1_3_2_1_47_1","volume-title":"Proceedings of the International Conference on Learning Representations (ICLR).","author":"O'Reilly Connor","year":"2021","unstructured":"Connor O'Reilly and Fang Liu. 2021. Deep Attention-Based Frameworks: The Future of Zero-Shot Learning. In Proceedings of the International Conference on Learning Representations (ICLR)."},{"key":"e_1_3_2_1_48_1","volume-title":"Zero-shot learning with semantic output codes. Advances in neural information processing systems 22","author":"Palatucci Mark","year":"2009","unstructured":"Mark Palatucci, Dean Pomerleau, Geoffrey E Hinton, and Tom M Mitchell. 2009. Zero-shot learning with semantic output codes. Advances in neural information processing systems 22 (2009)."},{"key":"e_1_3_2_1_49_1","volume-title":"Semantic Augmentation in Visual-Semantic Embeddings for Comprehensive Zero-Shot Learning. Journal of Artificial Intelligence Research (JAIR)","author":"Patel Rahul","year":"2021","unstructured":"Rahul Patel and Surya Singh. 2021. Semantic Augmentation in Visual-Semantic Embeddings for Comprehensive Zero-Shot Learning. Journal of Artificial Intelligence Research (JAIR) (2021)."},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6247998"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3547922"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.13"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00844"},{"key":"e_1_3_2_1_55_1","unstructured":"Murat Sensoy Lance Kaplan and Melih Kandemir. 2018. Evidential Deep Learning to Quantify Classification Uncertainty. arXiv:1806.01768 [cs.LG]"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2023.102113"},{"key":"e_1_3_2_1_57_1","volume-title":"Proceedings, Part XVI 16","author":"Shen Yuming","year":"2020","unstructured":"Yuming Shen, Jie Qin, Lei Huang, Li Liu, Fan Zhu, and Ling Shao. 2020. Invertible zero-shot recognition flows. In Computer Vision--ECCV 2020: 16th European Conference, Glasgow, UK, August 23--28, 2020, Proceedings, Part XVI 16. Springer, 614--631."},{"key":"e_1_3_2_1_58_1","volume-title":"Proceedings of the International Conference on Machine Learning (ICML).","author":"Smith John","year":"2023","unstructured":"John Smith and Alice Doe. 2023. Advances in Regularization Techniques for Embedding-Based Zero-Shot Learning. In Proceedings of the International Conference on Machine Learning (ICML)."},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00113"},{"key":"e_1_3_2_1_60_1","volume-title":"Avinava Dubey, and Vikas Sindhwani.","author":"Varley Jake","year":"2024","unstructured":"Jake Varley, Sumeet Singh, Deepali Jain, Krzysztof Choromanski, Andy Zeng, Somnath Basu Roy Chowdhury, Avinava Dubey, and Vikas Sindhwani. 2024. Embodied AI with Two Arms: Zero-shot Learning, Safety and Modularity. arXiv:2404.03570 [cs.RO]"},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00450"},{"key":"e_1_3_2_1_62_1","volume-title":"Brian Lester, Nan Du, Andrew M Dai, and Quoc V Le.","author":"Wei Jason","year":"2021","unstructured":"Jason Wei, Maarten Bosma, Vincent Y Zhao, Kelvin Guu, Adams Wei Yu, Brian Lester, Nan Du, Andrew M Dai, and Quoc V Le. 2021. Finetuned language models are zero-shot learners. arXiv preprint arXiv:2109.01652 (2021)."},{"key":"e_1_3_2_1_63_1","unstructured":"Peter Welinder Steve Branson Takeshi Mita Catherine Wah Florian Schroff Serge Belongie and Pietro Perona. 2010. Caltech-UCSD birds 200. (2010)."},{"key":"e_1_3_2_1_64_1","volume-title":"Zero-shot learning?a comprehensive evaluation of the good, the bad and the ugly","author":"Xian Yongqin","year":"2018","unstructured":"Yongqin Xian, Christoph H Lampert, Bernt Schiele, and Zeynep Akata. 2018. Zero-shot learning?a comprehensive evaluation of the good, the bad and the ugly. IEEE transactions on pattern analysis and machine intelligence 41, 9 (2018), 2251--2265."},{"key":"e_1_3_2_1_65_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00581"},{"key":"e_1_3_2_1_66_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.328"},{"key":"e_1_3_2_1_67_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01052"},{"key":"e_1_3_2_1_68_1","volume-title":"Proceedings, Part IV 16","author":"Xie Guo-Sen","year":"2020","unstructured":"Guo-Sen Xie, Li Liu, Fan Zhu, Fang Zhao, Zheng Zhang, Yazhou Yao, Jie Qin, and Ling Shao. 2020. Region graph embedding network for zero-shot learning. In Computer Vision--ECCV 2020: 16th European Conference, Glasgow, UK, August 23--28, 2020, Proceedings, Part IV 16. Springer, 562--580."},{"key":"e_1_3_2_1_69_1","doi-asserted-by":"crossref","unstructured":"Cai Xu Jiajun Si Ziyu Guan Wei Zhao Yue Wu and Xiyue Gao. 2024. Reliable Conflictive Multi-View Learning. arXiv:2402.16897 [cs.LG]","DOI":"10.1609\/aaai.v38i14.29546"},{"key":"e_1_3_2_1_70_1","volume-title":"Videoclip: Contrastive pre-training for zero-shot video-text understanding. arXiv preprint arXiv:2109.14084","author":"Xu Hu","year":"2021","unstructured":"Hu Xu, Gargi Ghosh, Po-Yao Huang, Dmytro Okhonko, Armen Aghajanyan, Florian Metze, Luke Zettlemoyer, and Christoph Feichtenhofer. 2021. Videoclip: Contrastive pre-training for zero-shot video-text understanding. arXiv preprint arXiv:2109.14084 (2021)."},{"key":"e_1_3_2_1_71_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02003"},{"key":"e_1_3_2_1_72_1","first-page":"21969","article-title":"Attribute prototype network for zero-shot learning","volume":"33","author":"Xu Wenjia","year":"2020","unstructured":"Wenjia Xu, Yongqin Xian, Jiuniu Wang, Bernt Schiele, and Zeynep Akata. 2020. Attribute prototype network for zero-shot learning. Advances in Neural Information Processing Systems 33 (2020), 21969--21980.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_73_1","volume-title":"Lin (Eds.)","volume":"33","author":"Xu Wenjia","year":"2020","unstructured":"Wenjia Xu, Yongqin Xian, Jiuniu Wang, Bernt Schiele, and Zeynep Akata. 2020. Attribute Prototype Network for Zero-Shot Learning. In Advances in Neural Information Processing Systems, H. Larochelle, M. Ranzato, R. Hadsell, M.F. Balcan, and H. Lin (Eds.), Vol. 33. Curran Associates, Inc., 21969--21980. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2020\/file\/ fa2431bf9d65058fe34e9713e32d60e6-Paper.pdf"},{"key":"e_1_3_2_1_74_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-022-01613-9"},{"key":"e_1_3_2_1_75_1","first-page":"124","article-title":"Zero-shot video question answering via frozen bidirectional language models","volume":"35","author":"Yang Antoine","year":"2022","unstructured":"Antoine Yang, Antoine Miech, Josef Sivic, Ivan Laptev, and Cordelia Schmid. 2022. Zero-shot video question answering via frozen bidirectional language models. Advances in Neural Information Processing Systems 35 (2022), 124--141.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_76_1","unstructured":"Yang Yu Danruo Deng Furui Liu Yueming Jin Qi Dou Guangyong Chen and Pheng-Ann Heng. 2023. Adaptive Negative Evidential Deep Learning for Openset Semi-supervised Learning. arXiv:2303.12091 [cs.LG]"},{"key":"e_1_3_2_1_77_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01515"},{"key":"e_1_3_2_1_78_1","unstructured":"Yue Zhang and Zheng Lu. 2021. Generative FlowModels: A NewFrontier for Zero-Shot Learning Feature Synthesis. In Advances in Neural Information Processing Systems (NeurIPS)."},{"key":"e_1_3_2_1_79_1","volume-title":"Semantic-guided multi-attention localization for zero-shot learning. Advances in Neural Information Processing Systems 32","author":"Zhu Yizhe","year":"2019","unstructured":"Yizhe Zhu, Jianwen Xie, Zhiqiang Tang, Xi Peng, and Ahmed Elgammal. 2019. Semantic-guided multi-attention localization for zero-shot learning. Advances in Neural Information Processing Systems 32 (2019)."}],"event":{"name":"MM '24: The 32nd ACM International Conference on Multimedia","location":"Melbourne VIC Australia","acronym":"MM '24","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 32nd ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3681629","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3664647.3681629","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:17:49Z","timestamp":1750295869000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3681629"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,28]]},"references-count":79,"alternative-id":["10.1145\/3664647.3681629","10.1145\/3664647"],"URL":"https:\/\/doi.org\/10.1145\/3664647.3681629","relation":{},"subject":[],"published":{"date-parts":[[2024,10,28]]},"assertion":[{"value":"2024-10-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}