{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T16:59:13Z","timestamp":1777568353850,"version":"3.51.4"},"publisher-location":"Cham","reference-count":45,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031200526","type":"print"},{"value":"9783031200533","type":"electronic"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-20053-3_20","type":"book-chapter","created":{"date-parts":[[2022,11,5]],"date-time":"2022-11-05T16:21:52Z","timestamp":1667665312000},"page":"339-355","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":34,"title":["Learning Invariant Visual Representations for\u00a0Compositional Zero-Shot Learning"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5305-5433","authenticated-orcid":false,"given":"Tian","family":"Zhang","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4726-093X","authenticated-orcid":false,"given":"Kongming","family":"Liang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8372-5637","authenticated-orcid":false,"given":"Ruoyi","family":"Du","sequence":"additional","affiliation":[]},{"given":"Xian","family":"Sun","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2950-2488","authenticated-orcid":false,"given":"Zhanyu","family":"Ma","sequence":"additional","affiliation":[]},{"given":"Jun","family":"Guo","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,11,6]]},"reference":[{"key":"20_CR1","first-page":"3438","volume":"34","author":"K Ahuja","year":"2021","unstructured":"Ahuja, K., et al.: Invariance principle meets information bottleneck for out-of-distribution generalization. NeurIPS 34, 3438\u20133450 (2021)","journal-title":"NeurIPS"},{"key":"20_CR2","unstructured":"Arjovsky, M., Bottou, L., Gulrajani, I., Lopez-Paz, D.: Invariant risk minimization. arXiv preprint arXiv:1907.02893 (2019)"},{"key":"20_CR3","first-page":"1462","volume":"33","author":"Y Atzmon","year":"2021","unstructured":"Atzmon, Y., Kreuk, F., Shalit, U., Chechik, G.: A causal view of compositional zero-shot recognition. NeurIPS 33, 1462\u20131473 (2021)","journal-title":"NeurIPS"},{"key":"20_CR4","unstructured":"Bengio, Y., et al.: A meta-transfer objective for learning to disentangle causal mechanisms. arXiv preprint arXiv:1901.10912 (2019)"},{"key":"20_CR5","unstructured":"Blanchard, G., Lee, G., Scott, C.: Generalizing from several related classification tasks to a new unlabeled sample. NeurIPS (2011)"},{"key":"20_CR6","doi-asserted-by":"crossref","unstructured":"Carlucci, F.M., D\u2019Innocente, A., Bucci, S., Caputo, B., Tommasi, T.: Domain generalization by solving jigsaw puzzles. In: CVPR (2020)","DOI":"10.1109\/CVPR.2019.00233"},{"key":"20_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"52","DOI":"10.1007\/978-3-319-46475-6_4","volume-title":"Computer Vision \u2013 ECCV 2016","author":"W-L Chao","year":"2016","unstructured":"Chao, W.-L., Changpinyo, S., Gong, B., Sha, F.: An empirical study and analysis of generalized zero-shot learning for object recognition in the wild. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9906, pp. 52\u201368. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46475-6_4"},{"key":"20_CR8","doi-asserted-by":"crossref","unstructured":"Chen, C.Y., Grauman, K.: Inferring analogous attributes. In: CVPR, pp. 200\u2013207 (2014)","DOI":"10.1109\/CVPR.2014.33"},{"key":"20_CR9","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.J., Li, K., Fei-Fei, L.: ImageNet: a large-scale hierarchical image database. In: CVPR, pp. 248\u2013255 (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"20_CR10","unstructured":"Geirhos, R., Rubisch, P., Michaelis, C., Bethge, M., Wichmann, F.A., Brendel, W.: ImageNet-trained CNNs are biased towards texture; increasing shape bias improves accuracy and robustness. arXiv preprint arXiv:1811.12231 (2018)"},{"key":"20_CR11","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: CVPR, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"20_CR12","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1007\/978-3-030-58536-5_8","volume-title":"Computer Vision \u2013 ECCV 2020","author":"Z Huang","year":"2020","unstructured":"Huang, Z., Wang, H., Xing, E.P., Huang, D.: Self-challenging improves cross-domain generalization. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12347, pp. 124\u2013140. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58536-5_8"},{"key":"20_CR13","doi-asserted-by":"crossref","unstructured":"Isola, P., Lim, J.J., Adelson, E.H.: Discovering states and transformations in image collections. In: CVPR, pp. 1383\u20131391 (2015)","DOI":"10.1109\/CVPR.2015.7298744"},{"key":"20_CR14","unstructured":"Khezeli, K., Blaas, A., Soboczenski, F., Chia, N., Kalantari, J.: On invariance penalties for risk minimization. arXiv preprint arXiv:2106.09777 (2021)"},{"key":"20_CR15","doi-asserted-by":"crossref","unstructured":"Kim, D., Yoo, Y., Park, S., Kim, J., Lee, J.: Selfreg: self-supervised contrastive regularization for domain generalization. In: ICCV, pp. 9619\u20139628 (2021)","DOI":"10.1109\/ICCV48922.2021.00948"},{"key":"20_CR16","unstructured":"Koyama, M., Yamaguchi, S.: Out-of-distribution generalization with maximal invariant predictor. ICLR (2021)"},{"key":"20_CR17","unstructured":"Krueger, D., et al.: Out-of-distribution generalization via risk extrapolation (rex). In: ICML, pp. 5815\u20135826 (2021)"},{"key":"20_CR18","doi-asserted-by":"crossref","unstructured":"Li, H., Pan, S.J., Wang, S., Kot, A.C.: Domain generalization with adversarial feature learning. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00566"},{"key":"20_CR19","doi-asserted-by":"crossref","unstructured":"Li, Y.L., Xu, Y., Mao, X., Lu, C.: Symmetry and group in attribute-object compositions. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01133"},{"key":"20_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"852","DOI":"10.1007\/978-3-319-46448-0_51","volume-title":"Computer Vision \u2013 ECCV 2016","author":"C Lu","year":"2016","unstructured":"Lu, C., Krishna, R., Bernstein, M., Fei-Fei, L.: Visual relationship detection with language priors. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9905, pp. 852\u2013869. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46448-0_51"},{"key":"20_CR21","doi-asserted-by":"crossref","unstructured":"Mancini, M., Naeem, M.F., Xian, Y., Akata, Z.: Open world compositional zero-shot learning. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00518"},{"key":"20_CR22","doi-asserted-by":"crossref","unstructured":"Misra, I., Gupta, A., Hebert, M.: From red wine to red tomato: composition with context. In: CVPR, pp. 1160\u20131169 (2017)","DOI":"10.1109\/CVPR.2017.129"},{"key":"20_CR23","unstructured":"Muandet, K., Balduzzi, D., Sch\u00f6lkopf, B.: Domain generalization via invariant feature representation. In: ICML, pp. 10\u201318 (2013)"},{"key":"20_CR24","doi-asserted-by":"crossref","unstructured":"Nagarajan, T., Grauman, K.: Attributes as operators: factorizing unseen attribute-object compositions. In: ECCV (2018)","DOI":"10.1007\/978-3-030-01246-5_11"},{"key":"20_CR25","unstructured":"Palatucci, M., Pomerleau, D., Hinton, G.E., Mitchell, T.M.: Zero-shot learning with semantic output codes. NeurIPS (2009)"},{"key":"20_CR26","unstructured":"Parascandolo, G., Neitz, A., Orvieto, A., Gresele, L., Sch\u00f6lkopf, B.: Learning explanations that are hard to vary. arXiv preprint arXiv:2009.00329 (2020)"},{"key":"20_CR27","unstructured":"Peng, X., Huang, Z., Sun, X., Saenko, K.: Domain agnostic learning with disentangled representations. In: ICML, pp. 5102\u20135112 (2019)"},{"key":"20_CR28","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C.D.: Glove: global vectors for word representation. In: EMNLP, pp. 1532\u20131543 (2014)","DOI":"10.3115\/v1\/D14-1162"},{"key":"20_CR29","doi-asserted-by":"crossref","unstructured":"Purushwalkam, S., Nickel, M., Gupta, A., Ranzato, M.: Task-driven modular networks for zero-shot compositional learning. In: ICCV (2019)","DOI":"10.1109\/ICCV.2019.00369"},{"key":"20_CR30","doi-asserted-by":"crossref","unstructured":"Qiao, F., Zhao, L., Peng, X.: Learning to learn single domain generalization. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.01257"},{"key":"20_CR31","doi-asserted-by":"crossref","unstructured":"Qui\u00f1onero-Candela, J., Sugiyama, M., Schwaighofer, A., Lawrence, N.D.: Dataset Shift in Machine Learning. MIT Press (2008)","DOI":"10.7551\/mitpress\/9780262170055.001.0001"},{"issue":"2","key":"20_CR32","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1111\/rssb.12398","volume":"83","author":"D Rothenh\u00e4usler","year":"2021","unstructured":"Rothenh\u00e4usler, D., Meinshausen, N., B\u00fchlmann, P., Peters, J.: Anchor regression: heterogeneous data meet causality. J. Royal Stat. Soc.: Ser. B (Stat. Methodol.) 83(2), 215\u2013246 (2021)","journal-title":"J. Royal Stat. Soc.: Ser. B (Stat. Methodol.)"},{"key":"20_CR33","unstructured":"Shahtalebi, S., Gagnon-Audet, J.C., Laleh, T., Faramarzi, M., Ahuja, K., Rish, I.: Sand-mask: an enhanced gradient masking strategy for the discovery of invariances in domain generalization. arXiv preprint arXiv:2106.02266 (2021)"},{"key":"20_CR34","unstructured":"Shankar, S., Piratla, V., Chakrabarti, S., Chaudhuri, S., Jyothi, P., Sarawagi, S.: Generalizing across domains via cross-gradient training. arXiv preprint arXiv:1804.10745 (2018)"},{"key":"20_CR35","unstructured":"Shi, Y., et al.: Gradient matching for domain generalization. arXiv preprint arXiv:2104.09937 (2021)"},{"key":"20_CR36","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1007\/978-3-319-49409-8_35","volume-title":"Computer Vision \u2013 ECCV 2016 Workshops","author":"B Sun","year":"2016","unstructured":"Sun, B., Saenko, K.: Deep CORAL: correlation alignment for deep domain adaptation. In: Hua, G., J\u00e9gou, H. (eds.) ECCV 2016. LNCS, vol. 9915, pp. 443\u2013450. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-49409-8_35"},{"key":"20_CR37","unstructured":"Tolstikhin, I., Bousquet, O., Gelly, S., Schoelkopf, B.: Wasserstein auto-encoders. arXiv preprint arXiv:1711.01558 (2017)"},{"key":"20_CR38","doi-asserted-by":"crossref","unstructured":"Wang, J., Lan, C., Liu, C., Ouyang, Y., Zeng, W., Qin, T.: Generalizing to unseen domains: a survey on domain generalization. arXiv preprint arXiv:2103.03097 (2021)","DOI":"10.24963\/ijcai.2021\/628"},{"key":"20_CR39","doi-asserted-by":"crossref","unstructured":"Wei, K., Yang, M., Wang, H., Deng, C., Liu, X.: Adversarial fine-grained composition learning for unseen attribute-object recognition. In: ICCV, pp. 3741\u20133749 (2019)","DOI":"10.1109\/ICCV.2019.00384"},{"key":"20_CR40","doi-asserted-by":"crossref","unstructured":"Xian, Y., Lorenz, T., Schiele, B., Akata, Z.: Feature generating networks for zero-shot learning. In: CVPR, pp. 5542\u20135551 (2018)","DOI":"10.1109\/CVPR.2018.00581"},{"key":"20_CR41","doi-asserted-by":"crossref","unstructured":"Xian, Y., Schiele, B., Akata, Z.: Zero-shot learning-the good, the bad and the ugly. In: CVPR, pp. 4582\u20134591 (2017)","DOI":"10.1109\/CVPR.2017.328"},{"key":"20_CR42","doi-asserted-by":"crossref","unstructured":"Yu, A., Grauman, K.: Fine-grained visual comparisons with local learning. In: CVPR, pp. 192\u2013199 (2014)","DOI":"10.1109\/CVPR.2014.32"},{"key":"20_CR43","doi-asserted-by":"crossref","unstructured":"Zhang, H., Zhang, Y.F., Liu, W., Weller, A., Sch\u00f6lkopf, B., Xing, E.P.: Towards principled disentanglement for domain generalization. arXiv preprint arXiv:2111.13839 (2021)","DOI":"10.1109\/CVPR52688.2022.00786"},{"key":"20_CR44","unstructured":"Zhang, H., Cisse, M., Dauphin, Y.N., Lopez-Paz, D.: mixup: beyond empirical risk minimization. arXiv preprint arXiv:1710.09412 (2017)"},{"key":"20_CR45","doi-asserted-by":"crossref","unstructured":"Zhou, K., Liu, Z., Qiao, Y., Xiang, T., Change Loy, C.: Domain generalization: a survey. arXiv preprint arXiv:2103.02503 (2021)","DOI":"10.1109\/TPAMI.2022.3195549"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2022"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-20053-3_20","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,5]],"date-time":"2022-11-05T16:27:32Z","timestamp":1667665652000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-20053-3_20"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031200526","9783031200533"],"references-count":45,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-20053-3_20","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"6 November 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Tel Aviv","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Israel","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 October 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 October 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2022.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5804","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1645","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"28% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.21","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.91","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}