{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,7]],"date-time":"2026-01-07T07:48:31Z","timestamp":1767772111297,"version":"3.37.3"},"reference-count":120,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2024,4,27]],"date-time":"2024-04-27T00:00:00Z","timestamp":1714176000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,4,27]],"date-time":"2024-04-27T00:00:00Z","timestamp":1714176000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2024,9]]},"DOI":"10.1007\/s11263-024-02041-7","type":"journal-article","created":{"date-parts":[[2024,4,27]],"date-time":"2024-04-27T10:01:22Z","timestamp":1714212082000},"page":"3954-3976","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Domain-Agnostic Priors for Semantic Segmentation Under Unsupervised Domain Adaptation and Domain Generalization"],"prefix":"10.1007","volume":"132","author":[{"given":"Xinyue","family":"Huo","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4831-9451","authenticated-orcid":false,"given":"Lingxi","family":"Xie","sequence":"additional","affiliation":[]},{"given":"Hengtong","family":"Hu","sequence":"additional","affiliation":[]},{"given":"Wengang","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"Houqiang","family":"Li","sequence":"additional","affiliation":[]},{"given":"Qi","family":"Tian","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,4,27]]},"reference":[{"doi-asserted-by":"crossref","unstructured":"Akuzawa, K., Iwasawa, Y., & Matsuo, Y. (2019). Adversarial invariant feature learning with accuracy constraint for domain generalization. In Joint European conference on machine learning and knowledge discovery in databases, Springer, pp 315\u2013331.","key":"2041_CR1","DOI":"10.1007\/978-3-030-46147-8_19"},{"unstructured":"Balaji, Y., Sankaranarayanan, S., & Chellappa, R. (2018). Metareg: Towards domain generalization using meta-regularization. Advances in neural information processing systems, 31.","key":"2041_CR2"},{"unstructured":"Ben-David, E., Oved, N., & Reichart, R. (2021). Pada: A prompt-based autoregressive approach for adaptation to unseen domains. arXiv preprint arXiv:2102.12206","key":"2041_CR3"},{"issue":"1","key":"2041_CR4","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1007\/s10994-009-5152-4","volume":"79","author":"S Ben-David","year":"2010","unstructured":"Ben-David, S., Blitzer, J., Crammer, K., et al. (2010). A theory of learning from different domains. Machine Learning, 79(1), 151\u2013175.","journal-title":"Machine Learning"},{"unstructured":"Blanchard, G., Lee, G., & Scott, C. (2011). Generalizing from several related classification tasks to a new unlabeled sample. Advances in Neural Information Processing Systems,24.","key":"2041_CR5"},{"doi-asserted-by":"crossref","unstructured":"Bousmalis, K., Silberman, N., Dohan, D., et al. (2017). Unsupervised pixel-level domain adaptation with generative adversarial networks. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3722\u20133731.","key":"2041_CR6","DOI":"10.1109\/CVPR.2017.18"},{"key":"2041_CR7","first-page":"468","volume":"32","author":"M Bucher","year":"2019","unstructured":"Bucher, M., Vu, T. H., Cord, M., et al. (2019). Zero-shot semantic segmentation. Advances in Neural Information Processing Systems, 32, 468\u2013479.","journal-title":"Advances in Neural Information Processing Systems"},{"doi-asserted-by":"crossref","unstructured":"Chao, C. H., Cheng, B. W., & Lee, C. Y. (2021). Rethinking ensemble-distillation for semantic segmentation based unsupervised domain adaption. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2610\u20132620.","key":"2041_CR8","DOI":"10.1109\/CVPRW53098.2021.00295"},{"doi-asserted-by":"crossref","unstructured":"Chen, C., Xie, W., Huang, W., et\u00a0al. (2019a). Progressive feature alignment for unsupervised domain adaptation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 627\u2013636.","key":"2041_CR9","DOI":"10.1109\/CVPR.2019.00072"},{"issue":"4","key":"2041_CR10","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"LC Chen","year":"2017","unstructured":"Chen, L. C., Papandreou, G., Kokkinos, I., et al. (2017). Deeplab: Semantic image segmentation with deep convolutional nets, Atrous convolution, and fully connected CRFS. IEEE Transactions on Pattern Analysis and Machine Intelligence, 40(4), 834\u2013848.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"doi-asserted-by":"crossref","unstructured":"Chen, L. C., Zhu, Y., Papandreou, G., et\u00a0al. (2018a). Encoder-decoder with atrous separable convolution for semantic image segmentation. In Proceedings of the European conference on computer vision (ECCV), pp. 801\u2013818.","key":"2041_CR11","DOI":"10.1007\/978-3-030-01234-2_49"},{"doi-asserted-by":"crossref","unstructured":"Chen, M., Xue, H., & Cai, D. (2019b). Domain adaptation for semantic segmentation with maximum squares loss. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 2090\u20132099.","key":"2041_CR12","DOI":"10.1109\/ICCV.2019.00218"},{"doi-asserted-by":"crossref","unstructured":"Chen, Y., Li, W., Sakaridis, C., et\u00a0al. (2018b). Domain adaptive faster R-CNN for object detection in the wild. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3339\u20133348.","key":"2041_CR13","DOI":"10.1109\/CVPR.2018.00352"},{"doi-asserted-by":"crossref","unstructured":"Cheng, Y., Wei, F., Bao, J., et\u00a0al. (2021). Dual path learning for domain adaptation of semantic segmentation. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 9082\u20139091.","key":"2041_CR14","DOI":"10.1109\/ICCV48922.2021.00895"},{"doi-asserted-by":"crossref","unstructured":"Choi, S., Jung, S., Yun, H., et\u00a0al. (2021). Robustnet: Improving domain generalization in urban-scene segmentation via instance selective whitening. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 11580\u201311590.","key":"2041_CR15","DOI":"10.1109\/CVPR46437.2021.01141"},{"doi-asserted-by":"crossref","unstructured":"Cordts, M., Omran, M., Ramos, S., et\u00a0al. (2016). The cityscapes dataset for semantic urban scene understanding. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3213\u20133223.","key":"2041_CR16","DOI":"10.1109\/CVPR.2016.350"},{"doi-asserted-by":"crossref","unstructured":"Csurka, G. (2017). Domain adaptation for visual applications: A comprehensive survey. arXiv preprint arXiv:1702.05374.","key":"2041_CR17","DOI":"10.1007\/978-3-319-58347-1"},{"doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., et\u00a0al. (2009). Imagenet: A large-scale hierarchical image database. In 2009 IEEE conference on computer vision and pattern recognition, IEEE, pp. 248\u2013255.","key":"2041_CR18","DOI":"10.1109\/CVPR.2009.5206848"},{"unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., et\u00a0al. (2020). An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929.","key":"2041_CR19"},{"unstructured":"Dou, Q., Coelho de Castro, D., Kamnitsas, K., et al. (2019). Domain generalization via model-agnostic learning of semantic features. Advances in Neural Information Processing Systems, 32.","key":"2041_CR20"},{"doi-asserted-by":"crossref","unstructured":"Feng, F., Wang, X., & Li, R. (2014). Cross-modal retrieval with correspondence autoencoder. In Proceedings of the 22nd ACM international conference on multimedia, pp. 7\u201316.","key":"2041_CR21","DOI":"10.1145\/2647868.2654902"},{"doi-asserted-by":"crossref","unstructured":"Fu, Y., Wei, Y., Wang, G., et\u00a0al. (2019) Self-similarity grouping: A simple unsupervised cross domain adaptation approach for person re-identification. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 6112\u20136121.","key":"2041_CR22","DOI":"10.1109\/ICCV.2019.00621"},{"doi-asserted-by":"crossref","unstructured":"Gan, C., Yang, T., & Gong, B. (2016). Learning attributes equals multi-source domain generalization. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 87\u201397.","key":"2041_CR23","DOI":"10.1109\/CVPR.2016.17"},{"unstructured":"Ganin, Y., & Lempitsky, V. (2015). Unsupervised domain adaptation by backpropagation. In International conference on machine learning, PMLR, pp. 1180\u20131189.","key":"2041_CR24"},{"doi-asserted-by":"crossref","unstructured":"Gao, H., Guo, J., Wang, G., et\u00a0al. (2022). Cross-domain correlation distillation for unsupervised domain adaptation in nighttime semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 9913\u20139923.","key":"2041_CR25","DOI":"10.1109\/CVPR52688.2022.00968"},{"doi-asserted-by":"crossref","unstructured":"Gao, L., Zhang, J., Zhang, L., et\u00a0al. (2021). Dsp: Dual soft-paste for unsupervised domain adaptive semantic segmentation. arXiv preprint arXiv:2107.09600.","key":"2041_CR26","DOI":"10.1145\/3474085.3475186"},{"doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., et\u00a0al. (2014). Rich feature hierarchies for accurate object detection and semantic segmentation. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 580\u2013587.","key":"2041_CR27","DOI":"10.1109\/CVPR.2014.81"},{"issue":"1","key":"2041_CR28","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/s11263-014-0718-4","volume":"109","author":"B Gong","year":"2014","unstructured":"Gong, B., Grauman, K., & Sha, F. (2014). Learning kernels for unsupervised domain adaptation with applications to visual object recognition. International Journal of Computer Vision, 109(1), 3\u201327.","journal-title":"International Journal of Computer Vision"},{"doi-asserted-by":"crossref","unstructured":"Gong, R., Li. W., Chen, Y., et\u00a0al. (2019). Dlow: Domain flow for adaptation and generalization. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2477\u20132486.","key":"2041_CR29","DOI":"10.1109\/CVPR.2019.00258"},{"doi-asserted-by":"crossref","unstructured":"Guo, X., Yang, C., Li, B., et\u00a0al. (2021). Metacorrection: Domain-aware meta loss correction for unsupervised domain adaptation in semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3927\u20133936.","key":"2041_CR30","DOI":"10.1109\/CVPR46437.2021.00392"},{"doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., et\u00a0al. (2016). Deep residual learning for image recognition. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 770\u2013778.","key":"2041_CR31","DOI":"10.1109\/CVPR.2016.90"},{"issue":"1","key":"2041_CR32","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1007\/s11263-014-0719-3","volume":"109","author":"J Hoffman","year":"2014","unstructured":"Hoffman, J., Rodner, E., Donahue, J., et al. (2014). Asymmetric and category invariant feature transformations for domain adaptation. International Journal of Computer Vision, 109(1), 28\u201341.","journal-title":"International Journal of Computer Vision"},{"unstructured":"Hoffman, J., Tzeng, E., Park, T., et\u00a0al. (2018). Cycada: Cycle-consistent adversarial domain adaptation. In International conference on machine learning, PMLR, pp. 1989\u20131998.","key":"2041_CR33"},{"doi-asserted-by":"crossref","unstructured":"Hoyer, L., Dai, D., & Van\u00a0Gool, L. (2022). Daformer: Improving network architectures and training strategies for domain-adaptive semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition.","key":"2041_CR34","DOI":"10.1109\/CVPR52688.2022.00969"},{"doi-asserted-by":"crossref","unstructured":"Hu, H., Hong, R., Fu, W., et\u00a0al. (2019). Efficient graph based multi-view learning. In MultiMedia modeling: 25th international conference, MMM 2019, Thessaloniki, Greece, January 8\u201311, 2019, Proceedings, Part I 25, (pp. 691\u2013703), Springer.","key":"2041_CR35","DOI":"10.1007\/978-3-030-05710-7_57"},{"key":"2041_CR36","first-page":"501","volume":"33","author":"H Hu","year":"2020","unstructured":"Hu, H., Xie, L., Du, Z., et al. (2020). One-bit supervision for image classification. Advances in Neural Information Processing Systems, 33, 501\u2013511.","journal-title":"Advances in Neural Information Processing Systems"},{"doi-asserted-by":"crossref","unstructured":"Hu, H., Xie, L., Hong, R., et\u00a0al. (2020b). Creating something from nothing: Unsupervised knowledge distillation for cross-modal hashing. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3123\u20133132.","key":"2041_CR37","DOI":"10.1109\/CVPR42600.2020.00319"},{"doi-asserted-by":"crossref","unstructured":"Hu, H., Xie, L., Huo, X., et\u00a0al. (2022). Vibration-based uncertainty estimation for learning from limited supervision. In European conference on computer vision, (pp. 160\u2013176), Springer.","key":"2041_CR38","DOI":"10.1007\/978-3-031-20056-4_10"},{"doi-asserted-by":"crossref","unstructured":"Hu, H., Xie, L., Huo, X., et\u00a0al. (2023). One-bit supervision for image classification: Problem, solution, and beyond. ACM Transactions on Multimedia Computing, Communications and Applications.","key":"2041_CR39","DOI":"10.1145\/3633779"},{"doi-asserted-by":"crossref","unstructured":"Huang, L., Zhou, Y., Zhu, F., et\u00a0al. (2019). Iterative normalization: Beyond standardization towards efficient whitening. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 4874\u20134883.","key":"2041_CR40","DOI":"10.1109\/CVPR.2019.00501"},{"issue":"7","key":"2041_CR41","doi-asserted-by":"publisher","first-page":"2244","DOI":"10.1007\/s11263-021-01474-8","volume":"129","author":"Y Huang","year":"2021","unstructured":"Huang, Y., Wu, Q., Xu, J., et al. (2021). Unsupervised domain adaptation with background shift mitigating for person re-identification. International Journal of Computer Vision, 129(7), 2244\u20132263.","journal-title":"International Journal of Computer Vision"},{"doi-asserted-by":"crossref","unstructured":"Huo, X., Xie, L., He, J., et\u00a0al. (2021). Atso: Asynchronous teacher-student optimization for semi-supervised image segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 1235\u20131244.","key":"2041_CR42","DOI":"10.1109\/CVPR46437.2021.00129"},{"doi-asserted-by":"crossref","unstructured":"Huo, X., Xie, L., Hu, H., et\u00a0al. (2022). Domain-agnostic prior for transfer semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 7075\u20137085.","key":"2041_CR43","DOI":"10.1109\/CVPR52688.2022.00694"},{"doi-asserted-by":"crossref","unstructured":"Huo, X., Xie, L., Zhou, W., et\u00a0al. (2023). Focus on your target: A dual teacher-student framework for domain-adaptive semantic segmentation. arXiv preprint arXiv:2303.09083.","key":"2041_CR44","DOI":"10.1109\/ICCV51070.2023.01744"},{"unstructured":"Jia, C., Yang, Y., Xia, Y., et\u00a0al. (2021). Scaling up visual and vision-language representation learning with noisy text supervision. arXiv preprint arXiv:2102.05918.","key":"2041_CR45"},{"doi-asserted-by":"crossref","unstructured":"Kamath, A., Singh, M., LeCun, Y., et\u00a0al. (2021). Mdetr-modulated detection for end-to-end multi-modal understanding. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 1780\u20131790.","key":"2041_CR46","DOI":"10.1109\/ICCV48922.2021.00180"},{"doi-asserted-by":"crossref","unstructured":"Kim, M., & Byun, H. (2020). Learning texture invariant representation for domain adaptation of semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12975\u201312984.","key":"2041_CR47","DOI":"10.1109\/CVPR42600.2020.01299"},{"unstructured":"Larochelle, H., Erhan, D., & Bengio, Y. (2008). Zero-data learning of new tasks. In AAAI, p.\u00a03.","key":"2041_CR48"},{"unstructured":"Lee, D. H., et\u00a0al. (2013). Pseudo-label: The simple and efficient semi-supervised learning method for deep neural networks. In Workshop on challenges in representation learning, ICML, p. 896.","key":"2041_CR49"},{"doi-asserted-by":"crossref","unstructured":"Li, D., Yang, Y., Song, Y. Z., et\u00a0al. (2017a). Deeper, broader and artier domain generalization. In Proceedings of the IEEE international conference on computer vision, pp. 5542\u20135550.","key":"2041_CR50","DOI":"10.1109\/ICCV.2017.591"},{"doi-asserted-by":"crossref","unstructured":"Li, D., Zhang, J., Yang, Y., et\u00a0al. (2019a). Episodic training for domain generalization. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 1446\u20131455.","key":"2041_CR51","DOI":"10.1109\/ICCV.2019.00153"},{"doi-asserted-by":"crossref","unstructured":"Li, H., Pan, S. J., Wang, S., et\u00a0al. (2018). Domain generalization with adversarial feature learning. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 5400\u20135409.","key":"2041_CR52","DOI":"10.1109\/CVPR.2018.00566"},{"key":"2041_CR53","first-page":"10,276","volume":"32","author":"X Li","year":"2019","unstructured":"Li, X., Sun, Q., Liu, Y., et al. (2019). Learning to self-train for semi-supervised few-shot classification. Advances in Neural Information Processing Systems, 32, 10,276-10,286.","journal-title":"Advances in Neural Information Processing Systems"},{"doi-asserted-by":"crossref","unstructured":"Li, X., Yin, X., Li, C., et\u00a0al. (2020). Oscar: Object-semantics aligned pre-training for vision-language tasks. In European conference on computer vision, (pp. 121\u2013137), Springer.","key":"2041_CR54","DOI":"10.1007\/978-3-030-58577-8_8"},{"unstructured":"Li, Y., Fang, C., Yang, J., et\u00a0al. (2017b). Universal style transfer via feature transforms. Advances in Neural Information Processing Systems, 30.","key":"2041_CR55"},{"doi-asserted-by":"crossref","unstructured":"Lin, T. Y., Maire, M., Belongie, S., et\u00a0al. (2014). Microsoft coco: Common objects in context. In European conference on computer vision, (pp 740\u2013755), Springer.","key":"2041_CR56","DOI":"10.1007\/978-3-319-10602-1_48"},{"doi-asserted-by":"crossref","unstructured":"Liu, J., Song, L., & Qin, Y. (2020). Prototype rectification for few-shot learning. In Computer vision\u2013ECCV 2020: 16th European conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part I 16, (pp. 741\u2013756), Springer.","key":"2041_CR57","DOI":"10.1007\/978-3-030-58452-8_43"},{"unstructured":"Long, M., Cao, Y., Wang, J., et\u00a0al. (2015). Learning transferable features with deep adaptation networks. In International conference on machine learning, PMLR, pp. 97\u2013105.","key":"2041_CR58"},{"doi-asserted-by":"crossref","unstructured":"Lv, F., Liang, T., Chen, X., et\u00a0al. (2020). Cross-domain semantic segmentation via domain-invariant interactive relation transfer. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 4334\u20134343.","key":"2041_CR59","DOI":"10.1109\/CVPR42600.2020.00439"},{"doi-asserted-by":"crossref","unstructured":"Ma, N., Zhang, X., Zheng, H. T., et\u00a0al. (2018). Shufflenet v2: Practical guidelines for efficient CNN architecture design. In Proceedings of the European conference on computer vision (ECCV), pp. 116\u2013131.","key":"2041_CR60","DOI":"10.1007\/978-3-030-01264-9_8"},{"doi-asserted-by":"crossref","unstructured":"Mei, K., Zhu, C., Zou, J., et\u00a0al. (2020). Instance adaptive self-training for unsupervised domain adaptation. In Computer vision\u2013ECCV 2020: 16th European conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XXVI 16, (pp. 415\u2013430), Springer.","key":"2041_CR61","DOI":"10.1007\/978-3-030-58574-7_25"},{"unstructured":"Mikolov, T., Sutskever, I., Chen, K., et\u00a0al. (2013). Distributed representations of words and phrases and their compositionality. In Advances in Neural Information Processing Systems, pp. 3111\u20133119.","key":"2041_CR62"},{"issue":"1","key":"2041_CR63","doi-asserted-by":"publisher","first-page":"521","DOI":"10.1016\/j.patcog.2011.06.019","volume":"45","author":"JG Moreno-Torres","year":"2012","unstructured":"Moreno-Torres, J. G., Raeder, T., Alaiz-Rodr\u00edguez, R., et al. (2012). A unifying view on dataset shift in classification. Pattern Recognition, 45(1), 521\u2013530.","journal-title":"Pattern Recognition"},{"doi-asserted-by":"crossref","unstructured":"Mottaghi, R., Chen, X., Liu, X., et\u00a0al. (2014). The role of context for object detection and semantic segmentation in the wild. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 891\u2013898.","key":"2041_CR64","DOI":"10.1109\/CVPR.2014.119"},{"unstructured":"Muandet, K., Balduzzi, D., & Sch\u00f6lkopf, B. (2013). Domain generalization via invariant feature representation. In International conference on machine learning, PMLR, pp. 10\u201318.","key":"2041_CR65"},{"doi-asserted-by":"crossref","unstructured":"Neuhold, G., Ollmann, T., Rota\u00a0Bulo, S., et\u00a0al, (2017). The mapillary vistas dataset for semantic understanding of street scenes. In Proceedings of the IEEE international conference on computer vision, pp. 4990\u20134999.","key":"2041_CR66","DOI":"10.1109\/ICCV.2017.534"},{"doi-asserted-by":"crossref","unstructured":"Olsson, V., Tranheden, W., Pinto, J., et\u00a0al. (2021). Classmix: Segmentation-based data augmentation for semi-supervised learning. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp. 1369\u20131378.","key":"2041_CR67","DOI":"10.1109\/WACV48630.2021.00141"},{"doi-asserted-by":"crossref","unstructured":"Pan, X., Luo, P., Shi, J., et\u00a0al. (2018). Two at once: Enhancing learning and generalization capacities via ibn-net. In Proceedings of the European conference on computer vision (ECCV), pp. 464\u2013479.","key":"2041_CR68","DOI":"10.1007\/978-3-030-01225-0_29"},{"doi-asserted-by":"crossref","unstructured":"Pan, X., Zhan, X., Shi, J., et\u00a0al. (2019). Switchable whitening for deep representation learning. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 1863\u20131871.","key":"2041_CR69","DOI":"10.1109\/ICCV.2019.00195"},{"key":"2041_CR70","doi-asserted-by":"publisher","first-page":"6594","DOI":"10.1109\/TIP.2021.3096334","volume":"30","author":"D Peng","year":"2021","unstructured":"Peng, D., Lei, Y., Liu, L., et al. (2021). Global and local texture randomization for synthetic-to-real semantic segmentation. IEEE Transactions on Image Processing, 30, 6594\u20136608.","journal-title":"IEEE Transactions on Image Processing"},{"doi-asserted-by":"crossref","unstructured":"Peng, D., Lei, Y., Hayat, M., et\u00a0al. (2022). Semantic-aware domain generalized segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2594\u20132605.","key":"2041_CR71","DOI":"10.1109\/CVPR52688.2022.00262"},{"doi-asserted-by":"crossref","unstructured":"Qiao, F., Zhao, L., & Peng, X. (2020). Learning to learn single domain generalization. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12556\u201312565.","key":"2041_CR72","DOI":"10.1109\/CVPR42600.2020.01257"},{"unstructured":"Radford, A., Kim, J.W., Hallacy, C., et\u00a0al. (2021). Learning transferable visual models from natural language supervision. arXiv preprint arXiv:2103.00020.","key":"2041_CR73"},{"doi-asserted-by":"crossref","unstructured":"Rao, Y., Zhao, W., Chen, G., et\u00a0al. (2022). Denseclip: Language-guided dense prediction with context-aware prompting. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 18082\u201318091.","key":"2041_CR74","DOI":"10.1109\/CVPR52688.2022.01755"},{"doi-asserted-by":"crossref","unstructured":"Richter, S. R., Vineet, V., Roth, S., et\u00a0al. (2016). Playing for data: Ground truth from computer games. In European conference on computer vision, (pp. 102\u2013118), Springer.","key":"2041_CR75","DOI":"10.1007\/978-3-319-46475-6_7"},{"doi-asserted-by":"crossref","unstructured":"Ros, G., Sellart, L., Materzynska, J., et\u00a0al. (2016). The synthia dataset: A large collection of synthetic images for semantic segmentation of urban scenes. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3234\u20133243.","key":"2041_CR76","DOI":"10.1109\/CVPR.2016.352"},{"doi-asserted-by":"crossref","unstructured":"Rosenberg, C., Hebert, M., & Schneiderman, H. (2005). Semi-supervised self-training of object detection models. Carnegie Mellon University.","key":"2041_CR77","DOI":"10.1109\/ACVMOT.2005.107"},{"doi-asserted-by":"crossref","unstructured":"Saito, K., Watanabe, K., Ushiku, Y., et\u00a0al. (2018). Maximum classifier discrepancy for unsupervised domain adaptation. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3723\u20133732.","key":"2041_CR78","DOI":"10.1109\/CVPR.2018.00392"},{"doi-asserted-by":"crossref","unstructured":"Sandler, M., Howard, A., Zhu, M., et\u00a0al. (2018). Mobilenetv2: Inverted residuals and linear bottlenecks. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 4510\u20134520.","key":"2041_CR79","DOI":"10.1109\/CVPR.2018.00474"},{"doi-asserted-by":"crossref","unstructured":"Saporta, A., Douillard, A., Vu, T. H., et\u00a0al. (2022). Multi-head distillation for continual unsupervised domain adaptation in semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 3751\u20133760.","key":"2041_CR80","DOI":"10.1109\/CVPRW56347.2022.00419"},{"doi-asserted-by":"crossref","unstructured":"Seo, S., Suh, Y., Kim, D., et\u00a0al. (2020). Learning to optimize domain specific normalization for domain generalization. In European conference on computer vision, (pp. 68\u201383), Springer.","key":"2041_CR81","DOI":"10.1007\/978-3-030-58542-6_5"},{"doi-asserted-by":"crossref","unstructured":"Sharma, P., Ding, N., Goodman, S., et\u00a0al. (2018). Conceptual captions: A cleaned, hypernymed, image alt-text dataset for automatic image captioning. In Proceedings of the 56th annual meeting of the association for computational linguistics (Volume 1: Long Papers), pp. 2556\u20132565.","key":"2041_CR82","DOI":"10.18653\/v1\/P18-1238"},{"doi-asserted-by":"crossref","unstructured":"Shin, I., Woo, S., Pan, F., et\u00a0al. (2020). Two-phase pseudo label densification for self-training based domain adaptation. In European conference on computer vision, (pp. 532\u2013548), Springer.","key":"2041_CR83","DOI":"10.1007\/978-3-030-58601-0_32"},{"issue":"2","key":"2041_CR84","doi-asserted-by":"publisher","first-page":"193","DOI":"10.1007\/s11263-016-0953-y","volume":"122","author":"VA Sindagi","year":"2017","unstructured":"Sindagi, V. A., & Srivastava, S. (2017). Domain adaptation for automatic OLED panel defect detection using adaptive support vector data description. International Journal of Computer Vision, 122(2), 193\u2013211.","journal-title":"International Journal of Computer Vision"},{"issue":"107","key":"2041_CR85","first-page":"173","volume":"102","author":"L Song","year":"2020","unstructured":"Song, L., Wang, C., Zhang, L., et al. (2020). Unsupervised domain adaptive re-identification: Theory and practice. Pattern Recognition, 102(107), 173.","journal-title":"Pattern Recognition"},{"key":"2041_CR86","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1016\/j.inffus.2014.12.003","volume":"24","author":"S Sun","year":"2015","unstructured":"Sun, S., Shi, H., & Wu, Y. (2015). A survey of multi-source domain adaptation. Information Fusion, 24, 84\u201392.","journal-title":"Information Fusion"},{"doi-asserted-by":"crossref","unstructured":"Tan, H., & Bansal, M. (2019). Lxmert: Learning cross-modality encoder representations from transformers. arXiv preprint arXiv:1908.07490.","key":"2041_CR87","DOI":"10.18653\/v1\/D19-1514"},{"unstructured":"Tarvainen, A., & Valpola, H. (2017). Mean teachers are better role models: Weight-averaged consistency targets improve semi-supervised deep learning results. arXiv preprint arXiv:1703.01780.","key":"2041_CR88"},{"doi-asserted-by":"crossref","unstructured":"Tobin, J., Fong, R., Ray, A., et\u00a0al. (2017). Domain randomization for transferring deep neural networks from simulation to the real world. In 2017 IEEE\/RSJ international conference on intelligent robots and systems (IROS), IEEE, pp. 23\u201330.","key":"2041_CR89","DOI":"10.1109\/IROS.2017.8202133"},{"issue":"2","key":"2041_CR90","doi-asserted-by":"publisher","first-page":"35","DOI":"10.3390\/technologies8020035","volume":"8","author":"M Toldo","year":"2020","unstructured":"Toldo, M., Maracani, A., Michieli, U., et al. (2020). Unsupervised domain adaptation in semantic segmentation: A review. Technologies, 8(2), 35.","journal-title":"Technologies"},{"doi-asserted-by":"crossref","unstructured":"Tranheden, W., Olsson, V., Pinto, J., et\u00a0al. (2021). Dacs: Domain adaptation via cross-domain mixed sampling. In Proceedings of the IEEE\/CVF winter conference on applications of computer vision, pp. 1379\u20131389.","key":"2041_CR91","DOI":"10.1109\/WACV48630.2021.00142"},{"doi-asserted-by":"crossref","unstructured":"Tsai, Y. H., Hung, W. C., Schulter, S., et\u00a0al. (2018). Learning to adapt structured output space for semantic segmentation. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 7472\u20137481.","key":"2041_CR92","DOI":"10.1109\/CVPR.2018.00780"},{"doi-asserted-by":"crossref","unstructured":"Tsai, Y. H., Sohn, K., Schulter, S., et\u00a0al. (2019). Domain adaptation for structured output via discriminative patch representations. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 1456\u20131465.","key":"2041_CR93","DOI":"10.1109\/ICCV.2019.00154"},{"doi-asserted-by":"crossref","unstructured":"Tzeng, E., Hoffman, J., Saenko, K., et\u00a0al. (2017). Adversarial discriminative domain adaptation. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 7167\u20137176.","key":"2041_CR94","DOI":"10.1109\/CVPR.2017.316"},{"unstructured":"Ulyanov, D., Vedaldi, A., & Lempitsky, V. (2016). Instance normalization: The missing ingredient for fast stylization. arXiv preprint arXiv:1607.08022.","key":"2041_CR95"},{"doi-asserted-by":"crossref","unstructured":"Ulyanov, D., Vedaldi, A., & Lempitsky, V. (2017). Improved texture networks: Maximizing quality and diversity in feed-forward stylization and texture synthesis. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 6924\u20136932.","key":"2041_CR96","DOI":"10.1109\/CVPR.2017.437"},{"unstructured":"Vaswani, A., Shazeer, N., Parmar, N., et\u00a0al. (2017). Attention is all you need. In Advances in neural information processing systems, pp. 5998\u20136008.","key":"2041_CR97"},{"doi-asserted-by":"crossref","unstructured":"Vu, T.H., Jain, H., Bucher, M., et\u00a0al. (2019). Advent: Adversarial entropy minimization for domain adaptation in semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2517\u20132526.","key":"2041_CR98","DOI":"10.1109\/CVPR.2019.00262"},{"doi-asserted-by":"crossref","unstructured":"Wang, B., Yang, Y., Xu, X., et\u00a0al. (2017). Adversarial cross-modal retrieval. In Proceedings of the 25th ACM international conference on multimedia, pp. 154\u2013162.","key":"2041_CR99","DOI":"10.1145\/3123266.3123326"},{"issue":"1","key":"2041_CR100","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40537-016-0043-6","volume":"3","author":"K Weiss","year":"2016","unstructured":"Weiss, K., Khoshgoftaar, T. M., & Wang, D. (2016). A survey of transfer learning. Journal of Big Data, 3(1), 1\u201340.","journal-title":"Journal of Big Data"},{"doi-asserted-by":"crossref","unstructured":"Yang, Y., & Soatto, S. (2020). Fda: Fourier domain adaptation for semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 4085\u20134095.","key":"2041_CR101","DOI":"10.1109\/CVPR42600.2020.00414"},{"unstructured":"Yosinski, J., Clune, J., Nguyen, A., et\u00a0al. (2015). Understanding neural networks through deep visualization. arXiv preprint arXiv:1506.06579.","key":"2041_CR102"},{"unstructured":"Yu, F., Xian, W., Chen, Y., et\u00a0al. (2018). Bdd100k: A diverse driving video database with scalable annotation tooling. 2(5), 6 arXiv preprint arXiv:1805.04687","key":"2041_CR103"},{"doi-asserted-by":"crossref","unstructured":"Yu, F., Chen, H., Wang, X., et\u00a0al. (2020). Bdd100k: A diverse driving dataset for heterogeneous multitask learning. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 2636\u20132645.","key":"2041_CR104","DOI":"10.1109\/CVPR42600.2020.00271"},{"doi-asserted-by":"crossref","unstructured":"Zeiler, M. D., & Fergus, R. (2014). Visualizing and understanding convolutional networks. In Computer vision\u2013ECCV 2014: 13th European conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part I 13, (pp. 818\u2013833), Springer.","key":"2041_CR105","DOI":"10.1007\/978-3-319-10590-1_53"},{"unstructured":"Zhang, H., Cisse, M., Dauphin, Y. N., et\u00a0al. (2017). Mixup: Beyond empirical risk minimization. arXiv preprint arXiv:1710.09412.","key":"2041_CR106"},{"doi-asserted-by":"crossref","unstructured":"Zhang, P., Zhang, B., Zhang, T., et\u00a0al. (2021). Prototypical pseudo label denoising and target structure learning for domain adaptive semantic segmentation. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12414\u201312424.","key":"2041_CR107","DOI":"10.1109\/CVPR46437.2021.01223"},{"doi-asserted-by":"crossref","unstructured":"Zhao, H., Puig, X., Zhou, B., et\u00a0al. (2017). Open vocabulary scene parsing. In Proceedings of the IEEE international conference on computer vision, pp. 2002\u20132010.","key":"2041_CR108","DOI":"10.1109\/ICCV.2017.221"},{"issue":"8","key":"2041_CR109","doi-asserted-by":"publisher","first-page":"2399","DOI":"10.1007\/s11263-021-01479-3","volume":"129","author":"S Zhao","year":"2021","unstructured":"Zhao, S., Li, B., Xu, P., et al. (2021). Madan: Multi-source adversarial domain aggregation network for domain adaptation. International Journal of Computer Vision, 129(8), 2399\u20132424.","journal-title":"International Journal of Computer Vision"},{"doi-asserted-by":"crossref","unstructured":"Zhao, Y., Zhong, Z., Yang, F., et\u00a0al. (2021b). Learning to generalize unseen domains via memory-based multi-source meta-learning for person re-identification. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 6277\u20136286.","key":"2041_CR110","DOI":"10.1109\/CVPR46437.2021.00621"},{"doi-asserted-by":"crossref","unstructured":"Zhao, Y., Zhong, Z., Zhao, N., et\u00a0al. (2022). Style-hallucinated dual consistency learning for domain generalized semantic segmentation. arXiv preprint arXiv:2204.02548.","key":"2041_CR111","DOI":"10.1007\/978-3-031-19815-1_31"},{"issue":"4","key":"2041_CR112","doi-asserted-by":"publisher","first-page":"1106","DOI":"10.1007\/s11263-020-01395-y","volume":"129","author":"Z Zheng","year":"2021","unstructured":"Zheng, Z., & Yang, Y. (2021). Rectifying pseudo label learning via uncertainty estimation for domain adaptive semantic segmentation. International Journal of Computer Vision, 129(4), 1106\u20131120.","journal-title":"International Journal of Computer Vision"},{"doi-asserted-by":"crossref","unstructured":"Zhou, K., Yang, Y., Hospedales, T., et\u00a0al. (2020a). Learning to generate novel domains for domain generalization. In European conference on computer vision, (pp. 561\u2013578), Springer.","key":"2041_CR113","DOI":"10.1007\/978-3-030-58517-4_33"},{"unstructured":"Zhou, K., Liu, Z., Qiao, Y., et\u00a0al. (2021a). Domain generalization in vision: A survey. arXiv preprint arXiv:2103.02503","key":"2041_CR114"},{"unstructured":"Zhou, Q., Feng, Z., Gu, Q., et\u00a0al. (2020b). Uncertainty-aware consistency regularization for cross-domain semantic segmentation. arXiv preprint arXiv:2004.08878","key":"2041_CR115"},{"unstructured":"Zhou, Q., Feng, Z., Gu, Q., et\u00a0al. (2021b). Context-aware mixup for domain adaptive semantic segmentation. arXiv preprint arXiv:2108.03557","key":"2041_CR116"},{"doi-asserted-by":"crossref","unstructured":"Zhu, J. Y., Park, T., Isola, P., et\u00a0al. (2017). Unpaired image-to-image translation using cycle-consistent adversarial networks. In Proceedings of the IEEE international conference on computer vision, pp. 2223\u20132232.","key":"2041_CR117","DOI":"10.1109\/ICCV.2017.244"},{"unstructured":"Zhu, X. J. (2005). Semi-supervised learning literature survey. University of Wisconsin-Madison Department of Computer Sciences.","key":"2041_CR118"},{"doi-asserted-by":"crossref","unstructured":"Zou, Y., Yu, Z., Kumar, B., et\u00a0al. (2018). Unsupervised domain adaptation for semantic segmentation via class-balanced self-training. In Proceedings of the European conference on computer vision (ECCV), pp. 289\u2013305.","key":"2041_CR119","DOI":"10.1007\/978-3-030-01219-9_18"},{"doi-asserted-by":"crossref","unstructured":"Zou, Y., Yu, Z., Liu, X., et\u00a0al. (2019). Confidence regularized self-training. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 5982\u20135991.","key":"2041_CR120","DOI":"10.1109\/ICCV.2019.00608"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-024-02041-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-024-02041-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-024-02041-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,27]],"date-time":"2024-08-27T07:41:11Z","timestamp":1724744471000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-024-02041-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,27]]},"references-count":120,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2024,9]]}},"alternative-id":["2041"],"URL":"https:\/\/doi.org\/10.1007\/s11263-024-02041-7","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"type":"print","value":"0920-5691"},{"type":"electronic","value":"1573-1405"}],"subject":[],"published":{"date-parts":[[2024,4,27]]},"assertion":[{"value":"1 December 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 February 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 April 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}