{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T04:38:16Z","timestamp":1764995896847,"version":"3.46.0"},"reference-count":72,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2025,9,27]],"date-time":"2025-09-27T00:00:00Z","timestamp":1758931200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,27]],"date-time":"2025-09-27T00:00:00Z","timestamp":1758931200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1007\/s11263-025-02568-3","type":"journal-article","created":{"date-parts":[[2025,9,27]],"date-time":"2025-09-27T15:45:24Z","timestamp":1758987924000},"page":"8526-8545","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Boosting Domain Generalization in Remote Sensing Image Segmentation via Style Mapping and General Prototypical Contrast"],"prefix":"10.1007","volume":"133","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9771-6229","authenticated-orcid":false,"given":"Yupei","family":"Wang","sequence":"first","affiliation":[]},{"given":"Xiaoxing","family":"Hu","sequence":"additional","affiliation":[]},{"given":"Yongkang","family":"Hu","sequence":"additional","affiliation":[]},{"given":"Zhuoran","family":"Sun","sequence":"additional","affiliation":[]},{"given":"Shanghang","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Liang","family":"Chen","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,9,27]]},"reference":[{"key":"2568_CR1","doi-asserted-by":"crossref","unstructured":"Ahn, W.-J., Yang, G.-Y., Choi, H.-D., & Lim, M.-T.(2024). Style blind domain generalized semantic segmentation via covariance alignment and semantic consistence contrastive learning. In: Proceedings of the Ieee\/cvf Conference on Computer Vision and Pattern Recognition, pp. 3616\u20133626","DOI":"10.1109\/CVPR52733.2024.00347"},{"key":"2568_CR2","doi-asserted-by":"crossref","unstructured":"Bi, Q., You, S., & Gevers, T.(2024). Generalized foggy-scene semantic segmentation by frequency decoupling. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1389\u20131399","DOI":"10.1109\/CVPRW63382.2024.00146"},{"key":"2568_CR3","doi-asserted-by":"crossref","unstructured":"Chattopadhyay, P., Sarangmath, K., Vijaykumar, V., & Hoffman, J.(2023). Pasta: Proportional amplitude spectrum training augmentation for syn-to-real domain generalization. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 19288\u201319300","DOI":"10.1109\/ICCV51070.2023.01767"},{"key":"2568_CR4","doi-asserted-by":"crossref","unstructured":"Chen, C., Xie, W., Huang, W., Rong, Y., Ding, X., Huang, Y., Xu, T., & Huang, J.(2019). Progressive feature alignment for unsupervised domain adaptation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 627\u2013636","DOI":"10.1109\/CVPR.2019.00072"},{"issue":"4","key":"2568_CR5","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"L-C Chen","year":"2017","unstructured":"Chen, L.-C., Papandreou, G., Kokkinos, I., Murphy, K., & Yuille, A. L. (2017). deeplab: Semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected crfs. IEEE transactions on pattern analysis and machine intelligence, 40(4), 834\u2013848.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2568_CR6","doi-asserted-by":"crossref","unstructured":"Cho, S., Shin, H., Hong, S., Arnab, A., Seo, P.H., & Kim, S.(2024). Cat-seg: Cost aggregation for open-vocabulary semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4113\u20134123","DOI":"10.1109\/CVPR52733.2024.00394"},{"key":"2568_CR7","doi-asserted-by":"crossref","unstructured":"Choi, S., Jung, S., Yun, H., Kim, J.T., Kim, S., & Choo, J.(2021). Robustnet: Improving domain generalization in urban-scene segmentation via instance selective whitening. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11580\u201311590","DOI":"10.1109\/CVPR46437.2021.01141"},{"key":"2568_CR8","unstructured":"Contributors, M.(2020). MMSegmentation: Openmmlab semantic segmentation toolbox and benchmark"},{"key":"2568_CR9","doi-asserted-by":"crossref","unstructured":"Ding, J., Xue, N., Xia, G.-S., & Dai, D.(2022). Decoupling zero-shot semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11583\u201311592","DOI":"10.1109\/CVPR52688.2022.01129"},{"key":"2568_CR10","doi-asserted-by":"crossref","unstructured":"Ding, J., Xue, N., Xia, G.-S., Schiele, B., & Dai, D.(2023). Hgformer: Hierarchical grouping transformer for domain generalized semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 15413\u201315423","DOI":"10.1109\/CVPR52729.2023.01479"},{"key":"2568_CR11","doi-asserted-by":"crossref","unstructured":"Fang, Y., Wang, W., Xie, B., Sun, Q., Wu, L., Wang, X., Huang, T., Wang, X., & Cao, Y.(2023). Eva: Exploring the limits of masked visual representation learning at scale. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 19358\u201319369","DOI":"10.1109\/CVPR52729.2023.01855"},{"key":"2568_CR12","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2024.105171","volume":"149","author":"Y Fang","year":"2024","unstructured":"Fang, Y., Sun, Q., Wang, X., Huang, T., Wang, X., & Cao, Y. (2024). Eva-02: A visual representation for neon genesis. Image and Vision Computing, 149, Article 105171.","journal-title":"Image and Vision Computing"},{"key":"2568_CR13","unstructured":"Ganin, Y., & Lempitsky, V.(2015). Unsupervised domain adaptation by backpropagation. In: International Conference on Machine Learning, pp. 1180\u20131189 . PMLR"},{"key":"2568_CR14","doi-asserted-by":"crossref","unstructured":"Ghiasi, G., Gu, X., Cui, Y., & Lin, T.-Y.(2022). Scaling open-vocabulary image segmentation with image-level labels. In: European Conference on Computer Vision, pp. 540\u2013557 . Springer","DOI":"10.1007\/978-3-031-20059-5_31"},{"key":"2568_CR15","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TGRS.2022.3230846","volume":"60","author":"X He","year":"2022","unstructured":"He, X., Zhou, Y., Zhao, J., Zhang, D., Yao, R., & Xue, Y. (2022). Swin transformer embedding unet for remote sensing image semantic segmentation. IEEE Transactions on Geoscience and Remote Sensing, 60, 1\u201315.","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"key":"2568_CR16","unstructured":"Hoffman, J., Tzeng, E., Park, T., Zhu, J.-Y., Isola, P., Saenko, K., Efros, A., & Darrell, T.(2018). Cycada: Cycle-consistent adversarial domain adaptation. In: International Conference on Machine Learning, pp. 1989\u20131998 . Pmlr"},{"key":"2568_CR17","unstructured":"Hoffman, J., Wang, D., Yu, F., & Darrell, T.(2016). Fcns in the wild: Pixel-level adversarial and constraint-based adaptation. arXiv preprint arXiv:1612.02649"},{"key":"2568_CR18","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2023.113856","volume":"299","author":"D Hong","year":"2023","unstructured":"Hong, D., Zhang, B., Li, H., Li, Y., Yao, J., Li, C., Werner, M., Chanussot, J., Zipf, A., & Zhu, X. X. (2023). Cross-city matters: A multimodal remote sensing benchmark dataset for cross-city semantic segmentation using high-resolution domain adaptation networks. Remote Sensing of Environment, 299, Article 113856.","journal-title":"Remote Sensing of Environment"},{"key":"2568_CR19","doi-asserted-by":"crossref","unstructured":"Huang, X., & Belongie, S.(2017). Arbitrary style transfer in real-time with adaptive instance normalization. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1501\u20131510","DOI":"10.1109\/ICCV.2017.167"},{"key":"2568_CR20","doi-asserted-by":"crossref","unstructured":"Huang, W., Chen, C., Li, Y., Li, J., Li, C., Song, F., Yan, Y., & Xiong, Z.(2023). Style projected clustering for domain generalized semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3061\u20133071","DOI":"10.1109\/CVPR52729.2023.00299"},{"key":"2568_CR21","doi-asserted-by":"crossref","unstructured":"Huang, J., Guan, D., Xiao, A., & Lu, S.(2021). Fsdr: Frequency space domain randomization for domain generalization. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6891\u20136902","DOI":"10.1109\/CVPR46437.2021.00682"},{"key":"2568_CR22","doi-asserted-by":"crossref","unstructured":"Iizuka, R., Xia, J., & Yokoya, N.(2023). Frequency-based optimal style mix for domain generalization in semantic segmentation of remote sensing images. IEEE Transactions on Geoscience and Remote Sensing","DOI":"10.1109\/TGRS.2023.3344670"},{"key":"2568_CR23","doi-asserted-by":"crossref","unstructured":"Jia, Y., Hoyer, L., Huang, S., Wang, T., Van\u00a0Gool, L., Schindler, K., & Obukhov, A.(2023). Dginstyle: Domain-generalizable semantic segmentation with image diffusion models and stylized semantic control. In: Synthetic Data for Computer Vision Workshop@ CVPR 2024","DOI":"10.1007\/978-3-031-72933-1_6"},{"key":"2568_CR24","doi-asserted-by":"crossref","unstructured":"Jiang, X., Huang, J., Jin, S., & Lu, S.(2023). Domain generalization via balancing training difficulty and model capability. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 18993\u201319003","DOI":"10.1109\/ICCV51070.2023.01741"},{"key":"2568_CR25","doi-asserted-by":"crossref","unstructured":"Jing, M., Zhen, X., Li, J., & Snoek, C.G.(2023) Order-preserving consistency regularization for domain adaptation and generalization. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 18916\u201318927","DOI":"10.1109\/ICCV51070.2023.01734"},{"key":"2568_CR26","doi-asserted-by":"crossref","unstructured":"Kim, S., Kim, D.-h., & Kim, H.(2023). Texture learning domain randomization for domain generalized segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 677\u2013687","DOI":"10.1109\/ICCV51070.2023.00069"},{"key":"2568_CR27","doi-asserted-by":"crossref","unstructured":"Lee, S., Seong, H., Lee, S., & Kim, E. (2022). Wildnet: Learning domain generalized semantic segmentation from the wild. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9936\u20139946","DOI":"10.1109\/CVPR52688.2022.00970"},{"key":"2568_CR28","unstructured":"Li, B., Weinberger, K.Q., Belongie, S., Koltun, V., & Ranftl, R.(2022). Language-driven semantic segmentation. arXiv preprint arXiv:2201.03546"},{"key":"2568_CR29","doi-asserted-by":"crossref","unstructured":"Li, Y., Yuan, L., & Vasconcelos, N.(2019). Bidirectional learning for domain adaptation of semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6936\u20136945","DOI":"10.1109\/CVPR.2019.00710"},{"key":"2568_CR30","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1016\/j.isprsjprs.2021.09.005","volume":"181","author":"R Li","year":"2021","unstructured":"Li, R., Zheng, S., Zhang, C., Duan, C., Wang, L., & Atkinson, P. M. (2021). Abcnet: Attentive bilateral contextual network for efficient semantic segmentation of fine-resolution remotely sensed imagery. ISPRS journal of photogrammetry and remote sensing, 181, 84\u201398.","journal-title":"ISPRS journal of photogrammetry and remote sensing"},{"key":"2568_CR31","doi-asserted-by":"crossref","unstructured":"Liang, C., Li, W., Dong, Y., & Fu, W(2024). Single domain generalization method for remote sensing image segmentation via category consistency on domain randomization. IEEE Transactions on Geoscience and Remote Sensing","DOI":"10.1109\/TGRS.2024.3379669"},{"key":"2568_CR32","doi-asserted-by":"crossref","unstructured":"Liang, F., Wu, B., Dai, X., Li, K., Zhao, Y., Zhang, H., Zhang, P., Vajda, P., & Marculescu, D.(2023). Open-vocabulary semantic segmentation with mask-adapted clip. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7061\u20137070","DOI":"10.1109\/CVPR52729.2023.00682"},{"key":"2568_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TGRS.2024.3379669","volume":"62","author":"C Liang","year":"2024","unstructured":"Liang, C., Li, W., Dong, Y., & Fu, W. (2024). Single domain generalization method for remote sensing image segmentation via category consistency on domain randomization. IEEE Transactions on Geoscience and Remote Sensing, 62, 1\u201316. https:\/\/doi.org\/10.1109\/TGRS.2024.3379669","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"key":"2568_CR34","doi-asserted-by":"crossref","unstructured":"Luo, Y., Liu, P., & Yang, Y.(2024). Kill two birds with one stone: Domain generalization for semantic segmentation via network pruning. International Journal of Computer Vision, 1\u201318","DOI":"10.1007\/s11263-024-02194-5"},{"key":"2568_CR35","unstructured":"Markus\u00a0Gerke, I.(2014). Use of the stair vision library within the isprs 2d semantic labeling benchmark (vaihingen). Use of the stair vision library within the isprs 2d semantic labeling benchmark (vaihingen)"},{"key":"2568_CR36","doi-asserted-by":"crossref","unstructured":"Mei, K., Zhu, C., Zou, J., & Zhang, S.(2020). Instance adaptive self-training for unsupervised domain adaptation. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XXVI 16, pp. 415\u2013430 . Springer","DOI":"10.1007\/978-3-030-58574-7_25"},{"key":"2568_CR37","doi-asserted-by":"crossref","unstructured":"Naeem, M.F., Khan, M.G.Z.A., Xian, Y., Afzal, M.Z., Stricker, D., Van\u00a0Gool, L., & Tombari, F.(2023a). I2mvformer: Large language model generated multi-view document supervision for zero-shot image classification. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 15169\u201315179","DOI":"10.1109\/CVPR52729.2023.01456"},{"key":"2568_CR38","doi-asserted-by":"crossref","unstructured":"Naeem, M.F., Xian, Y., Zhai, X., Hoyer, L., Van\u00a0Gool, L., & Tombari, F.(2023b). Silc: Improving vision language pretraining with self-distillation. arXiv preprint arXiv:2310.13355","DOI":"10.1007\/978-3-031-72664-4_3"},{"key":"2568_CR39","first-page":"12283","volume":"35","author":"MF Naeem","year":"2022","unstructured":"Naeem, M. F., Xian, Y., Gool, L. V., & Tombari, F. (2022). I2dformer: Learning image to document attention for zero-shot image classification. Advances in Neural Information Processing Systems, 35, 12283\u201312294.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2568_CR40","doi-asserted-by":"crossref","unstructured":"Pan, X., Luo, P., Shi, J., & Tang, X.(2018). Two at once: Enhancing learning and generalization capacities via ibn-net. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 464\u2013479","DOI":"10.1007\/978-3-030-01225-0_29"},{"key":"2568_CR41","doi-asserted-by":"crossref","unstructured":"Peng, D., Lei, Y., Hayat, M., Guo, Y., & Li, W.(2022) Semantic-aware domain generalized segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2594\u20132605","DOI":"10.1109\/CVPR52688.2022.00262"},{"key":"2568_CR42","doi-asserted-by":"publisher","first-page":"6594","DOI":"10.1109\/TIP.2021.3096334","volume":"30","author":"D Peng","year":"2021","unstructured":"Peng, D., Lei, Y., Liu, L., Zhang, P., & Liu, J. (2021). Global and local texture randomization for synthetic-to-real semantic segmentation. IEEE Transactions on Image Processing, 30, 6594\u20136608.","journal-title":"IEEE Transactions on Image Processing"},{"key":"2568_CR43","doi-asserted-by":"crossref","unstructured":"Qi, M., Li, W., Yang, Z., Wang, Y., & Luo, J.(2019). Attentive relational networks for mapping images to scene graphs. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3957\u20133966","DOI":"10.1109\/CVPR.2019.00408"},{"issue":"2","key":"2568_CR44","doi-asserted-by":"publisher","first-page":"549","DOI":"10.1109\/TCSVT.2019.2894161","volume":"30","author":"M Qi","year":"2019","unstructured":"Qi, M., Wang, Y., Qin, J., Li, A., Luo, J., & Van Gool, L. (2019). Stagnet: An attentive semantic rnn for group activity and individual action recognition. IEEE Transactions on Circuits and Systems for Video Technology, 30(2), 549\u2013565.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"key":"2568_CR45","doi-asserted-by":"publisher","first-page":"5420","DOI":"10.1109\/TIP.2020.2983567","volume":"29","author":"M Qi","year":"2020","unstructured":"Qi, M., Wang, Y., Li, A., & Luo, J. (2020). Stc-gan: Spatio-temporally coupled generative adversarial networks for predictive scene parsing. IEEE Transactions on Image Processing, 29, 5420\u20135430.","journal-title":"IEEE Transactions on Image Processing"},{"key":"2568_CR46","doi-asserted-by":"publisher","first-page":"2989","DOI":"10.1109\/TIP.2020.3048680","volume":"30","author":"M Qi","year":"2021","unstructured":"Qi, M., Qin, J., Yang, Y., Wang, Y., & Luo, J. (2021). Semantics-aware spatial-temporal binaries for cross-modal video retrieval. IEEE Transactions on Image Processing, 30, 2989\u20133004.","journal-title":"IEEE Transactions on Image Processing"},{"key":"2568_CR47","unstructured":"Radford, A., Kim, J.W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., & Clark, J., et al (2021). Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763 . PMLR"},{"issue":"18","key":"2568_CR48","doi-asserted-by":"publisher","first-page":"3715","DOI":"10.3390\/rs13183715","volume":"13","author":"H Shi","year":"2021","unstructured":"Shi, H., Fan, J., Wang, Y., & Chen, L. (2021). Dual attention feature fusion and adaptive context for accurate segmentation of very high-resolution remote sensing images. Remote Sensing, 13(18), 3715.","journal-title":"Remote Sensing"},{"issue":"2","key":"2568_CR49","doi-asserted-by":"publisher","first-page":"35","DOI":"10.3390\/technologies8020035","volume":"8","author":"M Toldo","year":"2020","unstructured":"Toldo, M., Maracani, A., Michieli, U., & Zanuttigh, P. (2020). Unsupervised domain adaptation in semantic segmentation: a review. Technologies, 8(2), 35.","journal-title":"Technologies"},{"key":"2568_CR50","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2019.111322","volume":"237","author":"X-Y Tong","year":"2020","unstructured":"Tong, X.-Y., Xia, G.-S., Lu, Q., Shen, H., Li, S., You, S., & Zhang, L. (2020). Land-cover classification with high-resolution remote sensing images using transferable deep models. Remote Sensing of Environment, 237, Article 111322.","journal-title":"Remote Sensing of Environment"},{"key":"2568_CR51","doi-asserted-by":"crossref","unstructured":"Tsai, Y.-H., Hung, W.-C., Schulter, S., Sohn, K., Yang, M.-H., & Chandraker, M.(2018). Learning to adapt structured output space for semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7472\u20137481","DOI":"10.1109\/CVPR.2018.00780"},{"key":"2568_CR52","doi-asserted-by":"crossref","unstructured":"Tsai, Y.-H., Sohn, K., Schulter, S., & Chandraker, M.(2019). Domain adaptation for structured output via discriminative patch representations. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 1456\u20131465","DOI":"10.1109\/ICCV.2019.00154"},{"key":"2568_CR53","unstructured":"Ulyanov, D.(2016). Instance normalization: The missing ingredient for fast stylization. arXiv preprint arXiv:1607.08022"},{"key":"2568_CR54","doi-asserted-by":"crossref","unstructured":"Vu, T.-H., Jain, H., Bucher, M., Cord, M., & P\u00e9rez, P.(2019). Advent: Adversarial entropy minimization for domain adaptation in semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2517\u20132526","DOI":"10.1109\/CVPR.2019.00262"},{"key":"2568_CR55","unstructured":"Wang, J., Zheng, Z., Ma, A., Lu, X., & Zhong, Y.(2021). Loveda: A remote sensing land-cover dataset for domain adaptive semantic segmentation. arXiv preprint arXiv:2110.08733"},{"key":"2568_CR56","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1016\/j.neucom.2018.05.083","volume":"312","author":"M Wang","year":"2018","unstructured":"Wang, M., & Deng, W. (2018). Deep visual domain adaptation: A survey. Neurocomputing, 312, 135\u2013153.","journal-title":"Neurocomputing"},{"key":"2568_CR57","first-page":"12077","volume":"34","author":"E Xie","year":"2021","unstructured":"Xie, E., Wang, W., Yu, Z., Anandkumar, A., Alvarez, J. M., & Luo, P. (2021). Segformer: Simple and efficient design for semantic segmentation with transformers. Advances in neural information processing systems, 34, 12077\u201312090.","journal-title":"Advances in neural information processing systems"},{"key":"2568_CR58","doi-asserted-by":"crossref","unstructured":"Xu, M., Zhang, Z., Wei, F., Hu, H., & Bai, X.(2023). Side adapter network for open-vocabulary semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2945\u20132954","DOI":"10.1109\/CVPR52729.2023.00288"},{"key":"2568_CR59","doi-asserted-by":"crossref","unstructured":"Xu, M., Zhang, Z., Wei, F., Lin, Y., Cao, Y., Hu, H., & Bai, X.(2022). A simple baseline for open-vocabulary semantic segmentation with pre-trained vision-language model. In: European Conference on Computer Vision, pp. 736\u2013753 . Springer","DOI":"10.1007\/978-3-031-19818-2_42"},{"key":"2568_CR60","doi-asserted-by":"crossref","unstructured":"Yang, J., Xu, R., Li, R., Qi, X., Shen, X., Li, G., & Lin, L.(2020). An adversarial perturbation oriented domain adaptation approach for semantic segmentation. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 34, pp. 12613\u201312620","DOI":"10.1609\/aaai.v34i07.6952"},{"key":"2568_CR61","doi-asserted-by":"crossref","unstructured":"Zang, Q., Wang, S., Zhao, D., Zhong, Z., Hou, B., & Jiao, L.(2024). Joint style and layout synthesizing: Toward generalizable remote sensing semantic segmentation. IEEE Transactions on Circuits and Systems for Video Technology","DOI":"10.1109\/TCSVT.2024.3522936"},{"key":"2568_CR62","unstructured":"Zhang, Q., Zhang, J., Liu, W., & Tao, D.(2019). Category anchor-guided unsupervised domain adaptation for semantic segmentation. Advances in neural information processing systems 32"},{"key":"2568_CR63","doi-asserted-by":"publisher","first-page":"693","DOI":"10.1007\/s11119-012-9274-5","volume":"13","author":"C Zhang","year":"2012","unstructured":"Zhang, C., & Kovacs, J. M. (2012). The application of small unmanned aerial systems for precision agriculture: a review. Precision agriculture, 13, 693\u2013712.","journal-title":"Precision agriculture"},{"key":"2568_CR64","unstructured":"Zhao, S., Li, B., Yue, X., Gu, Y., Xu, P., Hu, R., Chai, H., & Keutzer, K.(2019). Multi-source domain adaptation for semantic segmentation. Advances in neural information processing systems 32"},{"key":"2568_CR65","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Zhong, Z., Zhao, N., Sebe, N., & Lee, G.H.(2022). Style-hallucinated dual consistency learning for domain generalized semantic segmentation. In: European Conference on Computer Vision, pp. 535\u2013552 . Springer","DOI":"10.1007\/978-3-031-19815-1_31"},{"key":"2568_CR66","first-page":"338","volume":"35","author":"Z Zhong","year":"2022","unstructured":"Zhong, Z., Zhao, Y., Lee, G. H., & Sebe, N. (2022). Adversarial style augmentation for domain generalized urban-scene segmentation. Advances in neural information processing systems, 35, 338\u2013350.","journal-title":"Advances in neural information processing systems"},{"key":"2568_CR67","first-page":"338","volume":"35","author":"Z Zhong","year":"2022","unstructured":"Zhong, Z., Zhao, Y., Lee, G. H., & Sebe, N. (2022). Adversarial style augmentation for domain generalized urban-scene segmentation. Advances in neural information processing systems, 35, 338\u2013350.","journal-title":"Advances in neural information processing systems"},{"key":"2568_CR68","doi-asserted-by":"crossref","unstructured":"Zhou, C., Loy, C.C., & Dai, B.(2022). Extract free dense labels from clip. In: European Conference on Computer Vision, pp. 696\u2013712 . Springer","DOI":"10.1007\/978-3-031-19815-1_40"},{"key":"2568_CR69","doi-asserted-by":"crossref","unstructured":"Zhou, C., Loy, C.C., & Dai, B.(2022). Extract free dense labels from clip. In: European Conference on Computer Vision, pp. 696\u2013712 . Springer","DOI":"10.1007\/978-3-031-19815-1_40"},{"key":"2568_CR70","doi-asserted-by":"crossref","unstructured":"Zhu, P., Qi, M., Li, X., Li, W., & Ma, H.(2023). Unsupervised self-driving attention prediction via uncertainty mining and knowledge embedding. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 8558\u20138568","DOI":"10.1109\/ICCV51070.2023.00786"},{"key":"2568_CR71","doi-asserted-by":"crossref","unstructured":"Zou, Y., Yu, Z., Kumar, B., & Wang, J.(2018). Unsupervised domain adaptation for semantic segmentation via class-balanced self-training. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 289\u2013305","DOI":"10.1007\/978-3-030-01219-9_18"},{"key":"2568_CR72","doi-asserted-by":"crossref","unstructured":"Zou, Y., Yu, Z., Liu, X., Kumar, B., & Wang, J.(2019). Confidence regularized self-training. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 5982\u20135991","DOI":"10.1109\/ICCV.2019.00608"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02568-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02568-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02568-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T04:03:40Z","timestamp":1764993820000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02568-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,27]]},"references-count":72,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2025,12]]}},"alternative-id":["2568"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02568-3","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"type":"print","value":"0920-5691"},{"type":"electronic","value":"1573-1405"}],"subject":[],"published":{"date-parts":[[2025,9,27]]},"assertion":[{"value":"30 September 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 July 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 September 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}