{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,11]],"date-time":"2025-10-11T00:25:03Z","timestamp":1760142303979,"version":"build-2065373602"},"reference-count":82,"publisher":"Springer Science and Business Media LLC","issue":"10","license":[{"start":{"date-parts":[[2025,7,18]],"date-time":"2025-07-18T00:00:00Z","timestamp":1752796800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,7,18]],"date-time":"2025-07-18T00:00:00Z","timestamp":1752796800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100020084","name":"Guangzhou Municipal Science and Technology Bureau","doi-asserted-by":"publisher","award":["025A03J3656"],"award-info":[{"award-number":["025A03J3656"]}],"id":[{"id":"10.13039\/501100020084","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1007\/s11263-025-02519-y","type":"journal-article","created":{"date-parts":[[2025,7,18]],"date-time":"2025-07-18T19:27:55Z","timestamp":1752866875000},"page":"7293-7311","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Towards Balanced Representation Learning with Semantic Anchor Regularization"],"prefix":"10.1007","volume":"133","author":[{"given":"Chengjie","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2778-4058","authenticated-orcid":false,"given":"Qiang","family":"Nie","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ying","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jialin","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yong","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xi","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yanqi","family":"Ge","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yunsheng","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Feng","family":"Zheng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lizhuang","family":"Ma","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,7,18]]},"reference":[{"key":"2519_CR1","unstructured":"Arik, S\u00d6., & Pfister, T. (1902) Attention-based prototypical learning towards interpretable, confident and robust deep neural networks. corr abs\/1902.06292 (2019)"},{"key":"2519_CR2","unstructured":"Berthelot, D., Carlini, N., & Goodfellow, I., et\u00a0al (2019) Mixmatch: A holistic approach to semi-supervised learning. Advances in neural information processing systems 32"},{"key":"2519_CR3","unstructured":"Cao, K., Wei, C., & Gaidon, A., et\u00a0al (2019) Learning imbalanced datasets with label-distribution-aware margin loss. Advances in neural information processing systems 32"},{"key":"2519_CR4","unstructured":"Chen, C., Li, O., & Tao, D., et\u00a0al (2019) This looks like that: deep learning for interpretable image recognition. Advances in neural information processing systems 32"},{"issue":"4","key":"2519_CR5","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"LC Chen","year":"2017","unstructured":"Chen, L. C., Papandreou, G., Kokkinos, I., et al. (2017). Deeplab: Semantic Image Segmentation with Deep Convolutional Nets, Atrous Convolution, and Fully Connected Crfs. TPAMI, 40(4), 834\u2013848.","journal-title":"TPAMI"},{"key":"2519_CR6","unstructured":"Chen, L.C., Papandreou, G., & Schroff, F., et\u00a0al (2017b) Rethinking atrous convolution for semantic image segmentation. arXiv preprint arXiv:1706.05587"},{"key":"2519_CR7","doi-asserted-by":"crossref","unstructured":"Chen, X., Yuan, Y., & Zeng, G., et\u00a0al (2021) Semi-supervised semantic segmentation with cross pseudo supervision. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 2613\u20132622","DOI":"10.1109\/CVPR46437.2021.00264"},{"key":"2519_CR8","doi-asserted-by":"crossref","unstructured":"Chu, P., Bian, X., & Liu, S., et\u00a0al (2020) Feature space augmentation for long-tailed data. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XXIX 16, Springer, pp 694\u2013710","DOI":"10.1007\/978-3-030-58526-6_41"},{"key":"2519_CR9","first-page":"8765","volume":"33","author":"CY Chuang","year":"2020","unstructured":"Chuang, C. Y., Robinson, J., Lin, Y. C., et al. (2020). Debiased Contrastive Learning. Advances in neural information processing systems, 33, 8765\u20138775.","journal-title":"Advances in neural information processing systems"},{"key":"2519_CR10","unstructured":"Contributors, M. (2020) MMSegmentation: Openmmlab semantic segmentation toolbox and benchmark. https:\/\/github.com\/open-mmlab\/mmsegmentation"},{"key":"2519_CR11","unstructured":"Contributors, M. (2023) Openmmlab\u2019s pre-training toolbox and benchmark. https:\/\/github.com\/open-mmlab\/mmpretrain"},{"key":"2519_CR12","doi-asserted-by":"crossref","unstructured":"Cordts, M., Omran, M., & Ramos, S., et\u00a0al (2016) The cityscapes dataset for semantic urban scene understanding. In: CVPR, pp 3213\u20133223","DOI":"10.1109\/CVPR.2016.350"},{"issue":"1","key":"2519_CR13","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1109\/TIT.1967.1053964","volume":"13","author":"T Cover","year":"1967","unstructured":"Cover, T., & Hart, P. (1967). Nearest Neighbor Pattern Classification. IEEE transactions on information theory, 13(1), 21\u201327.","journal-title":"IEEE transactions on information theory"},{"key":"2519_CR14","doi-asserted-by":"crossref","unstructured":"Cui, J., Zhong, Z., & Liu, S., et\u00a0al (2021) Parametric contrastive learning. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 715\u2013724","DOI":"10.1109\/ICCV48922.2021.00075"},{"key":"2519_CR15","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., & Socher, R., et\u00a0al (2009) Imagenet: A large-scale hierarchical image database. In: CVPR, pp 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"2519_CR16","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham, M., Eslami, S. A., Van Gool, L., et al. (2015). The Pascal Visual Object Classes Challenge: A Retrospective. International journal of computer vision, 111, 98\u2013136.","journal-title":"International journal of computer vision"},{"key":"2519_CR17","doi-asserted-by":"crossref","unstructured":"French, G., Laine, S., & Aila, T., et\u00a0al (2019) Semi-supervised semantic segmentation needs strong, varied perturbations. arXiv preprint arXiv:1906.01916","DOI":"10.5244\/C.34.154"},{"key":"2519_CR18","doi-asserted-by":"crossref","unstructured":"Ge, W. (2018) Deep metric learning with hierarchical triplet loss. In: Proceedings of the European Conference on Computer Vision (ECCV), pp 269\u2013285","DOI":"10.1007\/978-3-030-01231-1_17"},{"key":"2519_CR19","unstructured":"Graf, F., Hofer, C., Niethammer, M., et\u00a0al (2021) Dissecting supervised contrastive learning. In: International Conference on Machine Learning, PMLR, pp 3821\u20133830"},{"key":"2519_CR20","doi-asserted-by":"crossref","unstructured":"Hariharan, B., Arbel\u00e1ez, P., & Bourdev, L., et\u00a0al (2011) Semantic contours from inverse detectors. In: 2011 international conference on computer vision, IEEE, pp 991\u2013998","DOI":"10.1109\/ICCV.2011.6126343"},{"key":"2519_CR21","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., & Ren, S., et\u00a0al (2016) Deep residual learning for image recognition. In: CVPR, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"2519_CR22","doi-asserted-by":"crossref","unstructured":"He, K., Fan, H., & Wu, Y., et\u00a0al (2020) Momentum contrast for unsupervised visual representation learning. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 9729\u20139738","DOI":"10.1109\/CVPR42600.2020.00975"},{"key":"2519_CR23","doi-asserted-by":"crossref","unstructured":"Hu, H., Cui, J., & Wang, L. (2021a) Region-aware contrastive learning for semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 16291\u201316301","DOI":"10.1109\/ICCV48922.2021.01598"},{"key":"2519_CR24","doi-asserted-by":"crossref","unstructured":"Hu, Z., Yang, Z., & Hu, X., et\u00a0al (2021b) Simple: Similar pseudo label exploitation for semi-supervised classification. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 15099\u201315108","DOI":"10.1109\/CVPR46437.2021.01485"},{"key":"2519_CR25","unstructured":"Huang, J., Dong, Q., & Gong, S., et\u00a0al (2019) Unsupervised deep learning by neighbourhood discovery. In: International Conference on Machine Learning, PMLR, pp 2849\u20132858"},{"key":"2519_CR26","doi-asserted-by":"crossref","unstructured":"Huang, Y., Kang, D., & Chen, L., et\u00a0al (2022) Car: Class-aware regularizations for semantic segmentation. In: Computer Vision\u2013ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proceedings, Part XXVIII, Springer, pp 518\u2013534","DOI":"10.1007\/978-3-031-19815-1_30"},{"key":"2519_CR27","doi-asserted-by":"crossref","unstructured":"Jiang, Z., Li, Y., Yang, C., et\u00a0al (2022) Prototypical contrast adaptation for domain adaptive semantic segmentation. In: Computer Vision\u2013ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proceedings, Part XXXIV, Springer, pp 36\u201354","DOI":"10.1007\/978-3-031-19830-4_3"},{"key":"2519_CR28","unstructured":"Kang, B., Li, Y., & Xie, S., et\u00a0al (2020) Exploring balanced feature spaces for representation learning. In: International Conference on Learning Representations"},{"key":"2519_CR29","unstructured":"Kondratyuk, D., Yu, L., & Gu, X., et\u00a0al (2023) Videopoet: A large language model for zero-shot video generation. arXiv preprint arXiv:2312.14125"},{"key":"2519_CR30","doi-asserted-by":"crossref","unstructured":"Krause, J., Stark, M., & Deng, J., et\u00a0al (2013) 3d object representations for fine-grained categorization. In: Proceedings of the IEEE international conference on computer vision workshops, pp 554\u2013561","DOI":"10.1109\/ICCVW.2013.77"},{"key":"2519_CR31","unstructured":"Krizhevsky, A., Hinton, G., et\u00a0al (2009) Learning multiple layers of features from tiny images"},{"key":"2519_CR32","unstructured":"Kwon, H., Jeong, S., & Kim, S., et\u00a0al (2021) Dual prototypical contrastive learning for few-shot semantic segmentation. arXiv preprint arXiv:2111.04982"},{"key":"2519_CR33","doi-asserted-by":"crossref","unstructured":"Liu, Y., Deng, J., & Tao, J., et\u00a0al (2022) Undoing the damage of label shift for cross-domain semantic segmentation. In: CVPR","DOI":"10.1109\/CVPR52688.2022.00691"},{"key":"2519_CR34","doi-asserted-by":"crossref","unstructured":"Liu, Z., Miao, Z., & Zhan, X., et\u00a0al (2019) Large-scale long-tailed recognition in an open world. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 2537\u20132546","DOI":"10.1109\/CVPR.2019.00264"},{"key":"2519_CR35","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., & Cao, Y., et\u00a0al (2021) Swin transformer: Hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 10012\u201310022","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"2519_CR36","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T. (2015) Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3431\u20133440","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"2519_CR37","unstructured":"Loshchilov, I., & Hutter, F. (2017) Decoupled weight decay regularization. arXiv preprint arXiv:1711.05101"},{"key":"2519_CR38","doi-asserted-by":"crossref","unstructured":"Lu, Y., Luo, Y., & Zhang, L., et\u00a0al (2022) Bidirectional self-training with multiple anisotropic prototypes for domain adaptive semantic segmentation. In: Proceedings of the 30th ACM International Conference on Multimedia, pp 1405\u20131415","DOI":"10.1145\/3503161.3548225"},{"key":"2519_CR39","doi-asserted-by":"crossref","unstructured":"Ma, Y., Jiao, L., & Liu, F., et\u00a0al (2023) Curvature-balanced feature manifold learning for long-tailed classification. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 15824\u201315835","DOI":"10.1109\/CVPR52729.2023.01519"},{"key":"2519_CR40","first-page":"5151","volume":"1306","author":"S Maji","year":"2013","unstructured":"Maji, S., Kannala, J., Rahtu, E., et al. (2013). Fine-grained Visual Classification of Aircraft. Tech. rep., 1306, 5151.","journal-title":"Tech. rep."},{"key":"2519_CR41","doi-asserted-by":"crossref","unstructured":"Mottaghi, R., Chen, X., & Liu, X., et\u00a0al (2014) The role of context for object detection and semantic segmentation in the wild. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 891\u2013898","DOI":"10.1109\/CVPR.2014.119"},{"key":"2519_CR42","doi-asserted-by":"crossref","unstructured":"Nauta, M., Van\u00a0Bree, R., Seifert, C. (2021) Neural prototype trees for interpretable fine-grained image recognition. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 14933\u201314943","DOI":"10.1109\/CVPR46437.2021.01469"},{"key":"2519_CR43","doi-asserted-by":"crossref","unstructured":"Nguyen, K., Todorovic, S. (2019) Feature weighting and boosting for few-shot segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 622\u2013631","DOI":"10.1109\/ICCV.2019.00071"},{"key":"2519_CR44","unstructured":"Oord, Avd, Li Y, Vinyals O (2018) Representation learning with contrastive predictive coding. arXiv preprint arXiv:1807.03748"},{"issue":"40","key":"2519_CR45","doi-asserted-by":"publisher","first-page":"24652","DOI":"10.1073\/pnas.2015509117","volume":"117","author":"V Papyan","year":"2020","unstructured":"Papyan, V., Han, X., & Donoho, D. L. (2020). Prevalence of Neural Collapse During the Terminal Phase of Deep Learning Training. Proceedings of the National Academy of Sciences, 117(40), 24652\u201324663.","journal-title":"Proceedings of the National Academy of Sciences"},{"key":"2519_CR46","unstructured":"Radford, A., Kim, J.W., Hallacy, C., et\u00a0al (2021) Learning transferable visual models from natural language supervision. In: International conference on machine learning, PMLR, pp 8748\u20138763"},{"key":"2519_CR47","doi-asserted-by":"crossref","unstructured":"Robbins, H., Monro, S. (1951) A stochastic approximation method. The annals of mathematical statistics pp 400\u2013407","DOI":"10.1214\/aoms\/1177729586"},{"issue":"3","key":"2519_CR48","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., et al. (2015). Imagenet Large Scale Visual Recognition Challenge. International journal of computer vision, 115(3), 211\u2013252.","journal-title":"International journal of computer vision"},{"key":"2519_CR49","doi-asserted-by":"crossref","unstructured":"Schroff, F., Kalenichenko, D., Philbin, J. (2015) Facenet: A unified embedding for face recognition and clustering. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 815\u2013823","DOI":"10.1109\/CVPR.2015.7298682"},{"issue":"1","key":"2519_CR50","doi-asserted-by":"publisher","first-page":"7146","DOI":"10.1038\/s41598-020-63649-6","volume":"10","author":"Y Shu","year":"2020","unstructured":"Shu, Y., Shi, Y., Wang, Y., et al. (2020). P-odn: Prototype-based Open Deep Network for Open Set Recognition. Scientific reports, 10(1), 7146.","journal-title":"Scientific reports"},{"key":"2519_CR51","unstructured":"Sohn, K. (2016) Improved deep metric learning with multi-class n-pair loss objective. Advances in neural information processing systems 29"},{"key":"2519_CR52","first-page":"596","volume":"33","author":"K Sohn","year":"2020","unstructured":"Sohn, K., Berthelot, D., Carlini, N., et al. (2020). Fixmatch: Simplifying Semi-supervised Learning with Consistency and Confidence. Advances in neural information processing systems, 33, 596\u2013608.","journal-title":"Advances in neural information processing systems"},{"key":"2519_CR53","doi-asserted-by":"crossref","unstructured":"Strudel, R., Garcia, R., Laptev, I., et\u00a0al (2021) Segmenter: Transformer for semantic segmentation. In: Proceedings of the IEEE\/CVF international conference on computer vision, pp 7262\u20137272","DOI":"10.1109\/ICCV48922.2021.00717"},{"key":"2519_CR54","unstructured":"Tarvainen, A., Valpola, H. (2017) Mean teachers are better role models: Weight-averaged consistency targets improve semi-supervised deep learning results. Advances in neural information processing systems 30"},{"key":"2519_CR55","unstructured":"Van Den\u00a0Oord, A., Vinyals, O., et\u00a0al (2017) Neural discrete representation learning. Advances in neural information processing systems 30"},{"key":"2519_CR56","unstructured":"Wah, C., Branson, S., Welinder, P., et\u00a0al (2011) The caltech-ucsd birds-200-2011 dataset"},{"key":"2519_CR57","doi-asserted-by":"crossref","unstructured":"Wang, C., Xie, H., Yuan, Y., et\u00a0al (2023a) Space engage: Collaborative space supervision for contrastive-based semi-supervised semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 931\u2013942","DOI":"10.1109\/ICCV51070.2023.00092"},{"key":"2519_CR58","doi-asserted-by":"crossref","unstructured":"Wang, F., Liu, H. (2021) Understanding the behaviour of contrastive loss. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 2495\u20132504","DOI":"10.1109\/CVPR46437.2021.00252"},{"issue":"10","key":"2519_CR59","doi-asserted-by":"publisher","first-page":"3349","DOI":"10.1109\/TPAMI.2020.2983686","volume":"43","author":"J Wang","year":"2020","unstructured":"Wang, J., Sun, K., Cheng, T., et al. (2020). Deep High-resolution Representation Learning for Visual Recognition. IEEE transactions on pattern analysis and machine intelligence, 43(10), 3349\u20133364.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2519_CR60","doi-asserted-by":"crossref","unstructured":"Wang, K., Liew, J.H., & Zou, Y., et\u00a0al (2019) Panet: Few-shot image semantic segmentation with prototype alignment. In: proceedings of the IEEE\/CVF international conference on computer vision, pp 9197\u20139206","DOI":"10.1109\/ICCV.2019.00929"},{"key":"2519_CR61","doi-asserted-by":"crossref","unstructured":"Wang, P., Han, K., & Wei, X.S., et\u00a0al (2021a) Contrastive learning based hybrid networks for long-tailed image classification. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 943\u2013952","DOI":"10.1109\/CVPR46437.2021.00100"},{"key":"2519_CR62","unstructured":"Wang ,T., Isola, P. (2020) Understanding contrastive representation learning through alignment and uniformity on the hypersphere. In: International Conference on Machine Learning, PMLR, pp 9929\u20139939"},{"key":"2519_CR63","doi-asserted-by":"crossref","unstructured":"Wang, W., Zhou, T., Yu, F., et\u00a0al (2021b) Exploring cross-image pixel contrast for semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 7303\u20137313","DOI":"10.1109\/ICCV48922.2021.00721"},{"key":"2519_CR64","doi-asserted-by":"crossref","unstructured":"Wang, Y., Wang, H., Shen, Y., et\u00a0al (2022) Semi-supervised semantic segmentation using unreliable pseudo-labels. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 4248\u20134257","DOI":"10.1109\/CVPR52688.2022.00421"},{"key":"2519_CR65","doi-asserted-by":"publisher","unstructured":"Wang, Z., Shi, S., & Wu, Y., et\u00a0al (2023b) Prototype calibration for long tailed recognition. In: 2023 IEEE International Conference on Multimedia and Expo (ICME), pp 2123\u20132128, https:\/\/doi.org\/10.1109\/ICME55011.2023.00363","DOI":"10.1109\/ICME55011.2023.00363"},{"key":"2519_CR66","doi-asserted-by":"crossref","unstructured":"Wu, D., Guo, Z., & Li, A., et\u00a0al (2023) Semantic segmentation via pixel-to-center similarity calculation. arXiv preprint arXiv:2301.04870","DOI":"10.1049\/cit2.12245"},{"key":"2519_CR67","doi-asserted-by":"crossref","unstructured":"Wu, Z., Xiong, Y., Yu, & S.X., et\u00a0al (2018) Unsupervised feature learning via non-parametric instance discrimination. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 3733\u20133742","DOI":"10.1109\/CVPR.2018.00393"},{"key":"2519_CR68","doi-asserted-by":"crossref","unstructured":"Xiao, T., Liu, Y., & Zhou, B., et\u00a0al (2018) Unified perceptual parsing for scene understanding. In: Proceedings of the European conference on computer vision (ECCV), pp 418\u2013434","DOI":"10.1007\/978-3-030-01228-1_26"},{"key":"2519_CR69","unstructured":"Xie, E., Wang, W., & Yu, Z., et\u00a0al (2021) Segformer: Simple and efficient design for semantic segmentation with transformers. NeurIPS 34"},{"key":"2519_CR70","first-page":"26007","volume":"35","author":"H Xu","year":"2022","unstructured":"Xu, H., Liu, L., Bian, Q., et al. (2022). Semi-supervised Semantic Segmentation with Prototype-based Consistency Regularization. Advances in Neural Information Processing Systems, 35, 26007\u201326020.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2519_CR71","first-page":"21969","volume":"33","author":"W Xu","year":"2020","unstructured":"Xu, W., Xian, Y., Wang, J., et al. (2020). Attribute Prototype Network for Zero-shot Learning. Advances in Neural Information Processing Systems, 33, 21969\u201321980.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2519_CR72","doi-asserted-by":"crossref","unstructured":"Yang, L., Qi, L., & Feng, L., et\u00a0al (2023) Revisiting weak-to-strong consistency in semi-supervised semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 7236\u20137246","DOI":"10.1109\/CVPR52729.2023.00699"},{"key":"2519_CR73","first-page":"19290","volume":"33","author":"Y Yang","year":"2020","unstructured":"Yang, Y., & Xu, Z. (2020). Rethinking the Value of Labels for Improving Class-imbalanced Learning. Advances in neural information processing systems, 33, 19290\u201319301.","journal-title":"Advances in neural information processing systems"},{"key":"2519_CR74","doi-asserted-by":"crossref","unstructured":"Yu, L., Cheng, Y., & Sohn, K., et\u00a0al (2023) Magvit: Masked generative video transformer. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 10459\u201310469","DOI":"10.1109\/CVPR52729.2023.01008"},{"key":"2519_CR75","doi-asserted-by":"crossref","unstructured":"Yuan, Y., Chen, X., & Wang, J. (2020) Object-contextual representations for semantic segmentation. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part VI 16, Springer, pp 173\u2013190","DOI":"10.1007\/978-3-030-58539-6_11"},{"key":"2519_CR76","doi-asserted-by":"crossref","unstructured":"Yun, S., Han, D., & Oh, S.J., et\u00a0al (2019) Cutmix: Regularization strategy to train strong classifiers with localizable features. In: ICCV, pp 6023\u20136032","DOI":"10.1109\/ICCV.2019.00612"},{"key":"2519_CR77","unstructured":"Zhang, H., Cisse, M., & Dauphin, Y.N., et\u00a0al (2018) mixup: Beyond empirical risk minimization. In: ICLR"},{"key":"2519_CR78","doi-asserted-by":"crossref","unstructured":"Zhang, P., Zhang, B., Zhang, T., et\u00a0al (2021a) Prototypical pseudo label denoising and target structure learning for domain adaptive semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 12414\u201312424","DOI":"10.1109\/CVPR46437.2021.01223"},{"key":"2519_CR79","doi-asserted-by":"crossref","unstructured":"Zhang, S., Li, Z., Yan, S., et\u00a0al (2021b) Distribution alignment: A unified framework for long-tail visual recognition. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 2361\u20132370","DOI":"10.1109\/CVPR46437.2021.00239"},{"key":"2519_CR80","doi-asserted-by":"crossref","unstructured":"Zhou, B., Zhao, H., & Puig, X., et\u00a0al (2017) Scene parsing through ade20k dataset. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 633\u2013641","DOI":"10.1109\/CVPR.2017.544"},{"key":"2519_CR81","doi-asserted-by":"crossref","unstructured":"Zhou, T., Wang, W., & Konukoglu, E., et\u00a0al (2022) Rethinking semantic segmentation: A prototype view. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 2582\u20132593","DOI":"10.1109\/CVPR52688.2022.00261"},{"key":"2519_CR82","doi-asserted-by":"crossref","unstructured":"Zhu, J., Wang, Z., & Chen, J., et\u00a0al (2022) Balanced contrastive learning for long-tailed visual recognition. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 6908\u20136917","DOI":"10.1109\/CVPR52688.2022.00679"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02519-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02519-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02519-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,10]],"date-time":"2025-10-10T08:49:09Z","timestamp":1760086149000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02519-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,18]]},"references-count":82,"journal-issue":{"issue":"10","published-print":{"date-parts":[[2025,10]]}},"alternative-id":["2519"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02519-y","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"type":"print","value":"0920-5691"},{"type":"electronic","value":"1573-1405"}],"subject":[],"published":{"date-parts":[[2025,7,18]]},"assertion":[{"value":"20 June 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 June 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 July 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}