{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,12]],"date-time":"2025-11-12T06:32:57Z","timestamp":1762929177499,"version":"3.45.0"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2025,8,4]],"date-time":"2025-08-04T00:00:00Z","timestamp":1754265600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,8,4]],"date-time":"2025-08-04T00:00:00Z","timestamp":1754265600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"National Key Research and Development Program of China","award":["2023YFC2705700"],"award-info":[{"award-number":["2023YFC2705700"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U23A20318"],"award-info":[{"award-number":["U23A20318"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Science and Technology Major Project of Hubei Province","award":["2024BAB046"],"award-info":[{"award-number":["2024BAB046"]}]},{"DOI":"10.13039\/501100001809","name":"Joint Funds of the National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["U2336211","62225113"],"award-info":[{"award-number":["U2336211","62225113"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100012556","name":"Foundation for Innovative Research Groups of Hubei Province","doi-asserted-by":"publisher","award":["2024AFA017"],"award-info":[{"award-number":["2024AFA017"]}],"id":[{"id":"10.13039\/501100012556","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2025,11]]},"DOI":"10.1007\/s11263-025-02545-w","type":"journal-article","created":{"date-parts":[[2025,8,4]],"date-time":"2025-08-04T16:32:56Z","timestamp":1754325176000},"page":"7553-7569","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["DM-PCL: Text-Driven Dual-Modal Prototype Consistency Learning for Weakly-Supervised Few-Shot Part Segmentation"],"prefix":"10.1007","volume":"133","author":[{"given":"Mengya","family":"Han","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2296-6370","authenticated-orcid":false,"given":"Yong","family":"Luo","sequence":"additional","affiliation":[]},{"given":"Han","family":"Hu","sequence":"additional","affiliation":[]},{"given":"Zengmao","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Lefei","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Bo","family":"Du","sequence":"additional","affiliation":[]},{"given":"Ling-Yu","family":"Duan","sequence":"additional","affiliation":[]},{"given":"Dacheng","family":"Tao","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,8,4]]},"reference":[{"key":"2545_CR1","first-page":"17864","volume":"34","author":"B Cheng","year":"2021","unstructured":"Cheng, B., Schwing, A., & Kirillov, A. (2021). Per-pixel classification is not all you need for semantic segmentation. Advances in neural information processing systems, 34, 17864\u201317875.","journal-title":"Advances in neural information processing systems"},{"key":"2545_CR2","doi-asserted-by":"crossref","unstructured":"Strudel, R., Garcia, R., Laptev, I., & Schmid, C. (2021) Segmenter: Transformer for semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 7262\u20137272","DOI":"10.1109\/ICCV48922.2021.00717"},{"key":"2545_CR3","doi-asserted-by":"crossref","unstructured":"Zhou, T., Wang, W., Konukoglu, E., & Van Gool, L. (2022) Rethinking semantic segmentation: A prototype view. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2582\u20132593","DOI":"10.1109\/CVPR52688.2022.00261"},{"key":"2545_CR4","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., & Darrell, T. (2015) Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 3431\u20133440","DOI":"10.1109\/CVPR.2015.7298965"},{"issue":"12","key":"2545_CR5","doi-asserted-by":"publisher","first-page":"2481","DOI":"10.1109\/TPAMI.2016.2644615","volume":"39","author":"V Badrinarayanan","year":"2017","unstructured":"Badrinarayanan, V., Kendall, A., & Cipolla, R. (2017). Segnet: A deep convolutional encoder-decoder architecture for image segmentation. IEEE Transactions on Pattern Analysis and Machine Intelligence, 39(12), 2481\u20132495.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"4","key":"2545_CR6","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"L-C Chen","year":"2017","unstructured":"Chen, L.-C., Papandreou, G., Kokkinos, I., Murphy, K., & Yuille, A. L. (2017). Deeplab: Semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected crfs. IEEE Transactions on Pattern Analysis and Machine Intelligence, 40(4), 834\u2013848.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"6","key":"2545_CR7","doi-asserted-by":"publisher","first-page":"1899","DOI":"10.1007\/s11263-023-01917-4","volume":"132","author":"X Wang","year":"2024","unstructured":"Wang, X., Zhang, S., Cen, J., Gao, C., Zhang, Y., Zhao, D., & Sang, N. (2024). Clip-guided prototype modulating for few-shot action recognition. International Journal of Computer Vision, 132(6), 1899\u20131912.","journal-title":"International Journal of Computer Vision"},{"key":"2545_CR8","doi-asserted-by":"crossref","unstructured":"Pan, M.-H., Xin, H.-Y., & Shen, H.-B. (2024) Semantic-based implicit feature transform for few-shot classification. International Journal of Computer Vision, 1\u201316","DOI":"10.1007\/s11263-024-02113-8"},{"issue":"3","key":"2545_CR9","doi-asserted-by":"publisher","first-page":"772","DOI":"10.1007\/s11263-022-01731-4","volume":"131","author":"C Ye","year":"2023","unstructured":"Ye, C., Zhu, H., Zhang, B., & Chen, T. (2023). A closer look at few-shot 3d point cloud classification. International Journal of Computer Vision, 131(3), 772\u2013795.","journal-title":"International Journal of Computer Vision"},{"issue":"5","key":"2545_CR10","doi-asserted-by":"publisher","first-page":"1211","DOI":"10.1007\/s11263-023-01760-7","volume":"131","author":"W Qiang","year":"2023","unstructured":"Qiang, W., Li, J., Su, B., Fu, J., Xiong, H., & Wen, J.-R. (2023). Meta attention-generation network for cross-granularity few-shot learning. International Journal of Computer Vision, 131(5), 1211\u20131233.","journal-title":"International Journal of Computer Vision"},{"key":"2545_CR11","doi-asserted-by":"crossref","unstructured":"Tritrong, N., Rewatbowornwong, P., & Suwajanakorn, S. (2021) Repurposing gans for one-shot semantic part segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 4475\u20134485","DOI":"10.1109\/CVPR46437.2021.00445"},{"key":"2545_CR12","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.111326","volume":"162","author":"M Han","year":"2025","unstructured":"Han, M., Zheng, H., Wang, C., Luo, Y., Hu, H., Zhang, J., & Du, B. (2025). Partseg: Few-shot part segmentation via part-aware prompt learning. Pattern Recognition, 162, Article 111326.","journal-title":"Pattern Recognition"},{"key":"2545_CR13","doi-asserted-by":"crossref","unstructured":"Saha, O., Cheng, Z., & Maji, S. (2022) Improving few-shot part segmentation using coarse supervision. In: European Conference on Computer Vision, 283\u2013299. Springer","DOI":"10.1007\/978-3-031-20056-4_17"},{"key":"2545_CR14","doi-asserted-by":"crossref","unstructured":"Singh, R., Gupta, P., Shenoy, P., & Sarvadevabhatla, R. (2022) Float: Factorized learning of object attributes for improved multi-object multi-part scene parsing. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 1445\u20131455","DOI":"10.1109\/CVPR52688.2022.00150"},{"key":"2545_CR15","doi-asserted-by":"crossref","unstructured":"De\u00a0Geus, D., Meletis, P., Lu, C., Wen, X., & Dubbelman, G. (2021) Part-aware panoptic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 5485\u20135494","DOI":"10.1109\/CVPR46437.2021.00544"},{"key":"2545_CR16","doi-asserted-by":"crossref","unstructured":"Li, X., Xu, S., Yang, Y., Cheng, G., Tong, Y., & Tao, D. (2022) Panoptic-partformer: Learning a unified model for panoptic part segmentation. In: European Conference on Computer Vision, 729\u2013747. Springer","DOI":"10.1007\/978-3-031-19812-0_42"},{"key":"2545_CR17","unstructured":"Xu, Z., Liu, Z., Sun, C., Murphy, K., Freeman, W. T., Tenenbaum, J. B., & Wu, J. (2019) Unsupervised discovery of parts, structure, and dynamics. In: International Conference on Learning Representations"},{"key":"2545_CR18","unstructured":"Wei, M., Yue, X., Zhang, W., Kong, S., Liu, X., & Pang, J. (2023) Ov-parts: Towards open-vocabulary part segmentation. Advances in Neural Information Processing Systems 36"},{"key":"2545_CR19","doi-asserted-by":"crossref","unstructured":"He, J., Yang, S., Yang, S., Kortylewski, A., Yuan, X., Chen, J.-N., Liu, S., Yang, C., Yu, Q., & Yuille, A. (2022) Partimagenet: A large, high-quality dataset of parts. In: European Conference on Computer Vision, 128\u2013145. Springer","DOI":"10.1007\/978-3-031-20074-8_8"},{"key":"2545_CR20","doi-asserted-by":"crossref","unstructured":"Ahn, J., Cho, S., & Kwak, S. (2019) Weakly supervised learning of instance segmentation with inter-pixel relations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2209\u20132218","DOI":"10.1109\/CVPR.2019.00231"},{"issue":"7","key":"2545_CR21","doi-asserted-by":"publisher","first-page":"1704","DOI":"10.1007\/s11263-023-01779-w","volume":"131","author":"F Long","year":"2023","unstructured":"Long, F., Yao, T., Qiu, Z., Tian, X., Luo, J., & Mei, T. (2023). Bi-calibration networks for weakly-supervised video representation learning. International Journal of Computer Vision, 131(7), 1704\u20131721.","journal-title":"International Journal of Computer Vision"},{"issue":"3","key":"2545_CR22","doi-asserted-by":"publisher","first-page":"750","DOI":"10.1007\/s11263-023-01919-2","volume":"132","author":"W Zhai","year":"2024","unstructured":"Zhai, W., Wu, P., Zhu, K., Cao, Y., Wu, F., & Zha, Z.-J. (2024). Background activation suppression for weakly supervised object localization and semantic segmentation. International Journal of Computer Vision, 132(3), 750\u2013775.","journal-title":"International Journal of Computer Vision"},{"issue":"8","key":"2545_CR23","doi-asserted-by":"publisher","first-page":"1892","DOI":"10.1007\/s11263-023-01796-9","volume":"131","author":"B Zhang","year":"2023","unstructured":"Zhang, B., Xiao, J., Wei, Y., & Zhao, Y. (2023). Credible dual-expert learning for weakly supervised semantic segmentation. International Journal of Computer Vision, 131(8), 1892\u20131908.","journal-title":"International Journal of Computer Vision"},{"key":"2545_CR24","doi-asserted-by":"crossref","unstructured":"Kang, D., Koniusz, P., Cho, M., & Murray, N. (2023) Distilling self-supervised vision transformers for weakly-supervised few-shot classification & segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 19627\u201319638","DOI":"10.1109\/CVPR52729.2023.01880"},{"key":"2545_CR25","doi-asserted-by":"crossref","unstructured":"Wang, H., Liu, L., Zhang, W., Zhang, J., Gan, Z., Wang, Y., Wang, C., & Wang, H. (2022) Iterative few-shot semantic segmentation from image label text. In: International Joint Conference on Artificial Intelligence","DOI":"10.24963\/ijcai.2022\/193"},{"key":"2545_CR26","doi-asserted-by":"publisher","first-page":"1784","DOI":"10.1109\/TMM.2022.3162951","volume":"25","author":"PHT Gama","year":"2023","unstructured":"Gama, P. H. T., Oliveira, H., Junior, J. M., & Santos, J. A. D. (2023). Weakly supervised few-shot segmentation via meta-learning. IEEE Transactions on Multimedia, 25, 1784\u20131797.","journal-title":"IEEE Transactions on Multimedia"},{"key":"2545_CR27","unstructured":"Vinyals, O., Blundell, C., Lillicrap, T., Wierstra, D., et al. (2016) Matching networks for one shot learning. Advances in Neural Information Processing Systems, 3637\u20133645"},{"key":"2545_CR28","unstructured":"Snell, J., Swersky, K., & Zemel, R. (2017) Prototypical networks for few-shot learning. Advances in Neural Information Processing Systems, 4080\u20134090"},{"key":"2545_CR29","doi-asserted-by":"crossref","unstructured":"Wang, K., Liew, J. H., Zou, Y., Zhou, D., & Feng, J. (2019) Panet: Few-shot image semantic segmentation with prototype alignment. In: IEEE International Conference on Computer Vision, 9197\u20139206","DOI":"10.1109\/ICCV.2019.00929"},{"issue":"9","key":"2545_CR30","doi-asserted-by":"publisher","first-page":"3855","DOI":"10.1109\/TCYB.2020.2992433","volume":"50","author":"X Zhang","year":"2020","unstructured":"Zhang, X., Wei, Y., Yang, Y., & Huang, T. S. (2020). Sg-one: Similarity guidance network for one-shot semantic segmentation. IEEE Transactions on Cybernetics, 50(9), 3855\u20133865.","journal-title":"IEEE Transactions on Cybernetics"},{"key":"2545_CR31","doi-asserted-by":"crossref","unstructured":"Wu, Z., Shi, X., Lin, G., & Cai, J. (2021) Learning meta-class memory for few-shot semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 517\u2013526","DOI":"10.1109\/ICCV48922.2021.00056"},{"key":"2545_CR32","doi-asserted-by":"crossref","unstructured":"Li, G., Jampani, V., Sevilla-Lara, L., Sun, D., Kim, J., & Kim, J. (2021) Adaptive prototype learning and allocation for few-shot segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 8334\u20138343","DOI":"10.1109\/CVPR46437.2021.00823"},{"issue":"1","key":"2545_CR33","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/s11263-023-01886-8","volume":"132","author":"C Lang","year":"2024","unstructured":"Lang, C., Cheng, G., Tu, B., & Han, J. (2024). Few-shot segmentation via divide-and-conquer proxies. International Journal of Computer Vision, 132(1), 261\u2013283.","journal-title":"International Journal of Computer Vision"},{"key":"2545_CR34","doi-asserted-by":"crossref","unstructured":"Han, M., Zheng, H., Wang, C., Luo, Y., Hu, H., & Du, B. (2022) Leveraging gan priors for few-shot part segmentation. In: ACM International Conference on Multimedia","DOI":"10.1145\/3503161.3548398"},{"key":"2545_CR35","unstructured":"Radford, A., Kim, J. W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., Clark, J., et al. (2021) Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, 8748\u20138763. PMLR"},{"issue":"9","key":"2545_CR36","doi-asserted-by":"publisher","first-page":"2337","DOI":"10.1007\/s11263-022-01653-1","volume":"130","author":"K Zhou","year":"2022","unstructured":"Zhou, K., Yang, J., Loy, C. C., & Liu, Z. (2022). Learning to prompt for vision-language models. International Journal of Computer Vision, 130(9), 2337\u20132348.","journal-title":"International Journal of Computer Vision"},{"key":"2545_CR37","doi-asserted-by":"crossref","unstructured":"Rao, Y., Zhao, W., Chen, G., Tang, Y., Zhu, Z., Huang, G., Zhou, J., & Lu, J. (2022) Denseclip: Language-guided dense prediction with context-aware prompting. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 18082\u201318091","DOI":"10.1109\/CVPR52688.2022.01755"},{"key":"2545_CR38","doi-asserted-by":"crossref","unstructured":"Zhou, K., Yang, J., Loy, C. C., & Liu, Z. (2022) Conditional prompt learning for vision-language models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 16816\u201316825","DOI":"10.1109\/CVPR52688.2022.01631"},{"key":"2545_CR39","doi-asserted-by":"publisher","first-page":"2352","DOI":"10.1109\/TIP.2022.3141868","volume":"31","author":"C Chen","year":"2022","unstructured":"Chen, C., Ye, M., Qi, M., Wu, J., Jiang, J., & Lin, C.-W. (2022). Structure-aware positional transformer for visible-infrared person re-identification. IEEE Transactions on Image Processing, 31, 2352\u20132364. https:\/\/doi.org\/10.1109\/TIP.2022.3141868","journal-title":"IEEE Transactions on Image Processing"},{"key":"2545_CR40","doi-asserted-by":"crossref","unstructured":"Ranftl, R., Bochkovskiy, A., & Koltun, V. (2021) Vision transformers for dense prediction. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 12179\u201312188","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"2545_CR41","doi-asserted-by":"crossref","unstructured":"Chen, C., Ye, M., Qi, M., & Du, B. (2022) Sketch transformer: Asymmetrical disentanglement learning from dynamic synthesis. In: ACM International Conference on Multimedia","DOI":"10.1145\/3503161.3547993"},{"issue":"5","key":"2545_CR42","doi-asserted-by":"publisher","first-page":"2950","DOI":"10.1109\/TPAMI.2023.3337005","volume":"46","author":"C Chen","year":"2024","unstructured":"Chen, C., Ye, M., Qi, M., & Du, B. (2024). Sketchtrans: Disentangled prototype learning with transformer for sketch-photo recognition. IEEE Transactions on Pattern Analysis and Machine Intelligence, 46(5), 2950\u20132964. https:\/\/doi.org\/10.1109\/TPAMI.2023.3337005","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2545_CR43","unstructured":"Jia, Y., Huang, W., Gao, J., Wang, Q., & Li, Q. (2024) Embedding generalized semantic knowledge into few-shot remote sensing segmentation. arXiv preprint arXiv:2405.13686"},{"key":"2545_CR44","doi-asserted-by":"crossref","unstructured":"Zhao, X., Vemulapalli, R., Mansfield, P. A., Gong, B., Green, B., Shapira, L., & Wu, Y. (2021) Contrastive learning for label efficient semantic segmentation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 10623\u201310633","DOI":"10.1109\/ICCV48922.2021.01045"},{"key":"2545_CR45","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham, M., Van Gool, L., Williams, C. K., Winn, J., & Zisserman, A. (2010). The pascal visual object classes (voc) challenge. International Journal of Computer Vision, 88, 303\u2013338.","journal-title":"International Journal of Computer Vision"},{"key":"2545_CR46","unstructured":"Li, B., Weinberger, K. Q., Belongie, S., Koltun, V., & Ranftl, R. (2022) Language-driven semantic segmentation. In: International Conference on Learning Representations"},{"key":"2545_CR47","doi-asserted-by":"crossref","unstructured":"Boudiaf, M., Kervadec, H., Masud, Z. I., Piantanida, P., Ben Ayed, I., & Dolz, J. (2021) Few-shot segmentation without meta-learning: A good transductive inference is all you need? In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 13979\u201313988","DOI":"10.1109\/CVPR46437.2021.01376"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02545-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02545-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02545-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,12]],"date-time":"2025-11-12T06:27:29Z","timestamp":1762928849000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02545-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,4]]},"references-count":47,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2025,11]]}},"alternative-id":["2545"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02545-w","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"type":"print","value":"0920-5691"},{"type":"electronic","value":"1573-1405"}],"subject":[],"published":{"date-parts":[[2025,8,4]]},"assertion":[{"value":"7 November 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 July 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 August 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}