{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,23]],"date-time":"2026-07-23T21:32:14Z","timestamp":1784842334488,"version":"3.55.0"},"reference-count":71,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T00:00:00Z","timestamp":1768867200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T00:00:00Z","timestamp":1768867200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62371157"],"award-info":[{"award-number":["62371157"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1007\/s11263-025-02728-5","type":"journal-article","created":{"date-parts":[[2026,1,20]],"date-time":"2026-01-20T09:30:03Z","timestamp":1768901403000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Weakly Supervised Salient Object Detection with Text Supervision"],"prefix":"10.1007","volume":"134","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2704-0614","authenticated-orcid":false,"given":"Zhihao","family":"Wu","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jie","family":"Wen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Linlin","family":"Shen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xiaopeng","family":"Fan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yong","family":"Xu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jian","family":"Yang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"David","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2026,1,20]]},"reference":[{"key":"2728_CR1","doi-asserted-by":"crossref","unstructured":"Achanta, R., Hemami, S., Estrada, F., & Susstrunk, S. (2009). Frequency-tuned salient region detection. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 1597\u20131604. IEEE","DOI":"10.1109\/CVPR.2009.5206596"},{"key":"2728_CR2","doi-asserted-by":"crossref","unstructured":"Araslanov, N., & Roth, S. (2020). Single-stage semantic segmentation from image labels. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4253\u20134262.","DOI":"10.1109\/CVPR42600.2020.00431"},{"key":"2728_CR3","doi-asserted-by":"crossref","unstructured":"Bylinskii, Z., Recasens, A., Borji, A., Oliva, A., Torralba, A., & Durand, F. (2016). Where should saliency models look next? In: Proceedings of the European Conference on Computer Vision, pp. 809\u2013824. Springer","DOI":"10.1007\/978-3-319-46454-1_49"},{"key":"2728_CR4","unstructured":"Chen, G., & Fan, X. (2018). Autofocus window selection algorithm based on saliency detection. In: Sixth International Conference on Optical and Photonic Engineering, vol. 10827, pp. 340\u2013346. SPIE"},{"key":"2728_CR5","unstructured":"Chen, X., Fan, H., Girshick, R., & He, K. (2020). Improved baselines with momentum contrastive learning. arXiv preprint arXiv:2003.04297"},{"issue":"11","key":"2728_CR6","doi-asserted-by":"publisher","first-page":"8006","DOI":"10.1109\/TPAMI.2021.3107956","volume":"44","author":"M-M Cheng","year":"2021","unstructured":"Cheng, M.-M., Gao, S.-H., Borji, A., Tan, Y.-Q., Lin, Z., & Wang, M. (2021). A highly efficient model to study the semantics of salient object detection. IEEE Transactions on Pattern Analysis and Machine Intelligence,44(11), 8006\u20138021.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2728_CR7","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1007\/s00371-013-0867-4","volume":"30","author":"M-M Cheng","year":"2014","unstructured":"Cheng, M.-M., Mitra, N. J., Huang, X., & Hu, S.-M. (2014). Salientshape: group saliency in image collections. The visual Computer,30, 443\u2013453.","journal-title":"The visual Computer"},{"issue":"2","key":"2728_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3177745","volume":"14","author":"M Cornia","year":"2018","unstructured":"Cornia, M., Baraldi, L., Serra, G., & Cucchiara, R. (2018). Paying more attention to saliency: Image captioning with saliency and context attention. ACM Transactions on Multimedia Computing, Communications, and Applications,14(2), 1\u201321.","journal-title":"ACM Transactions on Multimedia Computing, Communications, and Applications"},{"key":"2728_CR9","doi-asserted-by":"publisher","first-page":"90","DOI":"10.1016\/j.cviu.2017.10.001","volume":"163","author":"A Das","year":"2017","unstructured":"Das, A., Agrawal, H., Zitnick, L., Parikh, D., & Batra, D. (2017). Human attention in visual question answering: Do humans and deep networks look at the same regions? Computer Vision and Image Understanding,163, 90\u2013100.","journal-title":"Computer Vision and Image Understanding"},{"key":"2728_CR10","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.-J., Li, K., & Fei-Fei, L. (2009). Imagenet: A large-scale hierarchical image database. In: Proceedings of the 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 248\u2013255.","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"2728_CR11","doi-asserted-by":"crossref","unstructured":"Fan, D.-P., Gong, C., Cao, Y., Ren, B., Cheng, M.-M., & Borji, A. (2018). Enhanced-alignment measure for binary foreground map evaluation. arXiv preprint arXiv:1805.10421","DOI":"10.24963\/ijcai.2018\/97"},{"issue":"2","key":"2728_CR12","doi-asserted-by":"publisher","first-page":"2344","DOI":"10.1109\/TPAMI.2022.3166451","volume":"45","author":"D-P Fan","year":"2022","unstructured":"Fan, D.-P., Zhang, J., Xu, G., Cheng, M.-M., & Shao, L. (2022). Salient objects in clutter. IEEE Transactions on Pattern Analysis and Machine Intelligence,45(2), 2344\u20132366.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2728_CR13","unstructured":"Fu, C., Chen, P., Shen, Y., Qin, Y., Zhang, M., Lin, X., Qiu, Z., Lin, W., Yang, J., Zheng, X., et al. (2023). Mme: A comprehensive evaluation benchmark for multimodal large language models. arXiv preprint arXiv:2306.13394"},{"key":"2728_CR14","doi-asserted-by":"crossref","unstructured":"Gao, S., Zhang, W., Wang, Y., Guo, Q., Zhang, C., He, Y., & Zhang, W. (2022). Weakly-supervised salient object detection using point supervison. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 36, pp. 670\u2013678.","DOI":"10.1609\/aaai.v36i1.19947"},{"key":"2728_CR15","doi-asserted-by":"crossref","unstructured":"He, S., Tavakoli, H.R., Borji, A., & Pugeault, N. (2019). Human attention in image captioning: Dataset and analysis. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 8529\u20138538.","DOI":"10.1109\/ICCV.2019.00862"},{"key":"2728_CR16","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"2728_CR17","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., & Sun, G. (2018). Squeeze-and-excitation networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7132\u20137141.","DOI":"10.1109\/CVPR.2018.00745"},{"key":"2728_CR18","doi-asserted-by":"crossref","unstructured":"Kirillov, A., Mintun, E., Ravi, N., Mao, H., Rolland, C., Gustafson, L., Xiao, T., Whitehead, S., Berg, A.C., & Lo, W.-Y. (2023). Segment anything. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 4015\u20134026","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"2728_CR19","unstructured":"Kr\u00e4henb\u00fchl, P., & Koltun, V. (2011). Efficient inference in fully connected crfs with gaussian edge potentials. In: Advances in Neural Information Processing Systems, vol. 24."},{"key":"2728_CR20","doi-asserted-by":"crossref","unstructured":"Li, G., & Yu, Y. (2015). Visual saliency based on multiscale deep features. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5455\u20135463.","DOI":"10.1109\/CVPR.2015.7299184"},{"key":"2728_CR21","doi-asserted-by":"crossref","unstructured":"Li, Y., Hou, X., Koch, C., Rehg, J.M., & Yuille, A.L. (2014). The secrets of salient object segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 280\u2013287.","DOI":"10.1109\/CVPR.2014.43"},{"key":"2728_CR22","doi-asserted-by":"crossref","unstructured":"Li, G., Xie, Y., & Lin, L. (2018). Weakly supervised salient object detection using image labels. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 32.","DOI":"10.1609\/aaai.v32i1.12308"},{"key":"2728_CR23","doi-asserted-by":"crossref","unstructured":"Lin, Y., Chen, M., Wang, W., Wu, B., Li, K., Lin, B., Liu, H., & He, X. (2023). Clip is also an efficient segmenter: A text-driven approach for weakly supervised semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 15305\u201315314","DOI":"10.1109\/CVPR52729.2023.01469"},{"key":"2728_CR24","doi-asserted-by":"crossref","unstructured":"Lin, X., Wu, Z., Chen, G., Li, G., & Yu, Y. (2022). A causal debiasing framework for unsupervised salient object detection. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 36, pp. 1610\u20131619.","DOI":"10.1609\/aaai.v36i2.20052"},{"key":"2728_CR25","doi-asserted-by":"publisher","first-page":"9165","DOI":"10.1109\/TIP.2020.3023774","volume":"29","author":"X Li","year":"2020","unstructured":"Li, X., Song, D., & Dong, Y. (2020). Hierarchical feature fusion network for salient object detection. IEEE Transactions on Image Processing,29, 9165\u20139175.","journal-title":"IEEE Transactions on Image Processing"},{"issue":"1","key":"2728_CR26","doi-asserted-by":"publisher","first-page":"887","DOI":"10.1109\/TPAMI.2021.3140168","volume":"45","author":"J-J Liu","year":"2022","unstructured":"Liu, J.-J., Hou, Q., Liu, Z.-A., & Cheng, M.-M. (2022). Poolnet+: Exploring the potential of pooling for salient object detection. IEEE Transactions on Pattern Analysis and Machine Intelligence,45(1), 887\u2013904.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2728_CR27","doi-asserted-by":"publisher","first-page":"4423","DOI":"10.1109\/TIP.2021.3071691","volume":"30","author":"Y Liu","year":"2021","unstructured":"Liu, Y., Wang, P., Cao, Y., Liang, Z., & Lau, R. W. (2021). Weakly-supervised salient object detection with saliency bounding boxes. IEEE Transactions on Image Processing,30, 4423\u20134435.","journal-title":"IEEE Transactions on Image Processing"},{"issue":"2","key":"2728_CR28","doi-asserted-by":"crossref","first-page":"353","DOI":"10.1109\/TPAMI.2010.70","volume":"33","author":"T Liu","year":"2010","unstructured":"Liu, T., Yuan, Z., Sun, J., Wang, J., Zheng, N., Tang, X., & Shum, H.-Y. (2010). Learning to detect a salient object. IEEE Transactions on Pattern Analysis and Machine Intelligence,33(2), 353\u2013367.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"3","key":"2728_CR29","doi-asserted-by":"publisher","first-page":"541","DOI":"10.1109\/TPAMI.2012.98","volume":"35","author":"V Mahadevan","year":"2012","unstructured":"Mahadevan, V., & Vasconcelos, N. (2012). Biologically inspired object tracking using center-surround saliency mechanisms. IEEE Transactions on Pattern Analysis and Machine Intelligence,35(3), 541\u2013554.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"11","key":"2728_CR30","doi-asserted-by":"publisher","first-page":"2415","DOI":"10.1109\/TMM.2017.2694219","volume":"19","author":"C Ma","year":"2017","unstructured":"Ma, C., Miao, Z., Zhang, X.-P., & Li, M. (2017). A saliency prior context model for real-time object tracking. IEEE Transactions on Multimedia,19(11), 2415\u20132424.","journal-title":"IEEE Transactions on Multimedia"},{"key":"2728_CR31","doi-asserted-by":"publisher","first-page":"124","DOI":"10.1016\/j.patrec.2019.04.011","volume":"125","author":"N Mu","year":"2019","unstructured":"Mu, N., Xu, X., & Zhang, X. (2019). Finding autofocus region in low contrast surveillance images using cnn-based saliency algorithm. Pattern Recognition Letters,125, 124\u2013132.","journal-title":"Pattern Recognition Letters"},{"key":"2728_CR32","unstructured":"Nguyen, T., Dax, M., Mummadi, C.K., Ngo, N., Nguyen, T.H.P., Lou, Z., & Brox, T. (2019). Deepusps: Deep robust unsupervised saliency prediction via self-supervision. In: Advances in Neural Information Processing Systems, vol. 32."},{"key":"2728_CR33","doi-asserted-by":"crossref","unstructured":"Peng, S., Jiang, W., Pi, H., Li, X., Bao, H., & Zhou, X. (2020). Deep snake for real-time instance segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8533\u20138542.","DOI":"10.1109\/CVPR42600.2020.00856"},{"key":"2728_CR34","doi-asserted-by":"crossref","unstructured":"Perazzi, F., Kr\u00e4henb\u00fchl, P., Pritch, Y., & Hornung, A. (2012). Saliency filters: Contrast based filtering for salient region detection. In: 2012 IEEE Conference on Computer Vision and Pattern Recognition, pp. 733\u2013740. IEEE","DOI":"10.1109\/CVPR.2012.6247743"},{"key":"2728_CR35","doi-asserted-by":"crossref","unstructured":"Piao, Y., Wang, J., Zhang, M., & Lu, H. (2021). Mfnet: Multi-filter directive network for weakly supervised salient object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 4136\u20134145.","DOI":"10.1109\/ICCV48922.2021.00410"},{"key":"2728_CR36","doi-asserted-by":"crossref","unstructured":"Piao, Y., Wu, W., Zhang, M., Jiang, Y., Lu, H.: Noise-sensitive adversarial learning for weakly supervised salient object detection. IEEE Transactions on Multimedia (2022)","DOI":"10.1109\/TMM.2022.3152567"},{"key":"2728_CR37","unstructured":"Radford, A., Kim, J.W., Hallacy, C., Ramesh, A., Goh, G., Agarwal, S., Sastry, G., Askell, A., Mishkin, P., & Clark, J. (2021). Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763. PMLR"},{"key":"2728_CR38","doi-asserted-by":"crossref","unstructured":"Selvaraju, R.R., Cogswell, M., Das, A., Vedantam, R., Parikh, D., & Batra, D. (2017). Grad-cam: Visual explanations from deep networks via gradient-based localization. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 618\u2013626.","DOI":"10.1109\/ICCV.2017.74"},{"key":"2728_CR39","doi-asserted-by":"crossref","unstructured":"Shin, G., Albanie, S., & Xie, W. (2022). Unsupervised salient object detection with spectral cluster voting. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3971\u20133980.","DOI":"10.1109\/CVPRW56347.2022.00442"},{"key":"2728_CR40","unstructured":"Shin, G., Xie, W., & Albanie, S. (2022). Reco: Retrieve and co-segment for zero-shot transfer. In: Advances in Neural Information Processing Systems, vol. 35, pp. 33754\u201333767."},{"key":"2728_CR41","doi-asserted-by":"crossref","unstructured":"Sim\u00e9oni, O., Sekkat, C., Puy, G., Vobeck\u1ef3, A., Zablocki, \u00c9., & P\u00e9rez, P. (2023). Unsupervised object localization: Observing the background to discover objects. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3176\u20133186","DOI":"10.1109\/CVPR52729.2023.00310"},{"key":"2728_CR42","doi-asserted-by":"crossref","unstructured":"Song, D., Dong, Y., & Li, X. (2023). Adjacent complementary network for salient object detection in optical remote sensing images. IEEE Transactions on Geoscience and Remote Sensing","DOI":"10.1109\/TGRS.2023.3276894"},{"key":"2728_CR43","doi-asserted-by":"publisher","first-page":"7567","DOI":"10.1109\/TIP.2021.3106798","volume":"30","author":"D Song","year":"2021","unstructured":"Song, D., Dong, Y., & Li, X. (2021). Hierarchical edge refinement network for saliency detection. IEEE Transactions on Image Processing,30, 7567\u20137577.","journal-title":"IEEE Transactions on Image Processing"},{"key":"2728_CR44","doi-asserted-by":"crossref","unstructured":"Tian, X., Zhang, J., Xiang, M., & Dai, Y. (2023). Modeling the distributional uncertainty for salient object detection models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 19660\u201319670.","DOI":"10.1109\/CVPR52729.2023.01883"},{"key":"2728_CR45","doi-asserted-by":"crossref","unstructured":"Veksler, O. (2023). Test time adaptation with regularized loss for weakly supervised salient object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7360\u20137369.","DOI":"10.1109\/CVPR52729.2023.00711"},{"key":"2728_CR46","doi-asserted-by":"crossref","unstructured":"Wang, L., Lu, H., Wang, Y., Feng, M., Wang, D., Yin, B., & Ruan, X. (2017). Learning to detect salient objects with image-level supervision. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 136\u2013145.","DOI":"10.1109\/CVPR.2017.404"},{"key":"2728_CR47","doi-asserted-by":"crossref","unstructured":"Wang, Y., Zhang, W., Wang, L., Liu, T., & Lu, H. (2022). Multi-source uncertainty mining for deep unsupervised saliency detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11727\u201311736.","DOI":"10.1109\/CVPR52688.2022.01143"},{"key":"2728_CR48","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.110579","volume":"154","author":"Y Wang","year":"2024","unstructured":"Wang, Y., Wang, R., He, X., Lin, C., Wang, T., Jia, Q., & Fan, X. (2024). Wbnet: Weakly-supervised salient object detection via scribble and pseudo-background priors. Pattern Recognition,154, Article 110579.","journal-title":"Pattern Recognition"},{"issue":"7","key":"2728_CR49","doi-asserted-by":"publisher","first-page":"1734","DOI":"10.1109\/TPAMI.2018.2846598","volume":"41","author":"L Wang","year":"2018","unstructured":"Wang, L., Wang, L., Lu, H., Zhang, P., & Ruan, X. (2018). Salient object detection with recurrent fully convolutional networks. IEEE Transactions on Pattern Analysis and Machine Intelligence,41(7), 1734\u20131746.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"5","key":"2728_CR50","doi-asserted-by":"publisher","first-page":"8565","DOI":"10.1109\/TNNLS.2024.3436519","volume":"36","author":"Z Wu","year":"2025","unstructured":"Wu, Z., Liu, C., Wen, J., Xu, Y., Yang, J., & Li, X. (2025). Spatial continuity and nonequal importance in salient object detection with image-category supervision. IEEE Transactions on Neural Networks and Learning Systems,36(5), 8565\u20138576.","journal-title":"IEEE Transactions on Neural Networks and Learning Systems"},{"key":"2728_CR51","doi-asserted-by":"crossref","unstructured":"Xie, J., Hou, X., Ye, K., Shen, L. (2022). Clims: Cross language image matching for weakly supervised semantic segmentation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4483\u20134492.","DOI":"10.1109\/CVPR52688.2022.00444"},{"issue":"1","key":"2728_CR52","doi-asserted-by":"publisher","first-page":"248","DOI":"10.1109\/TCSVT.2023.3284076","volume":"34","author":"B Xu","year":"2023","unstructured":"Xu, B., Liang, H., Gong, W., Liang, R., & Chen, P. (2023). A visual representation-guided framework with global affinity for weakly supervised salient object detection. IEEE Transactions on Circuits and Systems for Video Technology,34(1), 248\u2013259.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"key":"2728_CR53","doi-asserted-by":"crossref","unstructured":"Yan, Q., Xu, L., Shi, J., & Jia, J. (2013). Hierarchical saliency detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1155\u20131162.","DOI":"10.1109\/CVPR.2013.153"},{"key":"2728_CR54","doi-asserted-by":"crossref","unstructured":"Yang, X., & Gong, X. (2024). Foundation model assisted weakly supervised semantic segmentation. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 523\u2013532.","DOI":"10.1109\/WACV57701.2024.00058"},{"key":"2728_CR55","doi-asserted-by":"crossref","unstructured":"Yang, C., Zhang, L., Lu, H., Ruan, X., & Yang, M.-H. (2013). Saliency detection via graph-based manifold ranking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3166\u20133173.","DOI":"10.1109\/CVPR.2013.407"},{"key":"2728_CR56","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.110330","volume":"150","author":"Y Yi","year":"2024","unstructured":"Yi, Y., Zhang, N., Zhou, W., Shi, Y., Xie, G., & Wang, J. (2024). Gponet: A two-stream gated progressive optimization network for salient object detection. Pattern Recognition,150, Article 110330.","journal-title":"Pattern Recognition"},{"key":"2728_CR57","doi-asserted-by":"crossref","unstructured":"Yu, S., Zhang, B., Xiao, J., & Lim, E.G. (2021). Structure-consistent weakly supervised salient object detection with local saliency coherence. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 35, pp. 3234\u20133242.","DOI":"10.1609\/aaai.v35i4.16434"},{"key":"2728_CR58","doi-asserted-by":"publisher","first-page":"4667","DOI":"10.1109\/TMM.2023.3325731","volume":"26","author":"YK Yun","year":"2023","unstructured":"Yun, Y. K., & Lin, W. (2023). Towards a complete and detail-preserved salient object detection. IEEE Transactions on Multimedia,26, 4667\u20134680.","journal-title":"IEEE Transactions on Multimedia"},{"key":"2728_CR59","doi-asserted-by":"crossref","unstructured":"Zeng, Y., Zhuge, Y., Lu, H., Zhang, L., Qian, M., Yu, Y. (2019). Multi-source weak supervision for saliency detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6074\u20136083.","DOI":"10.1109\/CVPR.2019.00623"},{"key":"2728_CR60","doi-asserted-by":"crossref","unstructured":"Zhang, D., Han, J., & Zhang, Y. (2017). Supervision by fusion: Towards unsupervised learning of deep salient object detector. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 4048\u20134056.","DOI":"10.1109\/ICCV.2017.436"},{"key":"2728_CR61","doi-asserted-by":"crossref","unstructured":"Zhang, J., Xie, J., & Barnes, N. (2020). Learning noise-aware encoder-decoder from noisy labels by alternating back-propagation for saliency detection. In: Proceedings of the European Conference on Computer Vision, pp. 349\u2013366. Springer","DOI":"10.1007\/978-3-030-58520-4_21"},{"key":"2728_CR62","doi-asserted-by":"crossref","unstructured":"Zhang, J., Yu, X., Li, A., Song, P., Liu, B., & Dai, Y. (2020) Weakly-supervised salient object detection via scribble annotations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12546\u201312555.","DOI":"10.1109\/CVPR42600.2020.01256"},{"key":"2728_CR63","doi-asserted-by":"crossref","unstructured":"Zhang, J., Zhang, T., Dai, Y., Harandi, M., & Hartley, R. (2018). Deep unsupervised saliency detection: A multiple noisy labeling perspective. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 9029\u20139038.","DOI":"10.1109\/CVPR.2018.00941"},{"issue":"8","key":"2728_CR64","doi-asserted-by":"publisher","first-page":"2866","DOI":"10.1109\/TPAMI.2020.3046486","volume":"43","author":"J Zhang","year":"2021","unstructured":"Zhang, J., Dai, Y., Zhang, T., Harandi, M., Barnes, N., & Hartley, R. (2021). Learning saliency from single noisy labelling: A robust model fitting perspective. IEEE Transactions on Pattern Analysis and Machine Intelligence,43(8), 2866\u20132873.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2728_CR65","doi-asserted-by":"crossref","unstructured":"Zhang, F., Du, B., & Zhang, L. (2014). Saliency-guided unsupervised feature learning for scene classification. IEEE Transactions on Geoscience and Remote Sensing,53(4), 2175\u20132184.","DOI":"10.1109\/TGRS.2014.2357078"},{"key":"2728_CR66","doi-asserted-by":"crossref","unstructured":"Zhou, C., Loy, C.C., & Dai, B. (2022). Extract free dense labels from clip. In: Proceedings of the European Conference on Computer Vision, pp. 696\u2013712. Springer","DOI":"10.1007\/978-3-031-19815-1_40"},{"key":"2728_CR67","doi-asserted-by":"crossref","unstructured":"Zhou, Z., Pei, W., Li, X., Wang, H., Zheng, F., & He, Z. (2021). Saliency-associated object tracking. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9866\u20139875","DOI":"10.1109\/ICCV48922.2021.00972"},{"key":"2728_CR68","doi-asserted-by":"crossref","unstructured":"Zhou, H., Qiao, B., Yang, L., Lai, J., & Xie, X. (2023). Texture-guided saliency distilling for unsupervised salient object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7257\u20137267.","DOI":"10.1109\/CVPR52729.2023.00701"},{"issue":"2","key":"2728_CR69","doi-asserted-by":"publisher","first-page":"743","DOI":"10.1109\/TCSVT.2022.3203595","volume":"33","author":"H Zhou","year":"2022","unstructured":"Zhou, H., Chen, P., Yang, L., Xie, X., & Lai, J. (2022). Activation to saliency: Forming high-quality labels for unsupervised salient object detection. IEEE Transactions on Circuits and Systems for Video Technology,33(2), 743\u2013755.","journal-title":"IEEE Transactions on Circuits and Systems for Video Technology"},{"key":"2728_CR70","doi-asserted-by":"publisher","first-page":"694","DOI":"10.1109\/TIP.2019.2928144","volume":"29","author":"L Zhou","year":"2019","unstructured":"Zhou, L., Zhang, Y., Jiang, Y.-G., Zhang, T., & Fan, W. (2019). Re-caption: Saliency-enhanced image captioning through two-phase learning. IEEE Transactions on Image Processing,29, 694\u2013709.","journal-title":"IEEE Transactions on Image Processing"},{"issue":"3","key":"2728_CR71","first-page":"3738","volume":"45","author":"M Zhuge","year":"2022","unstructured":"Zhuge, M., Fan, D.-P., Liu, N., Zhang, D., Xu, D., & Shao, L. (2022). Salient object detection via integrity learning. IEEE Transactions on Pattern Analysis and Machine Intelligence,45(3), 3738\u20133752.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02728-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02728-5","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02728-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,17]],"date-time":"2026-02-17T15:20:49Z","timestamp":1771341649000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02728-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,20]]},"references-count":71,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2026,2]]}},"alternative-id":["2728"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02728-5","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,20]]},"assertion":[{"value":"18 May 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 December 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"74"}}