{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,8]],"date-time":"2025-09-08T06:22:12Z","timestamp":1757312532765,"version":"3.28.0"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2024,1,18]],"date-time":"2024-01-18T00:00:00Z","timestamp":1705536000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,18]],"date-time":"2024-01-18T00:00:00Z","timestamp":1705536000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Natural Science Foundation of China under Grant","award":["No.61671283"],"award-info":[{"award-number":["No.61671283"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2024,11]]},"DOI":"10.1007\/s00371-023-03234-w","type":"journal-article","created":{"date-parts":[[2024,1,18]],"date-time":"2024-01-18T15:03:49Z","timestamp":1705590229000},"page":"8227-8242","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Salient-aware multiple instance learning optimized network for weakly supervised object detection"],"prefix":"10.1007","volume":"40","author":[{"given":"Han","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yongfang","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yingjie","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,1,18]]},"reference":[{"key":"3234_CR1","doi-asserted-by":"publisher","unstructured":"Bilen H, Vedaldi A.: Weakly supervised deep detection networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition. 2846\u20132854(2016). https:\/\/doi.org\/10.1109\/CVPR.2016.311.","DOI":"10.1109\/CVPR.2016.311"},{"key":"3234_CR2","doi-asserted-by":"publisher","unstructured":"Zhou B, Khosla A, Lapedriza A, et al.: Learning deep features for discriminative localization. In: Proceedings of the IEEE conference on computer vision and pattern recognition. 2921\u20132929(2016). https:\/\/doi.org\/10.1109\/CVPR.2016.319.","DOI":"10.1109\/CVPR.2016.319"},{"key":"3234_CR3","doi-asserted-by":"publisher","unstructured":"Wan F, Liu C, Ke W, et al.: C-mil: Continuation multiple instance learning for weakly supervised object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 2199\u20132208(2019). https:\/\/doi.org\/10.48550\/arXiv.1904.05647.","DOI":"10.48550\/arXiv.1904.05647"},{"key":"3234_CR4","doi-asserted-by":"publisher","unstructured":"Tang P, Wang X, Bai X, et al.: Multiple instance detection network with online instance classifier refinement. In: Proceedings of the IEEE conference on computer vision and pattern recognition. 2843\u20132851(2017). https:\/\/doi.org\/10.48550\/arXiv.1704.00138.","DOI":"10.48550\/arXiv.1704.00138"},{"issue":"1","key":"3234_CR5","doi-asserted-by":"publisher","first-page":"176","DOI":"10.1109\/TPAMI.2018.2876304","volume":"42","author":"P Tang","year":"2018","unstructured":"Tang, P., Wang, X., Bai, S., et al.: Pcl: Proposal cluster learning for weakly supervised object detection[J]. IEEE Trans. Pattern Anal. Mach. Intell. 42(1), 176\u2013191 (2018). https:\/\/doi.org\/10.1109\/TPAMI.2018.2876304","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"3234_CR6","doi-asserted-by":"publisher","unstructured":"Lin C, Wang S, Xu D, et al.: Object instance mining for weakly supervised object detection. In: Proceedings of the AAAI Conference on Artificial Intelligence. 34(07), 11482\u201311489(2020). https:\/\/doi.org\/10.48550\/arXiv.2002.01087","DOI":"10.48550\/arXiv.2002.01087"},{"key":"3234_CR7","doi-asserted-by":"publisher","unstructured":"Ren Z, Yu Z, Yang X, et al.: Instance-aware, context-focused, and memory-efficient weakly supervised object detection.In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 10598\u201310607(2020). https:\/\/doi.org\/10.48550\/arXiv.2004.04725","DOI":"10.48550\/arXiv.2004.04725"},{"key":"3234_CR8","doi-asserted-by":"publisher","unstructured":"Gao M, Li A, Yu R, et al.: C-wsl: Count-guided weakly supervised localization. In: Proceedings of the European conference on computer vision (ECCV). 152\u2013168(2018). https:\/\/doi.org\/10.48550\/arXiv.1711.05282","DOI":"10.48550\/arXiv.1711.05282"},{"key":"3234_CR9","doi-asserted-by":"publisher","unstructured":"Yang K, Li D, Dou Y.: Towards precise end-to-end weakly supervised object detection network. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision. 8372\u20138381(2019). https:\/\/doi.org\/10.48550\/arXiv.1911.12148","DOI":"10.48550\/arXiv.1911.12148"},{"key":"3234_CR10","doi-asserted-by":"publisher","unstructured":"Girshick R.: Fast r-cnn. In: Proceedings of the IEEE international conference on computer vision. 1440\u20131448(2015). https:\/\/doi.org\/10.1109\/ICCV.2015.169","DOI":"10.1109\/ICCV.2015.169"},{"key":"3234_CR11","doi-asserted-by":"publisher","unstructured":"Ren S, He K, Girshick R, et al.: Faster r-cnn: Towards real-time object detection with region proposal networks[J]. Advances in neural information processing systems, 28(2015). https:\/\/doi.org\/10.48550\/arXiv.1506.01497","DOI":"10.48550\/arXiv.1506.01497"},{"key":"3234_CR12","doi-asserted-by":"publisher","unstructured":"Tang Y, Wang X, Dellandrea E, et al.: Fusing generic objectness and deformable part-based models for weakly supervised object detection. In: 2014 IEEE International Conference on Image Processing (ICIP). IEEE, 4072\u20134076(2014). https:\/\/doi.org\/10.1109\/ICIP.2014.7025827","DOI":"10.1109\/ICIP.2014.7025827"},{"issue":"1","key":"3234_CR13","doi-asserted-by":"publisher","first-page":"62","DOI":"10.1109\/tsmc.1979.4310076","volume":"9","author":"N Otsu","year":"1979","unstructured":"Otsu, N.: A threshold selection method from gray-level histograms[J]. IEEE Trans. Syst. Man Cybern. 9(1), 62\u201366 (1979). https:\/\/doi.org\/10.1109\/tsmc.1979.4310076","journal-title":"IEEE Trans. Syst. Man Cybern."},{"issue":"3","key":"3234_CR14","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., et al.: Imagenet large scale visual recognition challenge[J]. Int. J. Comput. Vision 115(3), 211\u2013252 (2015). https:\/\/doi.org\/10.1007\/s11263-015-0816-y","journal-title":"Int. J. Comput. Vision"},{"key":"3234_CR15","doi-asserted-by":"publisher","unstructured":"Zeng Z, Liu B, Fu J, et al: Wsod2: Learning bottom-up and top-down objectness distillation for weakly-supervised object detection. In: Proceedings of the IEEE\/CVF international conference on computer vision. 8292\u20138300(2019). https:\/\/doi.org\/10.48550\/arXiv.1909.04972","DOI":"10.48550\/arXiv.1909.04972"},{"key":"3234_CR16","doi-asserted-by":"publisher","unstructured":"Singh K.K, Xiao F, Lee Y J.: Track and transfer: Watching videos to simulate strong human supervision for weakly-supervised object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 3548\u20133556(2016). https:\/\/doi.org\/10.48550\/arXiv.1604.05766","DOI":"10.48550\/arXiv.1604.05766"},{"key":"3234_CR17","first-page":"16797","volume":"33","author":"ZY HuangZ","year":"2020","unstructured":"HuangZ, Z.Y., Kumar, K.B.V., et al.: Comprehensive attention self-distillation for weakly-supervised object detection[J]. Adv. Neural Inform. Process. Syst. 33, 16797\u201316807 (2020)","journal-title":"Adv. Neural Inform. Process. Syst."},{"key":"3234_CR18","doi-asserted-by":"publisher","first-page":"104356","DOI":"10.1109\/ACCESS.2021.3099497","volume":"9","author":"Q Yuan","year":"2021","unstructured":"Yuan, Q., Sun, G., Liang, J., et al.: Efficient weakly-supervised object detection with pseudo annotations[J]. IEEE Access. 9, 104356\u2013104366 (2021). https:\/\/doi.org\/10.1109\/ACCESS.2021.3099497","journal-title":"IEEE Access."},{"key":"3234_CR19","doi-asserted-by":"publisher","unstructured":"Li X, Kan M, Shan S, et al.: Weakly supervised object detection with segmentation collaboration. In: Proceedings of the IEEE\/CVF international conference on computer vision. 9735\u20139744(2019). https:\/\/doi.org\/10.48550\/arXiv.1904.00551","DOI":"10.48550\/arXiv.1904.00551"},{"key":"3234_CR20","doi-asserted-by":"publisher","unstructured":"Chen C.Y, Hsu H.W.: Saliency aware: Weakly supervised object localization.In: ICASSP 2019\u20132019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE. 1907\u20131911(2019). https:\/\/doi.org\/10.1109\/ICASSP.2019.8682756","DOI":"10.1109\/ICASSP.2019.8682756"},{"key":"3234_CR21","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2021.107726","volume":"237","author":"R Jin","year":"2022","unstructured":"Jin, R., Lin, G., Wen, C.: Online active proposal set generation for weakly supervised object detection[J]. Knowl.-Based Syst. 237, 107726 (2022). https:\/\/doi.org\/10.1016\/j.knosys.2021.107726","journal-title":"Knowl.-Based Syst."},{"key":"3234_CR22","doi-asserted-by":"publisher","unstructured":"Zhang X, Feng J, Xiong H, et al.: Zigzag learning for weakly supervised object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 4262\u20134270(2018). https:\/\/doi.org\/10.48550\/arXiv.1804.09466","DOI":"10.48550\/arXiv.1804.09466"},{"key":"3234_CR23","doi-asserted-by":"publisher","unstructured":"A Dib , V Sharma, A Pazandeh, et al. Weakly supervised cascaded convolutional networks. In: Proceedings of the IEEE conference on computer vision and pattern recognition. 2017: 914\u2013922. https:\/\/doi.org\/10.48550\/arXiv.1611.08258","DOI":"10.48550\/arXiv.1611.08258"},{"key":"3234_CR24","doi-asserted-by":"publisher","unstructured":"Tang P, Wang X, Wang A, et al.: Weakly supervised region proposal network and object detection. In: Proceedings of the European conference on computer vision (ECCV). 352\u2013368(2018). https:\/\/doi.org\/10.1007\/978-3-030-01252-6_22","DOI":"10.1007\/978-3-030-01252-6_22"},{"key":"3234_CR25","first-page":"7005","volume":"33","author":"Y Shen","year":"2020","unstructured":"Shen, Y., Ji, R., Chen, Z., et al.: UWSOD: Toward fully-supervised-level capacity weakly supervised object detection[J]. Adv. Neural. Inf. Process. Syst. 33, 7005\u20137019 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"3234_CR26","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3046647","author":"D Zhang","year":"2020","unstructured":"Zhang, D., Zeng, W., Yao, J., et al.: Weakly supervised object detection using proposal-and semantic-level relationships[J]. IEEE Trans. Pattern Anal. Mach. Intell. (2020). https:\/\/doi.org\/10.1109\/TPAMI.2020.3046647","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"3234_CR27","doi-asserted-by":"publisher","unstructured":"Shen Y, Ji R, Wang Y, et al.: Enabling deep residual networks for weakly supervised object detection. In: European Conference on Computer Vision. Springer, Cham. 118\u2013136(2020). https:\/\/doi.org\/10.1007\/978-3-030-58598-3_8","DOI":"10.1007\/978-3-030-58598-3_8"},{"key":"3234_CR28","doi-asserted-by":"publisher","unstructured":"Kosugi S, Yamasaki T, Aizawa K. Object-aware instance labeling for weakly supervised object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision. 6064\u20136072(2019). https:\/\/doi.org\/10.48550\/arXiv.1908.03792","DOI":"10.48550\/arXiv.1908.03792"},{"key":"3234_CR29","doi-asserted-by":"publisher","unstructured":"Li Y, Qian Y, Yang X, et al.: Activity and Relationship Modeling Driven Weakly Supervised Object Detection. In: 2020 25th International Conference on Pattern Recognition (ICPR). IEEE. 9628\u20139634(2021). https:\/\/doi.org\/10.1109\/ICPR48806.2021.9412697","DOI":"10.1109\/ICPR48806.2021.9412697"},{"key":"3234_CR30","doi-asserted-by":"publisher","unstructured":"Zhong Y, Wang J, Peng J, et al.: Boosting weakly supervised object detection with progressive knowledge transfer. In: European conference on computer vision. Springer, Cham. 615\u2013631(2020). https:\/\/doi.org\/10.48550\/arXiv.2007.07986","DOI":"10.48550\/arXiv.2007.07986"},{"key":"3234_CR31","doi-asserted-by":"publisher","unstructured":"Dong B, Huang Z, Guo Y, et al.: Boosting weakly supervised object detection via learning bounding box adjusters. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision. 2876\u20132885(2021). https:\/\/doi.org\/10.1109\/ICCV48922.2021.00287","DOI":"10.1109\/ICCV48922.2021.00287"},{"key":"3234_CR32","doi-asserted-by":"publisher","unstructured":"Wang J, Yao J, Zhang Y, et al.: Collaborative learning for weakly supervised object detection[J]. arXiv preprint arXiv:1802.03531, (2018). https:\/\/doi.org\/10.1109\/JSTARS.2022.3223845","DOI":"10.1109\/JSTARS.2022.3223845"},{"key":"3234_CR33","doi-asserted-by":"publisher","unstructured":"Gao Y, Liu B, Guo N, et al.: C-midn: Coupled multiple instance detection network with segmentation guidance for weakly supervised object detection. In: \/\/Proceedings of the IEEE\/CVF International Conference on Computer Vision. 9834\u20139843(2019). https:\/\/doi.org\/10.1109\/ICCV.2019.00993","DOI":"10.1109\/ICCV.2019.00993"},{"key":"3234_CR34","doi-asserted-by":"publisher","unstructured":"He K, Zhang X, Ren S, et al.: Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition. 770\u2013778(2016). https:\/\/doi.org\/10.1109\/CVPR.2016.90","DOI":"10.1109\/CVPR.2016.90"},{"key":"3234_CR35","doi-asserted-by":"publisher","unstructured":"Kim D, Cho D, Yoo D, et al.: Two-phase learning for weakly supervised object localization. In: Proceedings of the IEEE international conference on computer vision. 3534\u20133543(2017). https:\/\/doi.org\/10.1109\/ICCV.2017.382","DOI":"10.1109\/ICCV.2017.382"},{"key":"3234_CR36","doi-asserted-by":"publisher","unstructured":"Wei J, Wang Q, Li Z, et al.: Shallow feature matters for weakly supervised object localization. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 5993\u20136001(2021). https:\/\/doi.org\/10.48550\/arXiv.2108.00873","DOI":"10.48550\/arXiv.2108.00873"},{"key":"3234_CR37","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2022.104425","volume":"121","author":"Z Zhang","year":"2022","unstructured":"Zhang, Z., Chang, Y., Zhong, S., et al.: Learning dynamic background for weakly supervised moving object detection[J]. Image Vis. Comput. 121, 104425 (2022). https:\/\/doi.org\/10.1016\/j.imavis.2022.104425","journal-title":"Image Vis. Comput."},{"key":"3234_CR38","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.imavis.2016.08.015","volume":"56","author":"M Rochan","year":"2016","unstructured":"Rochan, M., Rahman, S., Bruce, B.N.D., et al.: Weakly supervised object localization and segmentation in videos[J]. Image Vision Comput. 56, 1\u201312 (2016)","journal-title":"Image Vision Comput."},{"issue":"2","key":"3234_CR39","doi-asserted-by":"publisher","first-page":"154","DOI":"10.1007\/s11263-013-0620-5","volume":"104","author":"JRR Uijlings","year":"2013","unstructured":"Uijlings, J.R.R., Van De Sande, K.E.A., Gevers, T., et al.: Selective search for object recognition[J]. Int. J. Comput. Vision 104(2), 154\u2013171 (2013). https:\/\/doi.org\/10.1007\/s11263-013-0620-5","journal-title":"Int. J. Comput. Vision"},{"key":"3234_CR40","doi-asserted-by":"publisher","unstructured":"Simonyan K, Zisserman A.: Very deep convolutional networks for large-scale image recognition[J]. arXiv preprint arXiv:1409.1556, (2014). https:\/\/doi.org\/10.48550\/arXiv.1409.1556","DOI":"10.48550\/arXiv.1409.1556"},{"key":"3234_CR41","doi-asserted-by":"publisher","unstructured":"Jiang H, Wang J, Yuan Z, et al.: Salient object detection: A discriminative regional feature integration approach. In: Proceedings of the IEEE conference on computer vision and pattern recognition. 2083\u20132090(2013) https:\/\/doi.org\/10.1007\/s11263-016-0977-3","DOI":"10.1007\/s11263-016-0977-3"},{"issue":"2","key":"3234_CR42","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham, M., Van Gool, L., Williams, I.C.K., et al.: The pascal visual object classes (voc) challenge[J]. Int. J. Comput. Vision 88(2), 303\u2013338 (2010)","journal-title":"Int. J. Comput. Vision"},{"issue":"1","key":"3234_CR43","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham, M., Eslami, S.M., Van Gool, L., et al.: The pascal visual object classes challenge: A retrospective[J]. Int. J. Comput. Vision 111(1), 98\u2013136 (2015). https:\/\/doi.org\/10.1007\/s11263-014-0733-5","journal-title":"Int. J. Comput. Vision"},{"issue":"11","key":"3234_CR44","doi-asserted-by":"publisher","first-page":"7885","DOI":"10.1109\/TPAMI.2021.3115815","volume":"44","author":"X Lu","year":"2021","unstructured":"Lu, X., Wang, W., Shen, J., et al.: Segmenting objects from relational visual data[J]. IEEE Trans. Pattern Anal. Mach. Intell. 44(11), 7885\u20137897 (2021). https:\/\/doi.org\/10.1109\/TPAMI.2021.3115815","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"5","key":"3234_CR45","doi-asserted-by":"publisher","first-page":"1192","DOI":"10.1109\/JAS.2023.123456","volume":"10","author":"Z Qin","year":"2023","unstructured":"Qin, Z., Lu, X., Nie, X., et al.: Coarse-to-fine video instance segmentation with factorized conditional appearance flows[J]. IEEE\/CAA J. Automat. Sinica 10(5), 1192\u20131208 (2023). https:\/\/doi.org\/10.1109\/JAS.2023.123456","journal-title":"IEEE\/CAA J. Automat. Sinica"},{"key":"3234_CR46","doi-asserted-by":"publisher","unstructured":"Lu X, Wang W, Ma C, et al. See more, know more: Unsupervised video object segmentation with co-attention siamese networks. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 3623\u20133632(2019). https:\/\/doi.org\/10.1109\/CVPR.2019.00374","DOI":"10.1109\/CVPR.2019.00374"},{"issue":"12","key":"3234_CR47","doi-asserted-by":"publisher","first-page":"8896","DOI":"10.1109\/TPAMI.2021.3127492","volume":"44","author":"J Shen","year":"2021","unstructured":"Shen, J., Liu, Y., Dong, X., et al.: Distilled Siamese networks for visual tracking[J]. IEEE Trans. Pattern Anal. Mach. Intell. 44(12), 8896\u20138909 (2021). https:\/\/doi.org\/10.1109\/TPAMI.2021.3127492","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-03234-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-023-03234-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-03234-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,6]],"date-time":"2024-11-06T16:13:42Z","timestamp":1730909622000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-023-03234-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,1,18]]},"references-count":47,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2024,11]]}},"alternative-id":["3234"],"URL":"https:\/\/doi.org\/10.1007\/s00371-023-03234-w","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"type":"print","value":"0178-2789"},{"type":"electronic","value":"1432-2315"}],"subject":[],"published":{"date-parts":[[2024,1,18]]},"assertion":[{"value":"14 December 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 January 2024","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}