{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,7]],"date-time":"2025-04-07T04:10:07Z","timestamp":1743999007792,"version":"3.40.3"},"reference-count":25,"publisher":"Springer Science and Business Media LLC","license":[{"start":{"date-parts":[[2012,8,24]],"date-time":"2012-08-24T00:00:00Z","timestamp":1345766400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Multimedia Systems"],"DOI":"10.1007\/s00530-012-0293-x","type":"journal-article","created":{"date-parts":[[2012,8,23]],"date-time":"2012-08-23T06:57:33Z","timestamp":1345705053000},"source":"Crossref","is-referenced-by-count":0,"title":["Weakly-supervised object localization in unlabeled image collection"],"prefix":"10.1007","author":[{"given":"Yanyun","family":"Qu","sequence":"first","affiliation":[]},{"given":"Han","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Xiaoqing","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Suwen","family":"Fang","sequence":"additional","affiliation":[]},{"given":"Hanzi","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,8,24]]},"reference":[{"key":"293_CR1","doi-asserted-by":"crossref","unstructured":"Viola, P., Jones, M.: Rapid object detection using a boosted cascade of simple features. In: Proceedings of the IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR 2001), vol. 1, pp. I-511\u2013I-518 (2001)","DOI":"10.1109\/CVPR.2001.990517"},{"key":"293_CR2","doi-asserted-by":"crossref","unstructured":"Dalal, N., Triggs, B.: Histograms of oriented gradients for human detection. In: Proceedings of the IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR 2005), vol. 1, pp. 886\u2013893 (2005)","DOI":"10.1109\/CVPR.2005.177"},{"key":"293_CR3","unstructured":"Andrews, S., Tsochantaridis, I., Hofmann, T.: Support vector machines for multiple-instance learning. In: Proceedings of the NIPS, pp. 561\u2013568 (2003)"},{"key":"293_CR4","doi-asserted-by":"crossref","unstructured":"Liu, H., Qu, Y.: Exploiting context aware category discovery for image labeling. In: Proceedings of the Third International Conference on Internet Multimedia Computing and Service (2011)","DOI":"10.1145\/2043674.2043707"},{"key":"293_CR5","doi-asserted-by":"crossref","unstructured":"Russell, B.C., Freeman, W.T., Efros, A.A., Sivic, J., Zisserman, A.: Using multiple segmentations to discover objects and their extent in image collections. In: Proceedings of the 2006 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, pp. 1605\u20131614 (2006)","DOI":"10.1109\/CVPR.2006.326"},{"key":"293_CR6","doi-asserted-by":"crossref","unstructured":"Galleguillos, C., Babenko, B., Rabinovich, A., Belongie, S.: Weakly supervised object localization with stable segmentations. In: Proceedings of the 10th European Conference on Computer Vision: Part I (2008)","DOI":"10.1007\/978-3-540-88682-2_16"},{"key":"293_CR7","doi-asserted-by":"crossref","unstructured":"Lazebnik, S., Schmid, C., Ponce, J.: Beyond bags of features: spatial pyramid matching for recognizing natural scene categories. In: Proceedings of the 2006 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, pp. 2169\u20132178 (2006)","DOI":"10.1109\/CVPR.2006.68"},{"key":"293_CR8","doi-asserted-by":"crossref","unstructured":"Fulkerson, B., Vedaldi, A., Soatto, S.: Class segmentation and object localization with superpixel neighborhoods. In: Proceedings of the ICCV, pp. 670\u2013677 (2009)","DOI":"10.1109\/ICCV.2009.5459175"},{"key":"293_CR9","doi-asserted-by":"crossref","first-page":"2129","DOI":"10.1109\/TPAMI.2009.144","volume":"31","author":"CH Lampert","year":"2009","unstructured":"Lampert, C.H., Blaschko, M.B., Hofmann, T.: Efficient subwindow search: a branch and bound framework for object localization. IEEE Trans. Pattern Anal. Mach. Intell. 31, 2129\u20132142 (2009)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"293_CR10","doi-asserted-by":"crossref","unstructured":"Wang, M., Hua, X.-S., Tang, J., Hong, R.: Beyond distance measurement: constructing neighborhood similarity for video annotation. In: IEEE Transactions on Multimedia, vol. 11, pp. 465\u2013476 (2009)","DOI":"10.1109\/TMM.2009.2012919"},{"key":"293_CR11","doi-asserted-by":"crossref","unstructured":"Wang, M., Hua, X.-S., Hong, R., Tang, J., Qi, G.-J., Song, Y.: Unified video annotation via multigraph learning. In: IEEE Transactions on Circuits and Systems for Video Technology, vol. 19, pp. 733\u2013746 (2009)","DOI":"10.1109\/TCSVT.2009.2017400"},{"key":"293_CR12","doi-asserted-by":"crossref","unstructured":"Fergus, R., Perona, P., Zisserman, A.: Object class recognition by unsupervised scale-invariant learning. In: Proceedings of the 2003 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, vol. 2, pp. II-264\u2013II-271 (2003)","DOI":"10.1109\/CVPR.2003.1211479"},{"key":"293_CR13","unstructured":"Sivic, J., Russell, B.C., Efros, A.A., Zisserman, A., Freeman, W.T.: Discovering objects and their location in images. In: Proceedings of the Tenth IEEE International Conference on Computer Vision, 2005 (ICCV 2005), vol. 1, pp. 370\u2013377 (2005)"},{"key":"293_CR14","doi-asserted-by":"crossref","first-page":"177","DOI":"10.1023\/A:1007617005950","volume":"42","author":"T Hofmann","year":"2001","unstructured":"Hofmann, T.: Unsupervised learning by probabilistic latent semantic analysis. Mach. Learn. 42, 177\u2013196 (2001)","journal-title":"Mach. Learn."},{"key":"293_CR15","first-page":"993","volume":"3","author":"DM Blei","year":"2003","unstructured":"Blei, D.M., Ng, A.Y., Jordan, M.I.: Latent dirichlet allocation. J. Mach. Learn. Res. 3, 993\u20131022 (2003)","journal-title":"J. Mach. Learn. Res."},{"key":"293_CR16","doi-asserted-by":"crossref","unstructured":"Griffiths, T., Steyvers, M.: Finding scientific topics. In: Proceedings of the National Academy of Sciences, pp. 5228\u20135235 (2004)","DOI":"10.1073\/pnas.0307752101"},{"key":"293_CR17","doi-asserted-by":"crossref","first-page":"143","DOI":"10.1007\/s11263-009-0252-y","volume":"85","author":"YJ Lee","year":"2009","unstructured":"Lee, Y.J., Grauman, K.: Foreground focus: unsupervised learning from partially matching images. Int. J. Comput. Vis. 85, 143\u2013166 (2009)","journal-title":"Int. J. Comput. Vis."},{"key":"293_CR18","doi-asserted-by":"crossref","unstructured":"Tighe, J., Lazebnik, S.: Superparsing: scalable nonparametric image parsing with superpixels. In: Proceedings of the 11th European Conference on Computer Vision: Part V (2010)","DOI":"10.1007\/978-3-642-15555-0_26"},{"key":"293_CR19","doi-asserted-by":"crossref","first-page":"31","DOI":"10.1016\/S0004-3702(96)00034-3","volume":"89","author":"TG Dietterich","year":"1997","unstructured":"Dietterich, T.G., Lathrop, R.H.: Solving the multiple instance problem with axis-parallel rectangles. Artif. Intell. 89, 31\u201371 (1997)","journal-title":"Artif. Intell."},{"key":"293_CR20","unstructured":"Wang, J., Zucker, J.-D.: Solving the multiple-instance problem: a lazy learning approach. In: Proceedings of the Seventeenth International Conference on Machine Learning (2000)"},{"key":"293_CR21","unstructured":"Babenko, B., Ming-Hsuan, Y., Belongie, S.: Visual tracking with online multiple instance learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2009 (CVPR 2009), pp. 983\u2013990 (2009)"},{"key":"293_CR22","unstructured":"Shi, J., Malik, J.: Normalized cuts and image segmentation. In: Proceedings of the IEEE Computer Society Conference on Computer Vision and Pattern Recognition, 1997, pp. 731\u2013737 (1997)"},{"key":"293_CR23","doi-asserted-by":"crossref","unstructured":"Shi, J., Malik, J.: Normalized cuts and image segmentation. In: IEEE Transactions on Pattern Analysis and Machine Intelligence, vol. 22, pp. 888\u2013905 (2000)","DOI":"10.1109\/34.868688"},{"key":"293_CR24","unstructured":"Achanta, R., Hemami, S., Estrada, F., Susstrunk, S.: Frequency-tuned salient region detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2009 (CVPR 2009), pp. 1597\u20131604 (2009)"},{"key":"293_CR25","unstructured":"Qu, Y., Chen, C., Wu, D., Xie, Y.: Image labeling via incremental model learning. In: Proceedings of the 17th IEEE International Conference on Image Processing (ICIP), 2010, pp. 1573\u20131576 (2010)"}],"container-title":["Multimedia Systems"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-012-0293-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00530-012-0293-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00530-012-0293-x","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,7]],"date-time":"2025-04-07T03:50:59Z","timestamp":1743997859000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00530-012-0293-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,8,24]]},"references-count":25,"alternative-id":["293"],"URL":"https:\/\/doi.org\/10.1007\/s00530-012-0293-x","relation":{},"ISSN":["0942-4962","1432-1882"],"issn-type":[{"type":"print","value":"0942-4962"},{"type":"electronic","value":"1432-1882"}],"subject":[],"published":{"date-parts":[[2012,8,24]]}}}