{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,28]],"date-time":"2026-03-28T05:34:29Z","timestamp":1774676069667,"version":"3.50.1"},"reference-count":49,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015,6]]},"DOI":"10.1109\/cvpr.2015.7298968","type":"proceedings-article","created":{"date-parts":[[2015,10,15]],"date-time":"2015-10-15T22:42:06Z","timestamp":1444948926000},"page":"3460-3469","source":"Crossref","is-referenced-by-count":277,"title":["Deep multiple instance learning for image classification and auto-annotation"],"prefix":"10.1109","author":[{"given":"Jiajun","family":"Wu","sequence":"first","affiliation":[]},{"family":"Yinan Yu","sequence":"additional","affiliation":[]},{"family":"Chang Huang","sequence":"additional","affiliation":[]},{"family":"Kai Yu","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","article-title":"Superparsing: scalable nonparametric image parsing with superpixels","author":"tighe","year":"2010","journal-title":"ECCV"},{"key":"ref38","article-title":"Going deeper with convolutions","author":"szegedy","year":"2014","journal-title":"arXiv preprint arXiv 1409 4842"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.326"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1038\/323533a0"},{"key":"ref31","author":"ramon","year":"2000","journal-title":"Multi instance neural networks In ICML workshop on attribute-value and relational learning"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206537"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.422"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995330"},{"key":"ref35","article-title":"Weakly-supervised discovery of visual pattern configurations","author":"song","year":"2014","journal-title":"NIPS"},{"key":"ref34","article-title":"Overfeat: Integrated recognition, localization and detection using convolutional networks","author":"sermanet","year":"2014","journal-title":"ICLRE"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126383"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2009.5459426"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248001"},{"key":"ref2","first-page":"1107","article-title":"Matching words and pictures","volume":"3","author":"barnard","year":"2003","journal-title":"IMLR"},{"key":"ref1","article-title":"Support vector machines for multiple-instance learning","author":"andrews","year":"2002","journal-title":"NIPS"},{"key":"ref20","doi-asserted-by":"crossref","first-page":"985","DOI":"10.1109\/TPAMI.2007.70847","article-title":"Real-time computerized annotation of pictures","volume":"30","author":"li","year":"2008","journal-title":"IEEE TPAMI"},{"key":"ref22","article-title":"Object bank: A high-level image representation for scene classification & semantic feature sparsification","author":"li","year":"2010","journal-title":"NIPS"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2007.4408872"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126478"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.115"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2006.04.045"},{"key":"ref25","doi-asserted-by":"crossref","first-page":"353","DOI":"10.1109\/TPAMI.2010.70","article-title":"Learning to detect a salient object","volume":"33","author":"liu","year":"2011","journal-title":"IEEE TPAMI"},{"key":"ref10","author":"everingham","year":"0","journal-title":"The PASCAL Visual Object Classes Challenge 2007 (VOC2007) Results"},{"key":"ref11","article-title":"Weakly supervised object localization with stable segmentations","author":"galleguillos","year":"2008","journal-title":"ECCV"},{"key":"ref40","doi-asserted-by":"crossref","first-page":"303","DOI":"10.1023\/A:1009976227802","article-title":"Learning algorithms for keyphrase extraction","volume":"2","author":"turney","year":"2000","journal-title":"Information Retrieval"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2007.383267"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.124"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.223"},{"key":"ref16","article-title":"Learning convolutional feature hierarchies for visual recognition","author":"kavukcuoglu","year":"2010","journal-title":"NIPS"},{"key":"ref17","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"NIPS"},{"key":"ref18","article-title":"Deeply-supervised nets","author":"lee","year":"2015","journal-title":"AISTATS"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553453"},{"key":"ref4","article-title":"Bing: Bina-rized normed gradients for objectness estimation at 300fps","author":"cheng","year":"2014","journal-title":"CVPR"},{"key":"ref3","article-title":"Hierarchical matching with side information for image classification","author":"chen","year":"2012","journal-title":"CVPR"},{"key":"ref6","article-title":"Imagenet: A large-scale hierarchical image database","author":"deng","year":"2009","journal-title":"CVPR"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2012.6252784"},{"key":"ref8","article-title":"Mid-level visual element discovery as discriminative mode seeking","author":"doersch","year":"2013","journal-title":"NIPS"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(96)00034-3"},{"key":"ref49","article-title":"Unsupervised object class discovery via saliency-guided multiple class learning","author":"zhu","year":"2012","journal-title":"CVPR"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.112"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-014-0748-y"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.40"},{"key":"ref48","author":"zhou","year":"2002","journal-title":"Neural Networks for Multi-instance Learning"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6853873"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2008.4587632"},{"key":"ref41","article-title":"Segmentation as selective search for object recoznirion","author":"van de","year":"2011","journal-title":"TCCV"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2009.5459194"},{"key":"ref43","article-title":"Multiple instance boosting for object detection","author":"viola","year":"2006","journal-title":"NIPS"}],"event":{"name":"2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","location":"Boston, MA, USA","start":{"date-parts":[[2015,6,7]]},"end":{"date-parts":[[2015,6,12]]}},"container-title":["2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7293313\/7298593\/07298968.pdf?arnumber=7298968","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,23]],"date-time":"2017-06-23T21:24:33Z","timestamp":1498253073000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7298968\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,6]]},"references-count":49,"URL":"https:\/\/doi.org\/10.1109\/cvpr.2015.7298968","relation":{},"subject":[],"published":{"date-parts":[[2015,6]]}}}