{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T20:40:24Z","timestamp":1761597624612,"version":"3.37.3"},"reference-count":101,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2016,7,1]],"date-time":"2016-07-01T00:00:00Z","timestamp":1467331200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"funder":[{"name":"National Basic Research Program (973 Program) of China","award":["2013CB329403","2012CB316301"],"award-info":[{"award-number":["2013CB329403","2012CB316301"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61332007","61273023","91120011","61128007"],"award-info":[{"award-number":["61332007","61273023","91120011","61128007"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100005089","name":"Beijing Natural Science Foundation","doi-asserted-by":"publisher","award":["4132046"],"award-info":[{"award-number":["4132046"]}],"id":[{"id":"10.13039\/501100005089","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004147","name":"Tsinghua University Initiative Scientific Research Program","doi-asserted-by":"publisher","award":["20121088071"],"award-info":[{"award-number":["20121088071"]}],"id":[{"id":"10.13039\/501100004147","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000183","name":"Army Research Office","doi-asserted-by":"publisher","award":["W911NF-12-1-0057"],"award-info":[{"award-number":["W911NF-12-1-0057"]}],"id":[{"id":"10.13039\/100000183","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Faculty Research Awards by NEC Laboratories of America"},{"DOI":"10.13039\/100008634","name":"2012 University of Texas at San Antonio START-R Research Award","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100008634","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Circuits Syst. Video Technol."],"published-print":{"date-parts":[[2016,7]]},"DOI":"10.1109\/tcsvt.2015.2461978","type":"journal-article","created":{"date-parts":[[2015,7,29]],"date-time":"2015-07-29T14:49:41Z","timestamp":1438181381000},"page":"1251-1264","source":"Crossref","is-referenced-by-count":15,"title":["Simple Techniques Make Sense: Feature Pooling and Normalization for Image Classification"],"prefix":"10.1109","volume":"26","author":[{"given":"Lingxi","family":"Xie","sequence":"first","affiliation":[]},{"given":"Qi","family":"Tian","sequence":"additional","affiliation":[]},{"given":"Bo","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-15555-0_11"},{"key":"ref38","first-page":"487","article-title":"Exploiting generative models in discriminative classifiers","author":"jaakkola","year":"1999","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2007.383172"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/2671188.2749289"},{"key":"ref31","first-page":"647","article-title":"DeCAF: A deep convolutional activation feature for generic visual recognition","author":"donahue","year":"2014","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2007.41"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5540018"},{"key":"ref36","first-page":"1794","article-title":"Linear spatial pyramid matching using sparse coding for image classification","author":"yang","year":"2009","journal-title":"Proc IEEE Conf Comput Vis Pattern Recognit"},{"key":"ref35","first-page":"1","article-title":"Efficient sparse coding algorithms","author":"lee","year":"2007","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-88682-2_24"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-15561-1_11"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2009.154"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/34.993558"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2011.222"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126544"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2009.77"},{"key":"ref24","first-page":"2911","article-title":"Three things everyone should know to improve object retrieval","author":"arandjelovic","year":"2012","journal-title":"Proc IEEE Conf Comput Vis Pattern Recognit"},{"key":"ref23","first-page":"1369","article-title":"Image classification with max-SIFT descriptors","author":"xie","year":"2015","journal-title":"Proc Int Conf Acoust Speech Signal Process"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10578-9_28"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2310117"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.96"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2007.4409066"},{"key":"ref50","first-page":"3370","article-title":"Beyond spatial pyramids: Receptive field learning for pooled image features","author":"jia","year":"2012","journal-title":"Proc IEEE Conf Comput Vis Pattern Recognit"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.5244\/C.26.102"},{"key":"ref59","first-page":"95","article-title":"Feature scaling in support vector data description","author":"juszczak","year":"2002","journal-title":"Annual Conf Advanced School for Comput Imag"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-45404-7_37"},{"journal-title":"The Nature of Statistical Learning Theory","year":"1999","author":"vapnik","key":"ref57"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1145\/1282280.1282361"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.47"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.215"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.206"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.315"},{"key":"ref40","first-page":"747","article-title":"BoF meets HOG: Feature extraction based on histograms of oriented p.d.f. gradients for image classification","author":"kobayashi","year":"2013","journal-title":"Proc IEEE Conf Comput Vis Pattern Recognit"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2013.6738537"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.264"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2011.2134010"},{"key":"ref5","first-page":"1374","article-title":"Generalized regular spatial pooling for image classification","author":"xie","year":"2015","journal-title":"Proc Int Conf Acoust Speech Signal Process"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"387","DOI":"10.1109\/TCSVT.2014.2351092","article-title":"Neighborhood feature line segment for image classification","volume":"25","author":"pan","year":"2015","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.68"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2014.2345933"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"1197","DOI":"10.1109\/TCSVT.2014.2302518","article-title":"Boosting separability in semisupervised learning for object classification","volume":"24","author":"xu","year":"2014","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.317"},{"key":"ref45","first-page":"111","article-title":"A theoretical analysis of feature pooling in visual recognition","author":"boureau","year":"2010","journal-title":"Proc 27th Int Conf Mach Learn"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2005.239"},{"key":"ref47","first-page":"2609","article-title":"Geometric ${\\ell }_{p}$ -norm feature pooling for image classification","author":"feng","year":"2011","journal-title":"Proc IEEE Conf Comput Vis Pattern Recognit"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2011.07.011"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2013.2293418"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2012.07.019"},{"key":"ref43","first-page":"2734","article-title":"Weighted bag of visual words for object recognition","author":"san biagio","year":"2014","journal-title":"Proc IEEE Int Conf Image Process"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-013-0636-x"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.5244\/C.25.76"},{"key":"ref71","first-page":"1871","article-title":"LIBLINEAR: A library for large linear classification","volume":"9","author":"fan","year":"2008","journal-title":"J Mach Learn Res"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248364"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2007.4408872"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1145\/1869790.1869829"},{"article-title":"A practical guide to support vector classification","year":"2003","author":"hsu","key":"ref74"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2005.09.012"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206537"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5539970"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2008.4517925"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.845806"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2008.11.013"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1162\/neco.2006.18.4.961"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-8655(00)00112-4"},{"key":"ref65","first-page":"248","article-title":"ImageNet: A large-scale hierarchical image database","author":"deng","year":"2009","journal-title":"Proc IEEE Conf Comput Vis Pattern Recognit"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.146"},{"key":"ref67","first-page":"2072","article-title":"Discriminative learning of relaxed hierarchy for large-scale visual recognition","author":"gao","year":"2011","journal-title":"Proc Int Conf Comput Vis"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.40"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000029664.99615.94"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2008.4587598"},{"key":"ref1","first-page":"1","article-title":"Visual categorization with bags of keypoints","author":"csurka","year":"2004","journal-title":"Proc Workshop Statist Learn Comput Vis Eur Conf Comput Vis"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.477"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.476"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.368"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5539963"},{"key":"ref91","first-page":"161","article-title":"The tradeoffs of large scale learning","author":"bottou","year":"2007","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1145\/1873951.1874249"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33718-5_57"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.128"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2009.5459169"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2008.04.022"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2014.2359098"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2013.2254898"},{"key":"ref12","first-page":"508","article-title":"Efficient feature selection and classification for vehicle detection","volume":"25","author":"wen","year":"2014","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000027790.02288.f2"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2004.02.006"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5539911"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/11744085_40"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.42"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2005.177"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.5244\/C.18.98"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2005.188"},{"journal-title":"The PASCAL Visual Object Classes Challenge 2007 (VOC2007) Results","year":"2007","author":"everingham","key":"ref84"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2007.09.014"},{"article-title":"Caltech-256 object category dataset","year":"2007","author":"griffin","key":"ref83"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2005.10"},{"article-title":"The Caltech-UCSD birds-200-2011 dataset","year":"2011","author":"wah","key":"ref89"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248092"},{"article-title":"Fine-grained visual classification of aircraft","year":"2013","author":"maji","key":"ref86"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1109\/ICVGIP.2008.47"},{"key":"ref88","first-page":"1","article-title":"Novel dataset for fine-grained image categorization: Stanford dogs","author":"khosla","year":"2011","journal-title":"Proc 1st Workshop Fine-Grained Vis Categorization IEEE Conf Comput Vis Pattern Recognit"}],"container-title":["IEEE Transactions on Circuits and Systems for Video Technology"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/76\/7506358\/07172506.pdf?arnumber=7172506","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,12]],"date-time":"2022-01-12T11:45:57Z","timestamp":1641987957000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7172506\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,7]]},"references-count":101,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/tcsvt.2015.2461978","relation":{},"ISSN":["1051-8215","1558-2205"],"issn-type":[{"type":"print","value":"1051-8215"},{"type":"electronic","value":"1558-2205"}],"subject":[],"published":{"date-parts":[[2016,7]]}}}