{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T04:02:49Z","timestamp":1775534569015,"version":"3.50.1"},"reference-count":42,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015,6]]},"DOI":"10.1109\/cvpr.2015.7299145","type":"proceedings-article","created":{"date-parts":[[2015,10,15]],"date-time":"2015-10-15T18:42:06Z","timestamp":1444934526000},"page":"5097-5106","source":"Crossref","is-referenced-by-count":123,"title":["Domain-size pooling in local descriptors: DSP-SIFT"],"prefix":"10.1109","author":[{"given":"Jingming","family":"Dong","sequence":"first","affiliation":[]},{"given":"Stefano","family":"Soatto","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","article-title":"Dense correspondences across scenes and scales","author":"tau","year":"2014","journal-title":"ArXiv preprint 1406 6323"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995541"},{"key":"ref33","first-page":"163","article-title":"Deep fisher networks for large-scale image classification","author":"simonyan","year":"2013","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref32","author":"shao","year":"1998","journal-title":"Mathematical Statistics Springer Velag"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.0700622104"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2007.383157"},{"key":"ref37","article-title":"Visual scene represen-tations: Scaling and occlusion in convolutional architectures","author":"soatto","year":"2014","journal-title":"ArXiv preprint 1412 6607"},{"key":"ref36","article-title":"Visual scene representations: Sufficiency, minimality, invariance and deep approximation","author":"soatto","year":"2014","journal-title":"ArXiv preprint 1411 7676"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2003.1238663"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2014.2301163"},{"key":"ref10","article-title":"Multi-view feature engineering and learning","author":"dong","year":"2013","journal-title":"Proc of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2015 ArXiv preprint 1311 6048"},{"key":"ref40","first-page":"140","article-title":"Con-volutionallearning of spatio-temporal features","author":"taylor","year":"2010","journal-title":"European Conference on Computer Vision"},{"key":"ref11","article-title":"Domain-size pooling in local de-scriptors: DSP-SIFT (extended version of this paper)","author":"dong","year":"2014","journal-title":"ArXiv preprint 1412 8556"},{"key":"ref12","article-title":"Unsupervised feature learning by augmenting single images","author":"dosovitskiy","year":"2013","journal-title":"ArXiv preprint 1312 5242"},{"key":"ref13","article-title":"Scene parsing with multiscale feature learning, purity trees, and optimal covers","author":"farabet","year":"2012","journal-title":"ArXiv preprint 1202 2160"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2008.4587597"},{"key":"ref15","article-title":"Descriptor matching with convolutional neural networks: A comparison to SIFT","author":"fischer","year":"2014","journal-title":"ArXiv preprint 1405 5769"},{"key":"ref16","article-title":"Multi-scale orderless pooling of deep convolutional activation features","author":"gong","year":"2014","journal-title":"ArXiv preprint 1403 1840"},{"key":"ref17","first-page":"729","article-title":"Temporal pooling and multiscale learning for automatic annotation and ranking of music audio","author":"hamel","year":"2011","journal-title":"International Society for Music Information Retrieval"},{"key":"ref18","first-page":"1522","article-title":"On sifts and their scales","author":"hassne","year":"2012","journal-title":"Proc of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref19","first-page":"3370","article-title":"Beyond spatial pyramids: Receptive field learning for pooled image features","author":"jia","year":"2012","journal-title":"Proc of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000027790.02288.f2"},{"key":"ref4","first-page":"111","article-title":"A theoretical analysis of feature pooling in visual recognition","author":"boureau","year":"2010","journal-title":"Proc of the International Conference on Machine Learning (ICML)"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2005.188"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2001.990529"},{"key":"ref6","article-title":"Classification with scattering oper-ators","author":"bruna","year":"2011","journal-title":"Proc of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-006-9967-1"},{"key":"ref5","first-page":"162","article-title":"On invariance in hierarchical models","author":"bouvrie","year":"2009","journal-title":"Advances in Neural Information Processing Systems (NIPS)"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2005.177"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206733"},{"key":"ref2","first-page":"404","article-title":"Surf: Speeded up robust features","author":"bay","year":"2006","journal-title":"European Conference on Computer Vision"},{"key":"ref9","first-page":"248","article-title":"Imagenet: A large-scale hierarchical image database","author":"deng","year":"2009","journal-title":"Proc of the IEEE Conference on Computer Vision and Pattern Recoenition (CVPR)"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177728715"},{"key":"ref20","first-page":"496","author":"lecun","year":"2012","journal-title":"European Conference on Computer Vision"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2011.08.003"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995453"},{"key":"ref42","first-page":"1","article-title":"Learning local image descrip-tors","author":"winder","year":"2007","journal-title":"Proc of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000029664.99615.94"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/1873951.1874249"},{"key":"ref23","article-title":"Principles for automatic scale selection","author":"lindeberg","year":"1998","journal-title":"Technical report KTH Computational Vision and Active Perception laboratory"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.53"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.5244\/C.16.36"}],"event":{"name":"2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)","location":"Boston, MA, USA","start":{"date-parts":[[2015,6,7]]},"end":{"date-parts":[[2015,6,12]]}},"container-title":["2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7293313\/7298593\/07299145.pdf?arnumber=7299145","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,24]],"date-time":"2017-03-24T17:47:22Z","timestamp":1490377642000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7299145\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,6]]},"references-count":42,"URL":"https:\/\/doi.org\/10.1109\/cvpr.2015.7299145","relation":{},"subject":[],"published":{"date-parts":[[2015,6]]}}}