{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T16:29:20Z","timestamp":1759336160117},"reference-count":52,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2013,4,21]],"date-time":"2013-04-21T00:00:00Z","timestamp":1366502400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2014,9]]},"DOI":"10.1007\/s11042-013-1470-4","type":"journal-article","created":{"date-parts":[[2013,4,20]],"date-time":"2013-04-20T08:30:58Z","timestamp":1366446658000},"page":"1483-1506","source":"Crossref","is-referenced-by-count":11,"title":["Aligning codebooks for near duplicate image detection"],"prefix":"10.1007","volume":"72","author":[{"given":"Sebastiano","family":"Battiato","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Giovanni Maria","family":"Farinella","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Giovanni","family":"Puglisi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Daniele","family":"Rav\u00ec","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2013,4,21]]},"reference":[{"key":"1470_CR1","author":"S Battiato","year":"2010","unstructured":"Battiato S, Farinella GM, Gallo G, Rav\u00ec D (2010) Exploiting textons distributions on spatial hierarchy for scene classification. EURASIP J Image Video Process Article\u00a0ID\u00a0919367:1\u201313. 
doi: 10.1155\/2010\/919367","journal-title":"EURASIP J Image Video Process"},{"issue":"4","key":"1470_CR2","doi-asserted-by":"crossref","first-page":"1105","DOI":"10.1109\/TIFS.2012.2194285","volume":"7","author":"S Battiato","year":"2012","unstructured":"Battiato S, Farinella GM, Messina E, Puglisi G (2012) Robust image alignment for tampering detection. IEEE Trans Inf Forensics Secur 7(4):1105\u20131117","journal-title":"IEEE Trans Inf Forensics Secur"},{"key":"1470_CR3","doi-asserted-by":"crossref","unstructured":"Battiato S, Farinella GM, Guarnera GC, Meccio T, Puglisi G, Rav\u00ec D, Rizzo R (2010) Bags of phrases with codebooks alignment for near duplicate image detection. In: Proceedings of the international acm workshop on multimedia in forensics, security and intelligence (MiFor 2010), in conjunction with international acm multimedia conference, pp\u00a065\u201370","DOI":"10.1145\/1877972.1877991"},{"issue":"3","key":"1470_CR4","doi-asserted-by":"crossref","first-page":"346","DOI":"10.1016\/j.cviu.2007.09.014","volume":"110","author":"H Bay","year":"2008","unstructured":"Bay H, Ess A, Tuytelaars T, Van Gool L (2008) Speeded-up robust features (SURF). Int J Comput Vis Image Understand 110(3):346\u2013359","journal-title":"Int J Comput Vis Image Understand"},{"issue":"4","key":"1470_CR5","doi-asserted-by":"crossref","first-page":"509","DOI":"10.1109\/34.993558","volume":"2","author":"S Belongie","year":"2002","unstructured":"Belongie S, Malik J, Puzicha J (2002) Shape matching and object recognition using shape contexts. IEEE Trans Pattern Anal Mach Intell 2(4):509\u2013522","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"24","key":"1470_CR6","doi-asserted-by":"crossref","first-page":"509","DOI":"10.1109\/34.993558","volume":"24","author":"S Belongie","year":"2002","unstructured":"Belongie S, Malik J, Puzicha J (2002) Shape matching and object recognition using shape contexts. 
IEEE Trans Pattern Anal Mach Intell 24(24):509\u2013521","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1470_CR7","doi-asserted-by":"crossref","unstructured":"Chatfield K, Lempitsky V, Vedaldi A, Zisserman A (2011) The devil is in the details: an evaluation of recent feature encoding methods. In: Proceedings of the British machine vision conference","DOI":"10.5244\/C.25.76"},{"issue":"6","key":"1470_CR8","doi-asserted-by":"crossref","first-page":"750","DOI":"10.1016\/j.cviu.2011.02.003","volume":"115","author":"X Cheng","year":"2011","unstructured":"Cheng X, Hu Y, Chia L-T (2011) Exploiting local dependencies with spatial-scale space (s-cube) for near-duplicate retrieval. Comput Vis Image Understand 115(6):750\u2013758","journal-title":"Comput Vis Image Understand"},{"key":"1470_CR9","doi-asserted-by":"crossref","unstructured":"Chum O, Philbin J, Zisserman A (2008) Near duplicate image detection: min-hash and tf-idf weighting. In: Proceeding of BMVC","DOI":"10.5244\/C.22.50"},{"key":"1470_CR10","doi-asserted-by":"crossref","unstructured":"Chum O, Perdoch M, Matas J (2009) Geometric min-hashing: finding a (thick) needle in a haystack. In: IEEE computer society conference on computer vision and pattern recognition, pp\u00a017\u201324","DOI":"10.1109\/CVPR.2009.5206531"},{"issue":"3","key":"1470_CR11","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/1823746.1823749","volume":"6","author":"R Oliveira De","year":"2010","unstructured":"De\u00a0Oliveira R, Cherubini M, Oliver N (2010) Looking at near-duplicate videos from a human-centric perspective. ACM Trans Multimedia Comput Commun Appl 6(3):15:1\u201315:22","journal-title":"ACM Trans Multimedia Comput Commun Appl"},{"key":"1470_CR12","unstructured":"Eastlake D, Jones P (2001) RFC 3174. 
http:\/\/tools.ietf.org\/html\/rfc3174"},{"issue":"9","key":"1470_CR13","doi-asserted-by":"crossref","first-page":"891","DOI":"10.1109\/34.93808","volume":"13","author":"W Freeman","year":"1991","unstructured":"Freeman W, Adelson E (1991) The design and use of steerable filters. IEEE Trans Pattern Anal Mach Intell 13(9):891\u2013906","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1470_CR14","doi-asserted-by":"crossref","unstructured":"Grauman K, Darrell T (2005) The pyramid match kernel: discriminative classification with sets of image features. In: Proceedings of the IEEE International Conference on Computer Vision (ICCV), pp\u00a01458\u20131465","DOI":"10.1109\/ICCV.2005.239"},{"issue":"8","key":"1470_CR15","doi-asserted-by":"crossref","first-page":"1434","DOI":"10.1109\/TMM.2009.2032676","volume":"11","author":"Y Hu","year":"2009","unstructured":"Hu Y, Cheng X, Chia L-T, Xie X, Rajan D, Tan A-H (2009) Coherent phrase model for efficient image near-duplicate retrieval. IEEE Trans Multimedia 11(8):1434\u20131445","journal-title":"IEEE Trans Multimedia"},{"key":"1470_CR16","volume-title":"MIR \u201908: proceedings of the 2008 ACM International conference on multimedia information retrieval","author":"MJ Huiskes","year":"2008","unstructured":"Huiskes MJ, Lew MS (2008) The MIR Flickr retrieval evaluation. In: MIR \u201908: proceedings of the 2008 ACM International conference on multimedia information retrieval. ACM, New York, NY"},{"issue":"5","key":"1470_CR17","doi-asserted-by":"crossref","first-page":"433","DOI":"10.1109\/34.765655","volume":"21","author":"AE Johnson","year":"1999","unstructured":"Johnson AE, Hebert M (1999) Using spin images for efficient object recognition in cluttered 3d scenes. 
IEEE Trans Pattern Analy Mach Intell 21(5):433\u2013449","journal-title":"IEEE Trans Pattern Analy Mach Intell"},{"issue":"4","key":"1470_CR18","doi-asserted-by":"crossref","first-page":"325","DOI":"10.1007\/BF02278710","volume":"38","author":"R Jonker","year":"1987","unstructured":"Jonker R, Volgenant A (1987) A shortest augmenting path algorithm for dense and sparse linear assignment problems. Computing 38(4):325\u2013340","journal-title":"Computing"},{"key":"1470_CR19","unstructured":"Ke Y, Sukthankar R, Huston L (2004) Efficient near-duplicate detection and sub-image retrieval. In: Proceeding of ACM multimedia, pp\u00a0869\u2013876"},{"key":"1470_CR20","doi-asserted-by":"crossref","first-page":"367","DOI":"10.1007\/BF00318371","volume":"55","author":"J Koenderink","year":"1987","unstructured":"Koenderink J, van Doorn A (1987) Representation of local geometry in the visual system. Biol Cybern 55:367\u2013375","journal-title":"Biol Cybern"},{"key":"1470_CR21","doi-asserted-by":"crossref","unstructured":"Lazebnik S, Schmid C, Ponce J (2006) Beyond bags of features: spatial pyramid matching for recognizing natural scene categories. In: Proceedings of the 2006 IEEE computer society conference on Computer Vision and Pattern Recognition, CVPR\u00a0\u201906, pp\u00a02169\u20132178","DOI":"10.1109\/CVPR.2006.68"},{"issue":"7","key":"1470_CR22","doi-asserted-by":"crossref","first-page":"1294","DOI":"10.1109\/TPAMI.2008.138","volume":"31","author":"S Lazebnik","year":"2009","unstructured":"Lazebnik S, Raginsky M (2009) Supervised learning of quantizer codebooks by information loss minimization. 
IEEE Trans Pattern Anal Mach Intell 31(7):1294\u20131309","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1470_CR23","doi-asserted-by":"crossref","unstructured":"Lejsek H, \u00deorm\u00f3\u00f0sd\u00f3ttir H, \u00c1smundsson F, Da\u00f0ason K, J\u00f3hannsson \u00c1\u00de, J\u00f3nsson B\u00de, Amsaleg L (2010) Videntifier forensic: large-scale video identification in practice. In: Proceeding of ACM workshop on multimedia in forensics, security and intelligence, pp\u00a01\u20136","DOI":"10.1145\/1877972.1877973"},{"key":"1470_CR24","doi-asserted-by":"crossref","unstructured":"Leung T, Malik JJ (1999) Recognizing surfaces using three-dimensional textons. In: Proceedings of the IEEE international conference on computer vision, pp\u00a01010\u20131017","DOI":"10.1109\/ICCV.1999.790379"},{"issue":"2","key":"1470_CR25","doi-asserted-by":"crossref","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"D Lowe","year":"2004","unstructured":"Lowe D (2004) Distinctive image features from scale-invariant keypoints. Int J Comput Vis 60(2):91\u2013110","journal-title":"Int J Comput Vis"},{"key":"1470_CR26","doi-asserted-by":"crossref","unstructured":"Matas J, Chum O, Urban M, Pajdla T (2002) Robust wide-baseline stereo from maximally stable extremal regions. In: Proceedings of the British machine vision conference, pp\u00a0384\u2013393","DOI":"10.5244\/C.16.36"},{"issue":"1","key":"1470_CR27","doi-asserted-by":"crossref","first-page":"63","DOI":"10.1023\/B:VISI.0000027790.02288.f2","volume":"60","author":"K Mikolajczyk","year":"2004","unstructured":"Mikolajczyk K, Schmid C (2004) Scale & affine invariant interest point detectors. 
Int J Comput Vis (IJCV) 60(1):63\u201386","journal-title":"Int J Comput Vis (IJCV)"},{"issue":"10","key":"1470_CR28","doi-asserted-by":"crossref","first-page":"1615","DOI":"10.1109\/TPAMI.2005.188","volume":"27","author":"K Mikolajczyk","year":"2005","unstructured":"Mikolajczyk K, Schmid C (2005) A performance evaluation of local descriptors. IEEE Trans Pattern Analy Mach Intell (PAMI) 27(10):1615\u20131630","journal-title":"IEEE Trans Pattern Analy Mach Intell (PAMI)"},{"key":"1470_CR29","doi-asserted-by":"crossref","unstructured":"Nist\u00e8r D, Stew\u00e8nius H (2006) Scalable recognition with a vocabulary tree. In: Proceedings of the IEEE conference on Computer Vision and Pattern Recognition (CVPR), pp\u00a02161\u20132168","DOI":"10.1109\/CVPR.2006.264"},{"key":"1470_CR30","unstructured":"Papadimitriou CH, Steiglitz K (1982) Combinatorial optimization: algorithms and complexity. Prentice-Hall, Inc"},{"key":"1470_CR31","doi-asserted-by":"crossref","unstructured":"Philbin J, Chum O, Isard M, Sivic J, Zisserman A (2007) Object retrieval with large vocabularies and fast spatial matching. In: Proceedings of the International conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2007.383172"},{"key":"1470_CR32","unstructured":"Rivest RL (1992) RFC 1321. http:\/\/tools.ietf.org\/html\/rfc1321"},{"key":"1470_CR33","doi-asserted-by":"crossref","unstructured":"Rosten E, Drummond T (2006) Machine learning for high-speed corner detection. In: Proceedings of the European conference on computer vision, pp\u00a0430\u2013443","DOI":"10.1007\/11744023_34"},{"issue":"4","key":"1470_CR34","doi-asserted-by":"crossref","first-page":"2282","DOI":"10.1109\/TIP.2011.2176950","volume":"21","author":"J Rongrong","year":"2012","unstructured":"Rongrong J, Hongxun Y, Wei L, Xiaoshuai S, Tian TQ (2012) Task-dependent visual-codebook compression. 
IEEE Trans Image Process 21(4):2282\u20132293","journal-title":"IEEE Trans Image Process"},{"issue":"1","key":"1470_CR35","doi-asserted-by":"crossref","first-page":"153","DOI":"10.1109\/TMM.2012.2225035","volume":"15","author":"J Rongrong","year":"2013","unstructured":"Rongrong J, Duan L-Y, Chen J, Xie L, Yao H, Gao W (2013) Learning to distribute vocabulary indexing for scalable visual search. IEEE Trans Multimedia 15(1):153\u2013166","journal-title":"IEEE Trans Multimedia"},{"key":"1470_CR36","unstructured":"Saffari A, Bischof H (2007) Clustering in a boosting framework. In: Computer vision winter workshop, pp\u00a075\u201382"},{"key":"1470_CR37","unstructured":"Salton G, McGill M (1983) Introduction to modern information retrieval. McGraw-Hill"},{"issue":"5","key":"1470_CR38","doi-asserted-by":"crossref","first-page":"513","DOI":"10.1016\/0306-4573(88)90021-0","volume":"24","author":"G Salton","year":"1988","unstructured":"Salton G, Buckley C (1988) Term-weighting approaches in automatic text retrieval. Inf Process Manage 24(5):513\u2013523","journal-title":"Inf Process Manage"},{"key":"1470_CR39","unstructured":"Sivic J, Russell BC, Efros AA, Zisserman A, Freeman WT (2005) Discovering object categories in image collections. In: Proceedings of the international conference on computer vision"},{"issue":"1","key":"1470_CR40","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1007\/BF00130487","volume":"7","author":"MJ Swain","year":"1991","unstructured":"Swain MJ, Ballard DH (1991) Color indexing. Int J Comput Vis 7(1):11\u201332","journal-title":"Int J Comput Vis"},{"key":"1470_CR41","doi-asserted-by":"crossref","unstructured":"Szeliski R (2010) Computer vision: algorithms and applications. 
Springer Available at http:\/\/szeliski.org\/Book","DOI":"10.1007\/978-1-84882-935-0"},{"issue":"7","key":"1470_CR42","doi-asserted-by":"crossref","first-page":"1271","DOI":"10.1109\/TPAMI.2009.132","volume":"32","author":"LC Gemert van","year":"2010","unstructured":"van\u00a0Gemert LC, Veenman CJ, Smeulders AWM, Geusebroek JM (2010) Visual word ambiguity. IEEE Trans Pattern Anal Mach Intell 32(7):1271\u20131283","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1470_CR43","doi-asserted-by":"crossref","unstructured":"Wang Y, Hou Z, Leman K (2011) Keypoint-based near-duplicate images detection using affine invariant feature and color matching In: Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP 2011), pp\u00a01209\u20131212","DOI":"10.1109\/ICASSP.2011.5946627"},{"key":"1470_CR44","unstructured":"Wu Z, Ke Q, Isard M, Sun J (2009) Bundling features for large scale partial-duplicate web image search. In: Proceedings of the international conference on computer vision and pattern recognition, pp\u00a025\u201332"},{"key":"1470_CR45","doi-asserted-by":"crossref","unstructured":"Xu D, Chang S-F (2007) Visual event recognition in news video using kernel methods with multi-level temporal alignment. In: Proceeding of IEEE international conference on computer vision and pattern recognition","DOI":"10.1109\/CVPR.2007.383226"},{"issue":"8","key":"1470_CR46","doi-asserted-by":"crossref","first-page":"1068","DOI":"10.1109\/TCSVT.2010.2051286","volume":"20","author":"D Xu","year":"2010","unstructured":"Xu D, Cham TJ, Yan S, Duan L, Chang S-F (2010) Near duplicate identification with spatially aligned pyramid matching. IEEE Trans Circuits Syst Video Technol (TCSVT) 20(8):1068\u20131079","journal-title":"IEEE Trans Circuits Syst Video Technol (TCSVT)"},{"key":"1470_CR47","unstructured":"Zhang D-Q, Chang S-F (2004) Detecting image near-duplicate by stochastic attributed relational graph matching with learning. 
In: Proceedings of the ACM multimedia conference, pp\u00a0877\u2013884"},{"issue":"5","key":"1470_CR48","doi-asserted-by":"crossref","first-page":"1037","DOI":"10.1109\/TMM.2007.898928","volume":"9","author":"W-L Zhao","year":"2007","unstructured":"Zhao W-L, Ngo C-W, Tan H-K, Wu X (2007) Near-duplicate keyframe identification with interest point matching and pattern learning. IEEE Trans Multimedia 9(5):1037\u20131048","journal-title":"IEEE Trans Multimedia"},{"issue":"2","key":"1470_CR49","doi-asserted-by":"crossref","first-page":"412","DOI":"10.1109\/TIP.2008.2008900","volume":"18","author":"W-L Zhao","year":"2009","unstructured":"Zhao W-L, Ngo C-W (2009) Scale-rotation invariant pattern entropy for keypoint-based near-duplicate detection. IEEE Trans Image Process 18(2):412\u2013423","journal-title":"IEEE Trans Image Process"},{"issue":"5","key":"1470_CR50","doi-asserted-by":"crossref","first-page":"448","DOI":"10.1109\/TMM.2010.2050651","volume":"12","author":"WL Zhao","year":"2010","unstructured":"Zhao WL, Wu X, Ngo CW (2010) On the annotation of web videos by efficient near-duplicate search. IEEE Trans Multimedia 12(5):448\u2013461","journal-title":"IEEE Trans Multimedia"},{"key":"1470_CR51","unstructured":"Zhao W-L, Wu X, Ngo C-W (2011) SOTU: a toolkit for efficient near-duplicate image\/video & retrieval\/detection. Manual for SOTU Version 1.06. http:\/\/www.cs.cityu.edu.hk\/~wzhao2\/sotu.htm"},{"key":"1470_CR52","doi-asserted-by":"crossref","unstructured":"Zhu J, Hoi SC, Lyu MR, Yan S (2008) Near-duplicate keyframe retrieval by nonrigid image matching. 
In: Proceedings of the ACM multimedia conference, pp\u00a041\u201350","DOI":"10.1145\/1459359.1459366"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-013-1470-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s11042-013-1470-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-013-1470-4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,7,12]],"date-time":"2019-07-12T21:43:27Z","timestamp":1562967807000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s11042-013-1470-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013,4,21]]},"references-count":52,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2014,9]]}},"alternative-id":["1470"],"URL":"https:\/\/doi.org\/10.1007\/s11042-013-1470-4","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2013,4,21]]}}}