{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T12:42:04Z","timestamp":1743079324910,"version":"3.40.3"},"publisher-location":"Cham","reference-count":51,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319056951"},{"type":"electronic","value":"9783319056968"}],"license":[{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-05696-8_4","type":"book-chapter","created":{"date-parts":[[2014,5,9]],"date-time":"2014-05-09T14:19:39Z","timestamp":1399645179000},"page":"79-107","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Fusion of Multiple Visual Cues for Object Recognition in Videos"],"prefix":"10.1007","author":[{"given":"Iv\u00e1n","family":"Gonz\u00e1lez-D\u00edaz","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jenny","family":"Benois-Pineau","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Vincent","family":"Buso","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hugo","family":"Boujut","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2014,3,26]]},"reference":[{"key":"4_CR1","doi-asserted-by":"crossref","unstructured":"Pirsiavash H, Ramanan D (2012) Detecting activities of daily living in first-person camera views. In: IEEE conference on computer vision and pattern recognition (CVPR), pp 2847\u20132854","DOI":"10.1109\/CVPR.2012.6248010"},{"issue":"9","key":"4_CR2","doi-asserted-by":"publisher","first-page":"1627","DOI":"10.1109\/TPAMI.2009.167","volume":"32","author":"PF Felzenszwalb","year":"2010","unstructured":"Felzenszwalb PF, Girshick RB, McAllester DA, Ramanan D (2010) Object detection with discriminatively trained part-based models. IEEE Trans Pattern Anal Mach Intell 32(9):1627\u20131645","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4_CR3","doi-asserted-by":"crossref","unstructured":"Lampert CH, Blaschko MB, Hofmann T (2008) Beyond sliding windows: object localization by efficient subwindow search. In: IEEE computer society conference on computer vision and pattern recognition (CVPR 2008), IEEE Computer Society, Anchorage, 24\u201326 June 2008","DOI":"10.1109\/CVPR.2008.4587586"},{"issue":"3","key":"4_CR4","doi-asserted-by":"crossref","first-page":"194","DOI":"10.1038\/35058500","volume":"2","author":"L Itti","year":"2001","unstructured":"Itti L, Koch C (2001) Computational modelling of visual attention. Nat Rev Neurosci 2(3):194\u2013203","journal-title":"Nat Rev Neurosci"},{"key":"4_CR5","doi-asserted-by":"crossref","unstructured":"Fathi A, Li Y, Rehg JM (2012) Learning to recognize daily actions using gaze. In: Proceedings of the 12th European conference on computer vision\u2014Volume Part I, ECCV\u201912, pp 314\u2013327, Springer, Berlin, 2012","DOI":"10.1007\/978-3-642-33718-5_23"},{"key":"4_CR6","doi-asserted-by":"crossref","unstructured":"Ogaki K, Kitani KM, Sugano Y, Sato Y (2012) Coupling eye-motion and ego-motion features for first-person activity recognition. In: 2012 IEEE computer society conference on computer vision and pattern recognition workshops, IEEE, pp 1\u20137, 2012","DOI":"10.1109\/CVPRW.2012.6239188"},{"key":"4_CR7","unstructured":"Csurka G, Dance CR, Fan L, Willamowski J, Bray C (2004) Visual categorization with bags of keypoints. In: Workshop on statistical learning in computer vision, ECCV, pp 1\u201322"},{"key":"4_CR8","doi-asserted-by":"crossref","unstructured":"Dalal N, Triggs B (2005) Histograms of oriented gradients for human detection. In: Schmid C, Soatto S, Tomasi C (eds) International conference on computer vision and pattern recognition, vol 2. INRIA Rh\u00f4ne-Alpes, ZIRST-655, av. de l\u2019Europe, Montbonnot-38334, pp 886\u2013893","DOI":"10.1109\/CVPR.2005.177"},{"key":"4_CR9","doi-asserted-by":"crossref","unstructured":"Jing F, Li M, Zhang H, Zhang B (2002) An effective region-based image retrieval framework. In: ACM international conference on multimedia, 2002","DOI":"10.1145\/641007.641106"},{"key":"4_CR10","doi-asserted-by":"crossref","unstructured":"Long F, Zhang H, Feng D (2003) Fundamentals of content-based image retrieval. In: Multimedia information retrieval and management, 2003","DOI":"10.1007\/978-3-662-05300-3_1"},{"issue":"6","key":"4_CR11","doi-asserted-by":"publisher","first-page":"703","DOI":"10.1109\/76.927424","volume":"11","author":"B Manjunath","year":"2001","unstructured":"Manjunath B, Ohm J, Vasudevan V, Yamada A (2001) Colour and texture descriptors. IEEE Trans Circ Sys Video Technol 11(6):703\u2013715","journal-title":"IEEE Trans Circ Sys Video Technol"},{"key":"4_CR12","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"DG Lowe","year":"2004","unstructured":"Lowe DG (2004) Distinctive image features from scale-invariant keypoints. Intern J Comput Vis 60:91\u2013110","journal-title":"Intern J Comput Vis"},{"key":"4_CR13","doi-asserted-by":"crossref","first-page":"346","DOI":"10.1016\/j.cviu.2007.09.014","volume":"110","author":"H Bay","year":"2008","unstructured":"Bay H, Ess A, Tuytelaars T, Van Gool L (2008) Speeded-up robust features (surf). Comput Vis Image Underst 110:346\u2013359","journal-title":"Comput Vis Image Underst"},{"issue":"12","key":"4_CR14","doi-asserted-by":"publisher","first-page":"1376","DOI":"10.1109\/34.735812","volume":"20","author":"F Mokhtarian","year":"1998","unstructured":"Mokhtarian F, Suomela R (1998) Robust image corner detection through curvature scale space. IEEE Trans Pattern Anal Mach Intell 20(12):1376\u20131381","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4_CR15","doi-asserted-by":"crossref","unstructured":"Sivic J, Zisserman A (2003) Video google: a text retrieval approach to object matching in videos. In: Proceedings of the international conference on computer vision 2:1470\u20131477","DOI":"10.1109\/ICCV.2003.1238663"},{"key":"4_CR16","doi-asserted-by":"crossref","unstructured":"Viola P, Jones M (2001) Rapid object detection using a boosted cascade of simple features. In: 2001 IEEE computer society conference on computer vision and pattern recognition, vol 1. IEEE, Los Alamitos, pp 511\u2013518","DOI":"10.1109\/CVPR.2001.990517"},{"key":"4_CR17","doi-asserted-by":"crossref","unstructured":"Pirsiavash H, Ramanan D (2012) Detecting activities of daily living in first-person camera views. In: 2012 IEEE conference on computer vision and pattern recognition (CVPR), IEEE, 2012","DOI":"10.1109\/CVPR.2012.6248010"},{"key":"4_CR18","doi-asserted-by":"crossref","unstructured":"de Carvalho Soares R, da Silva I, Guliato D (2012) Spatial locality weighting of features using saliency map with a bag-of-visual-words approach. In: IEEE 24th international conference on tools with artificial intelligence (ICTAI), vol 1. pp 1070\u20131075","DOI":"10.1109\/ICTAI.2012.151"},{"key":"4_CR19","doi-asserted-by":"crossref","unstructured":"Sharma G, Jurie F, Schmid C (2012) Discriminative spatial saliency for image classification. In: IEEE conference on computer vision and pattern recognition (CVPR), pp 3506\u20133513","DOI":"10.1109\/CVPR.2012.6248093"},{"key":"4_CR20","doi-asserted-by":"crossref","unstructured":"Vig E, Dorr M, Cox D (2012) Space-variant descriptor sampling for action recognition based on saliency and eye movements. Springer, Firenze, pp 84\u201397","DOI":"10.1007\/978-3-642-33786-4_7"},{"issue":"1","key":"4_CR21","doi-asserted-by":"crossref","first-page":"97","DOI":"10.1016\/0010-0285(80)90005-5","volume":"12","author":"AM Treisman","year":"1980","unstructured":"Treisman AM, Gelade G (1980) A feature-integration theory of attention. Cogn Psychol 12(1):97\u2013136","journal-title":"Cogn Psychol"},{"issue":"9","key":"4_CR22","doi-asserted-by":"crossref","first-page":"1758","DOI":"10.1109\/TPAMI.2011.220","volume":"34","author":"A Borji","year":"2012","unstructured":"Borji A, Itti L (2012) State-of-the-art in visual attention modeling. IEEE Trans Pattern Anal Mach Intell 99 (PrePrints), 34(9):1758\u20131772","journal-title":"IEEE Trans Pattern Anal Mach Intell 99 (PrePrints)"},{"key":"4_CR23","doi-asserted-by":"crossref","unstructured":"Vig E, Dorr M, Cox D (2012) Space-variant descriptor sampling for action recognition based on saliency and eye movements. In: European conference on computer vision, 2012","DOI":"10.1007\/978-3-642-33786-4_7"},{"issue":"14","key":"4_CR24","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1167\/7.14.4","volume":"7","author":"BW Tatler","year":"2007","unstructured":"Tatler BW (2007) The central fixation bias in scene viewing: selecting an optimal viewing position independently of motor biases and image feature distributions. J Vis 7(14):1\u201317","journal-title":"J Vis"},{"issue":"10","key":"4_CR25","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1167\/10.10.28","volume":"10","author":"M Dorr","year":"2010","unstructured":"Dorr M, Martinetz T, Gegenfurtner KR, Barth E (2010) Variability of eye movements when viewing dynamic natural scenes. J Vis, 10(10):28","journal-title":"J Vis"},{"key":"4_CR26","first-page":"219","volume":"4","author":"C Koch","year":"1985","unstructured":"Koch C, Ullman S (1985) Shifts in selective visual attention: towards the underlying neural circuitry. Hum Neurobiol 4:219\u2013227","journal-title":"Hum Neurobiol"},{"key":"4_CR27","volume-title":"Attention and performance X: control of language processes","author":"MI Posner","year":"1984","unstructured":"Posner MI, Cohen YA (1984) Components of visual orienting. In: Bouma H, Bouwhuis DG (eds) Attention and performance X: control of language processes. Lawrence Erlbaum, Hillsdale"},{"issue":"1","key":"4_CR28","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1016\/S0042-6989(01)00250-4","volume":"42","author":"D Parkhurst","year":"2002","unstructured":"Parkhurst D, Law K, Niebur E (2002) Modeling the role of salience in the allocation of overt visual attention. Vis Res 42(1):107\u2013123","journal-title":"Vis Res"},{"key":"4_CR29","doi-asserted-by":"crossref","unstructured":"Harel J, Koch C, Perona P (2007) Graph-based visual saliency. In: Advances in neural information processing systems 19. MIT Press, Cambridge, pp 545\u2013552","DOI":"10.7551\/mitpress\/7503.003.0073"},{"issue":"3","key":"4_CR30","doi-asserted-by":"crossref","first-page":"231","DOI":"10.1007\/s11263-009-0215-3","volume":"82","author":"S Marat","year":"2009","unstructured":"Marat S, Ho Phuoc T, Granjon L, Guyader N, Pellerin D, Gu\u00e9rin-Dugu\u00e9, V (2009) Modelling spatio-temporal saliency to predict gaze direction for short videos. Intern J Comput Vis 82(3):231\u2013243","journal-title":"Intern J Comput Vis"},{"issue":"11","key":"4_CR31","doi-asserted-by":"crossref","first-page":"1254","DOI":"10.1109\/34.730558","volume":"20","author":"L Itti","year":"1998","unstructured":"Itti L, Koch C, Niebur E (1998) A model of saliency-based visual attention for rapid scene analysis. IEEE Trans Pattern Anal Mach Intell 20(11):1254\u20131259","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"4_CR32","unstructured":"Itti L, Baldi PF (2006) Bayesian surprise attracts human attention. In: Advances in neural information processing systems, (NIPS*2005) vol 19. MIT Press, Cambridge, pp 547\u2013554"},{"key":"4_CR33","first-page":"155","volume-title":"Advances in Neural Information Processing Systems 18","author":"JK Tsotsos","year":"2006","unstructured":"Tsotsos JK, Bruce NDB (2006) Saliency based on information maximization. In: Weiss Y, Sch\u00f6lkopf B, Platt J (eds) Advances in Neural Information Processing Systems 18. MIT Press, Cambridge, pp 155\u2013162"},{"key":"4_CR34","unstructured":"Itti L, Braun J, Lee DK, Koch C (1999) Attentional modulation of human pattern discrimination psychophysics reproduced by a quantitative model. In: Advances in neural information processing systems. MIT Press, Cambridge, p 1998"},{"issue":"10\u201312","key":"4_CR35","doi-asserted-by":"crossref","first-page":"1489","DOI":"10.1016\/S0042-6989(99)00163-7","volume":"40","author":"L Itti","year":"2000","unstructured":"Itti L (June 2000) A saliency-based search mechanism for overt and covert shifts of visual attention. Vis Res 40(10\u201312):1489\u20131506","journal-title":"Vis Res"},{"issue":"4","key":"4_CR36","doi-asserted-by":"crossref","first-page":"375","DOI":"10.1038\/7286","volume":"2","author":"DK Lee","year":"1999","unstructured":"Lee DK, Itti L, Koch C, Braun J (Apr 1999) Attention activates winner-take-all competition among visual filters. Nat Neurosci 2(4):375\u201381","journal-title":"Nat Neurosci"},{"key":"4_CR37","unstructured":"Brouard O, Ricordel V, Barba D (2009) Cartes de Saillance Spatio-Temporelle bas\u00e9es Contrastes de Couleur et Mouvement Relatif. In: Compression et representation des signaux audiovisuels, 2009"},{"key":"4_CR38","unstructured":"Farneb\u00e4ck G (2000) Fast and accurate motion estimation using orientation tensors and parametric motion models. In: Proceedings of 15th international conference on pattern recognition, vol 1. IAPR, Barcelona, Sept 2000, pp 135\u2013139"},{"key":"4_CR39","doi-asserted-by":"crossref","first-page":"381","DOI":"10.1145\/358669.358692","volume":"24","author":"MA Fischler","year":"1981","unstructured":"Fischler MA, Bolles RC (June 1981) Random sample consensus: a paradigm for model fitting with applications to image analysis and automated cartography. Commun ACM 24:381\u2013395","journal-title":"Commun ACM"},{"key":"4_CR40","doi-asserted-by":"crossref","unstructured":"Daly SJ (1998) Engineering observations from spatiovelocity and spatiotemporal visual models. In: IS&T\/SPIE conference on human vision and electronic imaging III:1, 1998","DOI":"10.1117\/12.320110"},{"key":"4_CR41","doi-asserted-by":"crossref","unstructured":"Boujut H, Benois-Pineau J, Megret R (2012) Fusion of multiple visual cues for visual saliency extraction from wearable camera settings with strong motion. In: Fusiello A, Murino V, Cucchiara R (eds) Computer vision\u2014ECCV 2012. Workshops and Demonstrations, Lecture Notes in Computer Science, vol 7585. Springer, Berlin, pp 436\u2013445","DOI":"10.1007\/978-3-642-33885-4_44"},{"key":"4_CR42","doi-asserted-by":"publisher","first-page":"1311","DOI":"10.1068\/p2935","volume":"28","author":"M Land","year":"1999","unstructured":"Land M, Mennie N, Rusted J (1999) The roles of vision and eye movements in the control of activities of daily living. Perception 28:1311\u20131328","journal-title":"Perception"},{"issue":"3","key":"4_CR43","doi-asserted-by":"crossref","first-page":"553","DOI":"10.1137\/0904038","volume":"4","author":"JJ Mor\u00e9","year":"1983","unstructured":"Mor\u00e9 JJ, Sorensen DC (1983) Computing a trust region step. SIAM J Sci Stat Comput 4(3):553\u2013572","journal-title":"SIAM J Sci Stat Comput"},{"key":"4_CR44","doi-asserted-by":"crossref","unstructured":"Boujut H, Benois-Pineau J, Ahmed T, Hadar O, Bonnet P (2011) A metric for no-reference video quality assessment for hd tv delivery based on saliency maps. In: IEEE international conference on multimedia and expo, July 2011","DOI":"10.1109\/ICME.2011.6012136"},{"key":"4_CR45","doi-asserted-by":"publisher","first-page":"284","DOI":"10.1007\/s11263-009-0271-8","volume":"88","author":"T Tuytelaars","year":"2010","unstructured":"Tuytelaars T, Lampert C, Blaschko M, Buntine W (2010) Unsupervised object discovery: a comparison. Intern J Comput Vis 88:284\u2013302","journal-title":"Intern J Comput Vis"},{"key":"4_CR46","doi-asserted-by":"crossref","unstructured":"Philbin J, Chum O, Isard M, Sivic J, Zisserman A (2008) Lost in quantization: improving particular object retrieval in large scale image databases. In: IEEE conference on computer vision and pattern recognition, pp 1\u20138, June 2008","DOI":"10.1109\/CVPR.2008.4587635"},{"key":"4_CR47","doi-asserted-by":"crossref","unstructured":"Marsza\u0142ek M, Schmid C (2006) Spatial weighting for bag-of-features. In: IEEE conference on computer vision and pattern recognition, vol 2. pp 2118\u20132125","DOI":"10.1109\/CVPR.2006.288"},{"key":"4_CR48","first-page":"273","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes C, Vapnik V (1995) Support-vector networks. Mach Learn 20:273\u2013297","journal-title":"Mach Learn"},{"key":"4_CR49","unstructured":"Sreekanth V, Vedaldi A, Jawahar CV, Zisserman A (2010) Generalized RBF feature maps for efficient detection. In: Proceedings of the British machine vision conference (BMVC), 2010"},{"key":"4_CR50","doi-asserted-by":"crossref","unstructured":"Fathi A, Ren X, Rehg JM (2011) Learning to recognize objects in egocentric activities. In: The 24th IEEE conference on computer vision and pattern recognition, CVPR 2011, IEEE, Colorado Springs, 20\u201325 June 2011, pp 3281\u20133288","DOI":"10.1109\/CVPR.2011.5995444"},{"key":"4_CR51","unstructured":"Over P, Awad G, Michel M, Fiscus J, Sanders G, Shaw B, Kraaij W, Smeaton AF, Qu\u00e9enot G (2012) Trecvid 2012\u2014an overview of the goals, tasks, data, evaluation mechanisms and metrics. In: Proceedings of TRECVID 2012, NIST, USA, 2012"}],"container-title":["Advances in Computer Vision and Pattern Recognition","Fusion in Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-05696-8_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,13]],"date-time":"2023-07-13T00:39:22Z","timestamp":1689208762000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-05696-8_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319056951","9783319056968"],"references-count":51,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-05696-8_4","relation":{},"ISSN":["2191-6586","2191-6594"],"issn-type":[{"type":"print","value":"2191-6586"},{"type":"electronic","value":"2191-6594"}],"subject":[],"published":{"date-parts":[[2014]]},"assertion":[{"value":"26 March 2014","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}