{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,2]],"date-time":"2026-01-02T07:36:10Z","timestamp":1767339370067,"version":"3.40.4"},"publisher-location":"Cham","reference-count":52,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319106014"},{"type":"electronic","value":"9783319106021"}],"license":[{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-10602-1_24","type":"book-chapter","created":{"date-parts":[[2014,8,14]],"date-time":"2014-08-14T07:07:56Z","timestamp":1408000076000},"page":"361-376","source":"Crossref","is-referenced-by-count":67,"title":["Training Object Class Detectors from Eye Tracking Data"],"prefix":"10.1007","author":[{"given":"Dim P.","family":"Papadopoulos","sequence":"first","affiliation":[]},{"given":"Alasdair D. F.","family":"Clarke","sequence":"additional","affiliation":[]},{"given":"Frank","family":"Keller","sequence":"additional","affiliation":[]},{"given":"Vittorio","family":"Ferrari","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"24_CR1","unstructured":"Imagenet large scale visual recognition challenge, ILSVRC (2011), http:\/\/www.image-net.org\/challenges\/LSVRC\/2011\/index"},{"key":"24_CR2","doi-asserted-by":"crossref","unstructured":"Alexe, B., Deselaers, T., Ferrari, V.: What is an object? In: CVPR (2010)","DOI":"10.1109\/CVPR.2010.5540226"},{"key":"24_CR3","unstructured":"Berg, T., Berg, A., Edwards, J., Mair, M., White, R., Teh, Y., Learned-Miller, E., Forsyth, D.: Names and Faces in the News. In: CVPR (2004)"},{"key":"24_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"428","DOI":"10.1007\/978-3-540-24670-1_33","volume-title":"Computer Vision - ECCV 2004","author":"A. Blake","year":"2004","unstructured":"Blake, A., Rother, C., Brown, M., Perez, P., Torr, P.: Interactive image segmentation using an adaptive GMMRF model. In: Pajdla, T., Matas, J(G.) (eds.) ECCV 2004. LNCS, vol.\u00a03021, pp. 428\u2013441. Springer, Heidelberg (2004)"},{"issue":"9","key":"24_CR5","doi-asserted-by":"publisher","first-page":"1124","DOI":"10.1109\/TPAMI.2004.60","volume":"26","author":"Y. Boykov","year":"2004","unstructured":"Boykov, Y., Kolmogorov, V.: An experimental comparison of min-cut\/max-flow algorithms for energy minimization in vision. IEEE Trans. on PAMI\u00a026(9), 1124\u20131137 (2004)","journal-title":"IEEE Trans. on PAMI"},{"key":"24_CR6","doi-asserted-by":"publisher","first-page":"433","DOI":"10.1163\/156856897X00357","volume":"10","author":"D.H. Brainard","year":"1997","unstructured":"Brainard, D.H.: The Psychophysics Toolbox. Spatial Vision\u00a010, 433\u2013436 (1997)","journal-title":"Spatial Vision"},{"key":"24_CR7","doi-asserted-by":"crossref","unstructured":"Chum, O., Zisserman, A.: An exemplar model for learning object classes. In: CVPR (2007)","DOI":"10.1109\/CVPR.2007.383050"},{"key":"24_CR8","unstructured":"Dalal, N., Triggs, B.: Histogram of Oriented Gradients for human detection. In: CVPR (2005)"},{"key":"24_CR9","doi-asserted-by":"crossref","unstructured":"Deselaers, T., Alexe, B., Ferrari, V.: Weakly supervised localization and learning with generic knowledge. IJCV (2012)","DOI":"10.1007\/s11263-012-0538-3"},{"key":"24_CR10","doi-asserted-by":"crossref","unstructured":"Deselaers, T., Ferrari, V.: Global and efficient self-similarity for object classification and detection. In: CVPR (2010)","DOI":"10.1109\/CVPR.2010.5539775"},{"key":"24_CR11","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1007\/3-540-47979-1_7","volume-title":"Computer Vision - ECCV 2002","author":"P. Duygulu","year":"2002","unstructured":"Duygulu, P., Barnard, K., de Freitas, J.F.G., Forsyth, D.: Object recognition as machine translation: Learning a lexicon for a fixed image vocabulary. In: Heyden, A., Sparr, G., Nielsen, M., Johansen, P. (eds.) ECCV 2002, Part IV. LNCS, vol.\u00a02353, pp. 97\u2013112. Springer, Heidelberg (2002)"},{"key":"24_CR12","first-page":"1","volume":"8","author":"W. Einh\u00e4user","year":"2008","unstructured":"Einh\u00e4user, W., Spain, M., Perona, P.: Objects predict fixations better than early saliency. Journal of Vision\u00a08, 1\u201326 (2008)","journal-title":"Journal of Vision"},{"key":"24_CR13","unstructured":"Everingham, M., Van Gool, L., Williams, C.K.I., Winn, J., Zisserman, A.: The PASCAL Visual Object Classes Challenge (VOC2012) Results (2012), http:\/\/www.pascal-network.org\/challenges\/VOC\/voc2012\/workshop\/index.html"},{"key":"24_CR14","doi-asserted-by":"crossref","unstructured":"Everingham, M., Van Gool, L., Williams, C.K.I., Winn, J., Zisserman, A.: The pascal visual object classes (voc) challenge. IJCV (2010)","DOI":"10.1007\/s11263-009-0275-4"},{"key":"24_CR15","doi-asserted-by":"crossref","unstructured":"Felzenszwalb, P., Girshick, R., McAllester, D., Ramanan, D.: Object detection with discriminatively trained part based models. IEEE Trans. on PAMI\u00a032(9) (2010)","DOI":"10.1109\/TPAMI.2009.167"},{"key":"24_CR16","unstructured":"Fergus, R., Perona, P., Zisserman, A.: Object class recognition by unsupervised scale-invariant learning. In: CVPR (2003)"},{"key":"24_CR17","doi-asserted-by":"crossref","unstructured":"Guillaumin, M., Ferrari, V.: Large-scale knowledge transfer for object localization in imagenet. In: CVPR (2012)","DOI":"10.1109\/CVPR.2012.6248055"},{"key":"24_CR18","doi-asserted-by":"crossref","unstructured":"Guillaumin, M., Kuettel, D., Ferrari, V.: ImageNet Auto-annotation with Segmentation Propagation. Tech. rep., ETH Zurich (2013)","DOI":"10.1007\/978-3-642-33786-4_34"},{"key":"24_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"16","DOI":"10.1007\/978-3-540-88682-2_3","volume-title":"Computer Vision \u2013 ECCV 2008","author":"A. Gupta","year":"2008","unstructured":"Gupta, A., Davis, L.S.: Beyond nouns: Exploiting prepositions and comparative adjectives for learning visual classifiers. In: Forsyth, D., Torr, P., Zisserman, A. (eds.) ECCV 2008, Part I. LNCS, vol.\u00a05302, pp. 16\u201329. Springer, Heidelberg (2008)"},{"key":"24_CR20","unstructured":"Hao, S., Deng, J., Fei-Fei, L.: Crowdsourcing annotations for visual object detection. In: AAAI (2012)"},{"key":"24_CR21","doi-asserted-by":"crossref","unstructured":"Harel, J., Koch, C., Perona, P.: Graph-based visual saliency. In: NIPS (2007)","DOI":"10.7551\/mitpress\/7503.003.0073"},{"key":"24_CR22","doi-asserted-by":"publisher","first-page":"498","DOI":"10.1016\/j.tics.2003.09.006","volume":"7","author":"J. Henderson","year":"2003","unstructured":"Henderson, J.: Human gaze control in real-world scene perception. Trends in Cognitive Sciences\u00a07, 498\u2013504 (2003)","journal-title":"Trends in Cognitive Sciences"},{"issue":"11","key":"24_CR23","doi-asserted-by":"publisher","first-page":"1254","DOI":"10.1109\/34.730558","volume":"20","author":"L. Itti","year":"1998","unstructured":"Itti, L., Koch, C., Niebur, E.: A model of saliency-based visual attention for rapid scene analysis. IEEE Trans. on PAMI\u00a020(11), 1254\u20131259 (1998)","journal-title":"IEEE Trans. on PAMI"},{"key":"24_CR24","doi-asserted-by":"crossref","unstructured":"Judd, T., Ehinger, K., Durand, F., Torralba, A.: Learning to predict where humans look. In: IEEE International Conference on Computer Vision, ICCV (2009)","DOI":"10.1109\/ICCV.2009.5459462"},{"key":"24_CR25","doi-asserted-by":"crossref","unstructured":"Karthikeyan, S., Jagadeesh, V., Shenoy, R., Eckstein, M., Manjunath, B.: From where and how to whatwe see. In: ICCV (2013)","DOI":"10.1109\/ICCV.2013.83"},{"key":"24_CR26","doi-asserted-by":"crossref","unstructured":"Kuettel, D., Ferrari, V.: Figure-ground segmentation by transferring window masks. In: CVPR (2012)","DOI":"10.1109\/CVPR.2012.6247721"},{"key":"24_CR27","doi-asserted-by":"crossref","unstructured":"Ladicky, L., Russell, C., Kohli, P.: Associative hierarchical crfs for object class image segmentation. In: ICCV (2009)","DOI":"10.1109\/ICCV.2009.5459248"},{"key":"24_CR28","doi-asserted-by":"crossref","unstructured":"Leistner, C., Godec, M., Schulter, S., Saffari, A., Bischof, H.: Improving classifiers with weakly-related videos. In: CVPR (2011)","DOI":"10.1109\/CVPR.2011.5995475"},{"key":"24_CR29","doi-asserted-by":"crossref","unstructured":"Levinshtein, A., Stere, A., Kutulakos, K., Fleed, D., Dickinson, S.: Turbopixels: Fast superpixels using geometric flows. IEEE Trans. on PAMI (2009)","DOI":"10.1109\/TPAMI.2009.96"},{"key":"24_CR30","unstructured":"Luo, J., Caputo, B., Ferrari, V.: Who\u2019s doing what: Joint modeling of names and verbs for simultaneous face and pose annotation. In: NIPS (2009)"},{"key":"24_CR31","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"842","DOI":"10.1007\/978-3-642-33709-3_60","volume-title":"Computer Vision \u2013 ECCV 2012","author":"S. Mathe","year":"2012","unstructured":"Mathe, S., Sminchisescu, C.: Dynamic eye movement datasets and learnt saliency models for visual action recognition. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012, Part II. LNCS, vol.\u00a07573, pp. 842\u2013856. Springer, Heidelberg (2012)"},{"key":"24_CR32","doi-asserted-by":"crossref","unstructured":"Mishra, A., Aloimonos, Y., Fah, C.L.: Active segmentation with fixation. In: ICCV (2009)","DOI":"10.1109\/IROS.2009.5354325"},{"issue":"8","key":"24_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1167\/10.8.20","volume":"10","author":"A. Nuthmann","year":"2010","unstructured":"Nuthmann, A., Henderson, J.M.: Object-based attentional selection in scene viewing. Journal of Vision\u00a010(8), 1\u201319 (2010)","journal-title":"Journal of Vision"},{"key":"24_CR34","doi-asserted-by":"crossref","unstructured":"Pandey, M., Lazebnik, S.: Scene recognition and weakly supervised object localization with deformable part-based models. In: ICCV (2011)","DOI":"10.1109\/ICCV.2011.6126383"},{"key":"24_CR35","unstructured":"Platt, J.: Probabilistic outputs for support vector machines and comparisons to regularized likelihood methods. Advances in large margin classifiers (1999)"},{"key":"24_CR36","doi-asserted-by":"crossref","unstructured":"Prest, A., Leistner, C., Civera, J., Schmid, C., Ferrari, V.: Learning object class detectors from weakly annotated video. In: CVPR (2012)","DOI":"10.1109\/CVPR.2012.6248065"},{"key":"24_CR37","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1007\/978-3-642-15561-1_3","volume-title":"Computer Vision \u2013 ECCV 2010","author":"S. Ramanathan","year":"2010","unstructured":"Ramanathan, S., Katti, H., Sebe, N., Kankanhalli, M., Chua, T.-S.: An eye fixation database for saliency detection in images. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010, Part IV. LNCS, vol.\u00a06314, pp. 30\u201343. Springer, Heidelberg (2010)"},{"key":"24_CR38","doi-asserted-by":"crossref","unstructured":"Rother, C., Kolmogorov, V., Blake, A.: Grabcut: interactive foreground extraction using iterated graph cuts. SIGGRAPH (2004)","DOI":"10.1145\/1186562.1015720"},{"key":"24_CR39","doi-asserted-by":"crossref","unstructured":"Siva, P., Russell, C., Xiang, T., Agapito, L.: Looking beyond the image: Unsupervised learning for object saliency and detection. In: CVPR (2013)","DOI":"10.1109\/CVPR.2013.416"},{"key":"24_CR40","doi-asserted-by":"crossref","unstructured":"Siva, P., Xiang, T.: Weakly supervised object detector learning with model drift detection. In: ICCV (2011)","DOI":"10.1109\/ICCV.2011.6126261"},{"key":"24_CR41","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"594","DOI":"10.1007\/978-3-642-33712-3_43","volume-title":"Computer Vision \u2013 ECCV 2012","author":"P. Siva","year":"2012","unstructured":"Siva, P., Russell, C., Xiang, T.: In defence of negative mining for annotating weakly labelled data. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012, Part III. LNCS, vol.\u00a07574, pp. 594\u2013608. Springer, Heidelberg (2012)"},{"key":"24_CR42","doi-asserted-by":"crossref","unstructured":"Tang, K., Sukthankar, R., Yagnik, J., Fei-Fei, L.: Discriminative segment annotation in weakly labeled video. In: CVPR (2013)","DOI":"10.1109\/CVPR.2013.321"},{"key":"24_CR43","unstructured":"Vedaldi, A., Fulkerson, B.: VLFeat: An open and portable library of computer vision algorithms (2008)"},{"key":"24_CR44","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/978-3-642-15555-0_16","volume-title":"Computer Vision \u2013 ECCV 2010","author":"O. Veksler","year":"2010","unstructured":"Veksler, O., Boykov, Y., Mehrani, P.: Superpixels and supervoxels in an energy optimization framework. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010, Part V. LNCS, vol.\u00a06315, pp. 211\u2013224. Springer, Heidelberg (2010)"},{"key":"24_CR45","doi-asserted-by":"crossref","unstructured":"Vicente, S., Rother, C., Kolmogorov, V.: Object cosegmentation. In: CVPR, pp. 2217\u20132224 (2011)","DOI":"10.1109\/CVPR.2011.5995530"},{"key":"24_CR46","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1007\/978-3-642-33786-4_7","volume-title":"Computer Vision \u2013 ECCV 2012","author":"E. Vig","year":"2012","unstructured":"Vig, E., Dorr, M., Cox, D.: Space-variant descriptor sampling for action recognition based on saliency and eye movements. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012, Part VII. LNCS, vol.\u00a07578, pp. 84\u201397. Springer, Heidelberg (2012)"},{"key":"24_CR47","unstructured":"Viola, P.A., Platt, J., Zhang, C.: Multiple instance boosting for object detection. In: NIPS (2005)"},{"key":"24_CR48","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1007\/978-3-642-35725-1_4","volume-title":"Advances in Multimedia Modeling","author":"T. Walber","year":"2013","unstructured":"Walber, T., Scherp, A., Staab, S.: Can you see it? Two novel eye-tracking-based measures for assigning tags to image regions. In: Li, S., El Saddik, A., Wang, M., Mei, T., Sebe, N., Yan, S., Hong, R., Gurrin, C. (eds.) MMM 2013, Part I. LNCS, vol.\u00a07732, pp. 36\u201346. Springer, Heidelberg (2013)"},{"key":"24_CR49","doi-asserted-by":"crossref","unstructured":"Wang, J., Cohen, M.: An iterative optimization approach for unified image segmentation and matting. In: ICCV (2005)","DOI":"10.1109\/ICCV.2005.37"},{"key":"24_CR50","doi-asserted-by":"crossref","unstructured":"Wang, X., Yang, M., Zhu, S., Lin, Y.: Regionlets for generic object detection. In: ICCV (2013)","DOI":"10.1109\/ICCV.2013.10"},{"issue":"7","key":"24_CR51","doi-asserted-by":"publisher","first-page":"3325","DOI":"10.4249\/scholarpedia.3325","volume":"3","author":"J. Wolfe","year":"2008","unstructured":"Wolfe, J., Horowitz, T.S.: Visual search. Scholarpedia\u00a03(7), 3325 (2008)","journal-title":"Scholarpedia"},{"key":"24_CR52","doi-asserted-by":"crossref","unstructured":"Yun, K., Peng, Y., Samaras, D., Zelinsky, G.J., Berg, T.L.: Studying relationships between human gaze, description, and computer vision. In: CVPR (2013)","DOI":"10.1109\/CVPR.2013.101"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2014"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-10602-1_24","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,4]],"date-time":"2025-05-04T05:37:27Z","timestamp":1746337047000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-10602-1_24"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319106014","9783319106021"],"references-count":52,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-10602-1_24","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2014]]}}}