{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,19]],"date-time":"2026-06-19T02:18:45Z","timestamp":1781835525599,"version":"3.54.5"},"publisher-location":"Cham","reference-count":49,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319464534","type":"print"},{"value":"9783319464541","type":"electronic"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-46454-1_30","type":"book-chapter","created":{"date-parts":[[2016,9,15]],"date-time":"2016-09-15T09:15:09Z","timestamp":1473930909000},"page":"489-505","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":51,"title":["Look-Ahead Before You Leap: End-to-End Active Recognition by Forecasting the Effect of Motion"],"prefix":"10.1007","author":[{"given":"Dinesh","family":"Jayaraman","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kristen","family":"Grauman","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2016,9,16]]},"reference":[{"key":"30_CR1","doi-asserted-by":"crossref","unstructured":"Agrawal, P., Carreira, J., Malik, J.: Learning to see by moving. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.13"},{"key":"30_CR2","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1007\/BF00133571","volume":"1","author":"J Aloimonos","year":"1988","unstructured":"Aloimonos, J., Weiss, I., Bandyopadhyay, A.: Active vision. IJCV 1, 333\u2013356 (1988)","journal-title":"IJCV"},{"key":"30_CR3","doi-asserted-by":"crossref","unstructured":"Andreopoulos, A., Tsotsos, J.: A theory of active object localization. In: ICCV (2009)","DOI":"10.1109\/ICCV.2009.5459332"},{"key":"30_CR4","first-page":"827","volume":"117","author":"A Andreopoulos","year":"2013","unstructured":"Andreopoulos, A., Tsotsos, J.: 50 years of object recognition: directions forward. CVIU 117, 827\u2013891 (2013)","journal-title":"CVIU"},{"key":"30_CR5","unstructured":"Ba, J., Mnih, V., Kavukcuoglu, K.: Multiple object recognition with visual attention. In: ICLR (2015)"},{"key":"30_CR6","doi-asserted-by":"publisher","first-page":"996","DOI":"10.1109\/5.5968","volume":"76","author":"R Bajcsy","year":"1988","unstructured":"Bajcsy, R.: Active perception. Proc. IEEE 76, 996\u20131005 (1988)","journal-title":"Proc. IEEE"},{"key":"30_CR7","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1016\/0004-3702(91)90080-4","volume":"48","author":"D Ballard","year":"1991","unstructured":"Ballard, D.: Animate vision. Artif. Intell. 48, 57\u201386 (1991)","journal-title":"Artif. Intell."},{"key":"30_CR8","unstructured":"Bazzani, L., et al.: Learning attentional policies for tracking and recognition in video with deep networks. In: ICML (2011)"},{"key":"30_CR9","first-page":"281","volume":"13","author":"J Bergstra","year":"2012","unstructured":"Bergstra, J., Bengio, Y.: Random search for hyper-parameter optimization. JMLR 13, 281\u2013305 (2012)","journal-title":"JMLR"},{"key":"30_CR10","doi-asserted-by":"crossref","unstructured":"Borotschnig, H., Paletta, L., Prantl, M., Pinz, A., et al.: Active object recognition in parametric eigenspace. In: BMVC (1998)","DOI":"10.5244\/C.12.63"},{"key":"30_CR11","doi-asserted-by":"crossref","unstructured":"Bowling, M., Ghodsi, A., Wilkinson, D.: Action respecting embedding. In: ICML (2005)","DOI":"10.1145\/1102351.1102360"},{"key":"30_CR12","unstructured":"Brentano, F.: Psychologie vom empirischen Standpunkte (1874)"},{"key":"30_CR13","doi-asserted-by":"crossref","unstructured":"Butko, N., Movellan, J.: Optimal scanning for faster object detection. In: CVPR (2009)","DOI":"10.1109\/CVPR.2009.5206540"},{"key":"30_CR14","doi-asserted-by":"publisher","first-page":"189","DOI":"10.1023\/A:1011135513777","volume":"43","author":"F Callari","year":"2001","unstructured":"Callari, F., Ferrie, F.: Active object recognition: looking for differences. IJCV 43, 189\u2013204 (2001)","journal-title":"IJCV"},{"key":"30_CR15","doi-asserted-by":"crossref","unstructured":"Chen, C., Seff, A., Kornhauser, A., Xiao, J.: DeepDriving: learning affordance for direct perception in autonomous driving. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.312"},{"key":"30_CR16","unstructured":"Cohen, T.S., Welling, M.: Transformation properties of learned visual representations. arXiv preprint \n                      arXiv:1412.7659\n                      \n                     (2014)"},{"key":"30_CR17","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1109\/34.982896","volume":"24","author":"J Denzler","year":"2002","unstructured":"Denzler, J., Brown, C.M.: Information theoretic sensor data selection for active object recognition and state estimation. TPAMI 24, 145\u2013157 (2002)","journal-title":"TPAMI"},{"key":"30_CR18","first-page":"239","volume":"67","author":"S Dickinson","year":"1997","unstructured":"Dickinson, S., Christensen, H., Tsotsos, J., Olofsson, G.: Active object recognition integrating attention and viewpoint control. CVIU 67, 239\u2013260 (1997)","journal-title":"CVIU"},{"key":"30_CR19","unstructured":"Ding, W., Taylor, G.W.: Mental rotation by optimizing transforming distance. In: NIPS DL Workshop (2014)"},{"key":"30_CR20","doi-asserted-by":"crossref","unstructured":"Flynn, J., Neulander, I., Philbin, J., Snavely, N.: DeepStereo: Learning to predict new views from the world\u2019s imagery. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.595"},{"key":"30_CR21","unstructured":"Garcia, A.G., Vezhnevets, A., Ferrari, V.: An active search strategy for efficient object detection. In: CVPR (2015)"},{"key":"30_CR22","unstructured":"Helmer, S., et al.: Semantic robot vision challenge: current state and future directions. In: IJCAI Workshop (2009)"},{"key":"30_CR23","doi-asserted-by":"crossref","unstructured":"Jayaraman, D., Grauman, K.: Learning image representations tied to ego-motion. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.166"},{"key":"30_CR24","doi-asserted-by":"crossref","unstructured":"Jayaraman, D., Grauman, K.: Slow and steady feature analysis: higher order temporal coherence in video. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.418"},{"key":"30_CR25","unstructured":"Kulkarni, T.D., Whitney, W., Kohli, P., Tenenbaum, J.B.: Deep convolutional inverse graphics network. In: NIPS (2015)"},{"key":"30_CR26","unstructured":"Levine, S., Finn, C., Darrell, T., Abbeel, P.: End-to-End training of deep visuomotor policies. In: ICRA (2015)"},{"key":"30_CR27","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"740","DOI":"10.1007\/978-3-319-10602-1_48","volume-title":"Computer Vision \u2013 ECCV 2014","author":"T-Y Lin","year":"2014","unstructured":"Lin, T.-Y., Maire, M., Belongie, S., Hays, J., Perona, P., Ramanan, D., Doll\u00e1r, P., Zitnick, C.L.: Microsoft COCO: common objects in context. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014, Part V. LNCS, vol. 8693, pp. 740\u2013755. Springer, Heidelberg (2014)"},{"key":"30_CR28","unstructured":"Malmir, M., Sikka, K., Forster, D., Movellan, J., Cottrell, G.W.: Deep Q-learning for active recognition of GERMS. In: BMVC (2015)"},{"key":"30_CR29","doi-asserted-by":"crossref","unstructured":"Mishra, A., Aloimonos, Y., Fermuller, C.: Active segmentation for robotics. In: IROS (2009)","DOI":"10.1109\/IROS.2009.5354325"},{"key":"30_CR30","unstructured":"Mnih, V., Heess, N., Graves, A., Kavukcuoglu, K.: Recurrent models of visual attention. In: NIPS (2014)"},{"key":"30_CR31","doi-asserted-by":"crossref","unstructured":"Paletta, L., Pinz, A.: Active object recognition by view integration and reinforcement learning. In: RAS (2000)","DOI":"10.1016\/S0921-8890(99)00079-2"},{"key":"30_CR32","unstructured":"Ramanathan, V., Pinz, A.: Active object categorization on a humanoid robot. In: VISAPP (2011)"},{"key":"30_CR33","unstructured":"Ranzato, M., Szlam, A., Bruna, J., Mathieu, M., Collobert, R., Chopra, S.: Video (language) modeling: a baseline for generative models of natural videos. arXiv preprint \n                      arXiv:1412.6604\n                      \n                     (2014)"},{"key":"30_CR34","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., Krause, J., Satheesh, S., Ma, S., Huang, Z., Karpathy, A., Khosla, A., Bernstein, M., Berg, A.C., Fei-Fei, L.: ImageNet large scale visual recognition challenge. IJCV 115, 211\u2013252 (2015)","journal-title":"IJCV"},{"key":"30_CR35","unstructured":"Schiele, B., Crowley, J.: Transinformation for active object recognition. In: ICCV (1998)"},{"key":"30_CR36","unstructured":"Sermanet, P., Frome, A., Real, E.: Attention for fine-grained categorization. arXiv (2014)"},{"key":"30_CR37","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv (2014)"},{"key":"30_CR38","doi-asserted-by":"crossref","unstructured":"Soatto, S.: Actionable information in vision. In: ICCV (2009)","DOI":"10.1109\/ICCV.2009.5459468"},{"key":"30_CR39","doi-asserted-by":"crossref","unstructured":"Stober, J., Miikkulainen, R., Kuipers, B.: Learning geometry from sensorimotor experience. In: ICDL (2011)","DOI":"10.1109\/DEVLRN.2011.6037381"},{"key":"30_CR40","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Liu, W., Jia, Y., Sermanet, P., Reed, S., Anguelov, D., Erhan, D., Vanhoucke, V., Rabinovich, A.: Going deeper with convolutions. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"30_CR41","unstructured":"Vondrick, C., Pirsiavash, H., Torralba, A.: Anticipating the future by watching unlabeled video. In: CVPR (2016)"},{"key":"30_CR42","doi-asserted-by":"crossref","unstructured":"Walker, J., Gupta, A., Hebert, M.: Dense optical flow prediction from a static image. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.281"},{"key":"30_CR43","unstructured":"Watter, M., Springenberg, J.T., Boedecker, J., Riedmiller, M.: Embed to control: a locally linear latent dynamics model for control from raw images. In: NIPS (2015)"},{"key":"30_CR44","unstructured":"Wilkes, D., Tsotsos, J.: Active object recognition. In: CVPR (1992)"},{"key":"30_CR45","first-page":"229","volume":"8","author":"R Williams","year":"1992","unstructured":"Williams, R.: Simple statistical gradient-following algorithms for connectionist reinforcement learning. JMLR 8, 229\u2013256 (1992)","journal-title":"JMLR"},{"key":"30_CR46","unstructured":"Wu, Z., Song, S., Khosla, A., Yu, F., Zhang, L., Tang, X., Xiao, J.: 3D ShapeNets: a deep representation for volumetric shape modeling. In: CVPR (2015)"},{"key":"30_CR47","unstructured":"Xiao, J., Ehinger, K., Oliva, A., Torralba, A., et al.: Recognizing scene viewpoint using panoramic place representation. In: CVPR (2012)"},{"key":"30_CR48","unstructured":"Xu, K., Ba, J., Kiros, R., Cho, K., Courville, A., Salakhutdinov, R., Zemel, R., Bengio, Y.: Show, attend and tell: Neural image caption generation with visual attention. In: ICML (2015)"},{"key":"30_CR49","unstructured":"Yu, X., Fermuller, C., Teo, C.L., Yang, Y., Aloimonos, Y.: Active scene recognition with vision and language. In: CVPR (2011)"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2016"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-46454-1_30","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,10,10]],"date-time":"2020-10-10T01:46:47Z","timestamp":1602294407000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-46454-1_30"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319464534","9783319464541"],"references-count":49,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-46454-1_30","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016]]},"assertion":[{"value":"16 September 2016","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Amsterdam","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"The Netherlands","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2016","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 October 2016","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16 October 2016","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2016","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.eccv2016.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}