{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T19:10:49Z","timestamp":1775243449317,"version":"3.50.1"},"publisher-location":"Cham","reference-count":60,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030012458","type":"print"},{"value":"9783030012465","type":"electronic"}],"license":[{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2018,1,1]],"date-time":"2018-01-01T00:00:00Z","timestamp":1514764800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018]]},"DOI":"10.1007\/978-3-030-01246-5_11","type":"book-chapter","created":{"date-parts":[[2018,10,5]],"date-time":"2018-10-05T16:14:56Z","timestamp":1538756096000},"page":"172-190","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":115,"title":["Attributes as Operators: Factorizing Unseen Attribute-Object Compositions"],"prefix":"10.1007","author":[{"given":"Tushar","family":"Nagarajan","sequence":"first","affiliation":[]},{"given":"Kristen","family":"Grauman","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,10,6]]},"reference":[{"key":"11_CR1","doi-asserted-by":"crossref","unstructured":"Al-Halah, Z., Tapaswi, M., Stiefelhagen, R.: Recovering the missing link: predicting class-attribute associations for unsupervised zero-shot learning. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.643"},{"key":"11_CR2","doi-asserted-by":"crossref","unstructured":"Alayrac, J.B., Sivic, J., Laptev, I., Lacoste-Julien, S.: Joint discovery of object states and manipulating actions. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.234"},{"key":"11_CR3","unstructured":"Baroni, M., Zamparelli, R.: Nouns are vectors, adjectives are matrices: representing adjective-noun constructions in semantic space. In: EMNLP (2010)"},{"key":"11_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"663","DOI":"10.1007\/978-3-642-15549-9_48","volume-title":"Computer Vision \u2013 ECCV 2010","author":"TL Berg","year":"2010","unstructured":"Berg, T.L., Berg, A.C., Shih, J.: Automatic attribute discovery and characterization from noisy web data. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010. LNCS, vol. 6311, pp. 663\u2013676. Springer, Heidelberg (2010). https:\/\/doi.org\/10.1007\/978-3-642-15549-9_48"},{"key":"11_CR5","doi-asserted-by":"crossref","unstructured":"Chen, C.Y., Grauman, K.: Inferring analogous attributes. In: CVPR (2014)","DOI":"10.1109\/CVPR.2014.33"},{"key":"11_CR6","doi-asserted-by":"crossref","unstructured":"Chen, L., Zhang, H., Xiao, J., Liu, W., Chang, S.F.: Zero-shot visual recognition using semantics-preserving adversarial embedding network. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00115"},{"key":"11_CR7","doi-asserted-by":"crossref","unstructured":"Cheng, D., Gong, Y., Zhou, S., Wang, J., Zheng, N.: Person re-identification by multi-channel parts-based cnn with improved triplet loss function. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.149"},{"key":"11_CR8","doi-asserted-by":"crossref","unstructured":"Choe, J., Park, S., Kim, K., Park, J.H., Kim, D., Shim, H.: Face generation for low-shot learning using generative adversarial networks. In: ICCVW (2017)","DOI":"10.1109\/ICCVW.2017.229"},{"key":"11_CR9","doi-asserted-by":"crossref","unstructured":"Cruz, R.S., Fernando, B., Cherian, A., Gould, S.: Neural algebra of classifiers. In: WACV (2018)","DOI":"10.1109\/WACV.2018.00085"},{"key":"11_CR10","doi-asserted-by":"crossref","unstructured":"Dixit, M., Kwitt, R., Niethammer, M., Vasconcelos, N.: Aga: Attribute-guided augmentation. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.355"},{"key":"11_CR11","doi-asserted-by":"crossref","unstructured":"Farhadi, A., Endres, I., Hoiem, D., Forsyth, D.: Describing objects by their attributes. In: CVPR (2009)","DOI":"10.1109\/CVPR.2009.5206772"},{"key":"11_CR12","doi-asserted-by":"crossref","unstructured":"Fathi, A., Rehg, J.M.: Modeling actions through state changes. In: CVPR (2013)","DOI":"10.1109\/CVPR.2013.333"},{"key":"11_CR13","unstructured":"Guevara, E.: A regression model of adjective-noun compositionality in distributional semantics. In: ACL Workshop on Geometrical Models of Natural Language Semantics (2010)"},{"key":"11_CR14","doi-asserted-by":"crossref","unstructured":"Hariharan, B., Girshick, R.: Low-shot visual recognition by shrinking and hallucinating features. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.328"},{"key":"11_CR15","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"11_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1007\/978-3-319-24261-3_7","volume-title":"Similarity-Based Pattern Recognition","author":"E Hoffer","year":"2015","unstructured":"Hoffer, E., Ailon, N.: Deep metric learning using triplet network. In: Feragen, A., Pelillo, M., Loog, M. (eds.) SIMBAD 2015. LNCS, vol. 9370, pp. 84\u201392. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-24261-3_7"},{"key":"11_CR17","doi-asserted-by":"crossref","unstructured":"Hsiao, W.L., Grauman, K.: Learning the latent look: Unsupervised discovery of a style-coherent embedding from fashion images. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.451"},{"key":"11_CR18","doi-asserted-by":"crossref","unstructured":"Huang, J., Feris, R., Chen, Q., Yan, S.: Cross-domain image retrieval with a dual attribute-aware ranking network. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.127"},{"key":"11_CR19","doi-asserted-by":"crossref","unstructured":"Huang, S., Elhoseiny, M., Elgammal, A., Yang, D.: Learning hypergraph-regularized attribute predictors. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298638"},{"key":"11_CR20","doi-asserted-by":"crossref","unstructured":"Isola, P., Lim, J.J., Adelson, E.H.: Discovering states and transformations in image collections. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298744"},{"key":"11_CR21","unstructured":"Jayaraman, D., Grauman, K.: Zero-shot recognition with unreliable attributes. In: NIPS (2014)"},{"key":"11_CR22","doi-asserted-by":"crossref","unstructured":"Jayaraman, D., Grauman, K.: Learning image representations tied to ego-motion. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.166"},{"key":"11_CR23","doi-asserted-by":"crossref","unstructured":"Jayaraman, D., Sha, F., Grauman, K.: Decorrelating semantic visual attributes by resisting the urge to share. In: CVPR (2014)","DOI":"10.1109\/CVPR.2014.211"},{"key":"11_CR24","doi-asserted-by":"crossref","unstructured":"Kovashka, A., Parikh, D., Grauman, K.: Whittlesearch: image search with relative attribute feedback. In: CVPR (2012)","DOI":"10.1109\/CVPR.2012.6248026"},{"issue":"12","key":"11_CR25","doi-asserted-by":"publisher","first-page":"2891","DOI":"10.1109\/TPAMI.2012.162","volume":"35","author":"Girish Kulkarni","year":"2013","unstructured":"Kulkarni, G., et al.: Babytalk: understanding and generating simple image descriptions. TPAMI 35, 2891\u20132903 (2013)","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"11_CR26","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"340","DOI":"10.1007\/978-3-540-88693-8_25","volume-title":"Computer Vision \u2013 ECCV 2008","author":"N Kumar","year":"2008","unstructured":"Kumar, N., Belhumeur, P., Nayar, S.: FaceTracer: a search engine for large collections of images with faces. In: Forsyth, D., Torr, P., Zisserman, A. (eds.) ECCV 2008. LNCS, vol. 5305, pp. 340\u2013353. Springer, Heidelberg (2008). https:\/\/doi.org\/10.1007\/978-3-540-88693-8_25"},{"key":"11_CR27","doi-asserted-by":"crossref","unstructured":"Laffont, P.Y., Ren, Z., Tao, X., Qian, C., Hays, J.: Transient attributes for high-level understanding and editing of outdoor scenes. In: SIGGRAPH (2014)","DOI":"10.1145\/2601097.2601101"},{"key":"11_CR28","doi-asserted-by":"crossref","unstructured":"Lampert, C.H., Nickisch, H., Harmeling, S.: Learning to detect unseen object classes by between-class attribute transfer. In: CVPR (2009)","DOI":"10.1109\/CVPR.2009.5206594"},{"key":"11_CR29","doi-asserted-by":"crossref","unstructured":"Liu, Z., Luo, P., Wang, X., Tang, X.: Deep learning face attributes in the wild. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.425"},{"key":"11_CR30","doi-asserted-by":"crossref","unstructured":"Lu, C., Krishna, R., Bernstein, M., Fei-Fei, L.: Visual relationship detection with language priors. In: ECCV (2016)","DOI":"10.1007\/978-3-319-46448-0_51"},{"key":"11_CR31","unstructured":"Lu, J., Li, J., Yan, Z., Zhang, C.: Zero-shot learning by generating pseudo feature representations. arXiv preprint arXiv:1703.06389 (2017)"},{"key":"11_CR32","doi-asserted-by":"crossref","unstructured":"Lu, Y., Kumar, A., Zhai, S., Cheng, Y., Javidi, T., Feris, R.: Fully-adaptive feature sharing in multi-task networks with applications in person attribute classification. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.126"},{"key":"11_CR33","doi-asserted-by":"crossref","unstructured":"Misra, I., Gupta, A., Hebert, M.: From red wine to red tomato: composition with context. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.129"},{"key":"11_CR34","doi-asserted-by":"crossref","unstructured":"Mitchell, J., Lapata, M.: Vector-based models of semantic composition. In: HLT, ACL (2008)","DOI":"10.3115\/1699510.1699567"},{"key":"11_CR35","unstructured":"Nguyen, D.T., Lazaridou, A., Bernardi, R.: Coloring objects: adjective-noun visual semantic compositionality. In: ACL Workshop on Vision and Language (2014)"},{"key":"11_CR36","doi-asserted-by":"crossref","unstructured":"Parikh, D., Grauman, K.: Relative attributes. In: ICCV (2011)","DOI":"10.1109\/ICCV.2011.6126281"},{"key":"11_CR37","doi-asserted-by":"crossref","unstructured":"Patterson, G., Hays, J.: Sun attribute database: discovering, annotating, and recognizing scene attributes. In: CVPR (2012)","DOI":"10.1109\/CVPR.2012.6247998"},{"key":"11_CR38","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C.: Glove: global vectors for word representation. In: EMNLP (2014)","DOI":"10.3115\/v1\/D14-1162"},{"key":"11_CR39","doi-asserted-by":"crossref","unstructured":"Pezzelle, S., Shekhar, R., Bernardi, R.: Building a bagpipe with a bag and a pipe: exploring conceptual combination in vision. In: ACL Workshop on Vision and Language (2016)","DOI":"10.18653\/v1\/W16-3208"},{"issue":"3","key":"11_CR40","doi-asserted-by":"publisher","first-page":"382","DOI":"10.1016\/0010-0285(76)90013-X","volume":"8","author":"Eleanor Rosch","year":"1976","unstructured":"Rosch, E., Mervis, C.B., Gray, W.D., Johnson, D.M., Boyes-Braem, P.: Basic objects in natural categories. Cogn. Psychol. 8(3), 382\u2013439 (1976)","journal-title":"Cognitive Psychology"},{"issue":"3","key":"11_CR41","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"Olga Russakovsky","year":"2015","unstructured":"Russakovsky, O., et al.: Imagenet large scale visual recognition challenge. IJCV 115(3), 211\u2013252 (2015)","journal-title":"International Journal of Computer Vision"},{"key":"11_CR42","doi-asserted-by":"crossref","unstructured":"Sadeghi, M.A., Farhadi, A.: Recognition using visual phrases. In: CVPR (2011)","DOI":"10.1109\/CVPR.2011.5995711"},{"key":"11_CR43","doi-asserted-by":"crossref","unstructured":"Schroff, F., Kalenichenko, D., Philbin, J.: Facenet: a unified embedding for face recognition and clustering. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298682"},{"key":"11_CR44","doi-asserted-by":"crossref","unstructured":"Siddiquie, B., Feris, R.S., Davis, L.S.: Image ranking and retrieval based on multi-attribute queries. In: CVPR (2011)","DOI":"10.1109\/CVPR.2011.5995329"},{"key":"11_CR45","doi-asserted-by":"crossref","unstructured":"Singh, K.K., Lee, Y.J.: End-to-end localization and ranking for relative attributes. In: ECCV (2016)","DOI":"10.1007\/978-3-319-46466-4_45"},{"key":"11_CR46","doi-asserted-by":"crossref","unstructured":"Socher, R., et al.: Recursive deep models for semantic compositionality over a sentiment treebank. In: EMNLP (2013)","DOI":"10.18653\/v1\/D13-1170"},{"key":"11_CR47","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"475","DOI":"10.1007\/978-3-319-46475-6_30","volume-title":"Computer Vision \u2013 ECCV 2016","author":"C Su","year":"2016","unstructured":"Su, C., Zhang, S., Xing, J., Gao, W., Tian, Q.: Deep attributes driven multi-camera person re-identification. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9906, pp. 475\u2013491. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46475-6_30"},{"key":"11_CR48","doi-asserted-by":"crossref","unstructured":"Verma, V.K., Arora, G., Mishra, A., Rai, P.: Generalized zero-shot learning via synthesized examples. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00450"},{"key":"11_CR49","doi-asserted-by":"crossref","unstructured":"Wang, J., Cheng, Y., Schmidt Feris, R.: Walk and learn: facial attribute representation learning from egocentric video and contextual data. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.252"},{"key":"11_CR50","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1007\/978-3-319-71249-9_6","volume-title":"Machine Learning and Knowledge Discovery in Databases","author":"Qian Wang","year":"2017","unstructured":"Wang, Q., Chen, K.: Alternative semantic representations for zero-shot human action recognition. In: ECML (2017)"},{"key":"11_CR51","doi-asserted-by":"crossref","unstructured":"Wang, X., Farhadi, A., Gupta, A.: Action\u2019s transformations. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.291"},{"key":"11_CR52","doi-asserted-by":"crossref","unstructured":"Xian, Y., Lorenz, T., Schiele, B., Akata, Z.: Feature generating networks for zero-shot learning. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00581"},{"key":"11_CR53","doi-asserted-by":"crossref","unstructured":"Xian, Y., Schiele, B., Akata, Z.: Zero-shot learning-the good, the bad and the ugly. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.328"},{"key":"11_CR54","doi-asserted-by":"crossref","unstructured":"Yan, X., Yang, J., Sohn, K., Lee, H.: Attribute2image: Conditional image generation from visual attributes. In: ECCV (2016)","DOI":"10.1007\/978-3-319-46493-0_47"},{"key":"11_CR55","doi-asserted-by":"crossref","unstructured":"Yu, A., Grauman, K.: Fine-grained visual comparisons with local learning. In: CVPR (2014)","DOI":"10.1109\/CVPR.2014.32"},{"key":"11_CR56","doi-asserted-by":"crossref","unstructured":"Yu, A., Grauman, K.: Semantic jitter: dense supervision for visual comparisons via synthetic images. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.594"},{"key":"11_CR57","doi-asserted-by":"crossref","unstructured":"Zhang, H., Kyaw, Z., Chang, S.F., Chua, T.S.: Visual translation embedding network for visual relation detection. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.331"},{"key":"11_CR58","doi-asserted-by":"crossref","unstructured":"Zhou, T., Tulsiani, S., Sun, W., Malik, J., Efros, A.A.: View synthesis by appearance flow. In: ECCV (2016)","DOI":"10.1007\/978-3-319-46493-0_18"},{"key":"11_CR59","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"262","DOI":"10.1007\/978-3-319-46484-8_16","volume-title":"Computer Vision \u2013 ECCV 2016","author":"Y Zhou","year":"2016","unstructured":"Zhou, Y., Berg, T.L.: Learning temporal transformations from time-lapse videos. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9912, pp. 262\u2013277. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46484-8_16"},{"key":"11_CR60","doi-asserted-by":"crossref","unstructured":"Zhu, Y., Elhoseiny, M., Liu, B., Elgammal, A.: Imagine it for me: generative adversarial approach for zero-shot learning from noisy texts. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00111"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2018"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-01246-5_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T18:36:25Z","timestamp":1775241385000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-01246-5_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018]]},"ISBN":["9783030012458","9783030012465"],"references-count":60,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-01246-5_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018]]},"assertion":[{"value":"6 October 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Munich","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 September 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14 September 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2018.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}