{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:26:29Z","timestamp":1740122789035,"version":"3.37.3"},"reference-count":45,"publisher":"Springer Science and Business Media LLC","issue":"15","license":[{"start":{"date-parts":[[2020,8,4]],"date-time":"2020-08-04T00:00:00Z","timestamp":1596499200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,8,4]],"date-time":"2020-08-04T00:00:00Z","timestamp":1596499200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2021,6]]},"DOI":"10.1007\/s11042-020-09001-6","type":"journal-article","created":{"date-parts":[[2020,8,4]],"date-time":"2020-08-04T13:02:33Z","timestamp":1596546153000},"page":"22465-22486","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Modelling relations with prototypes for visual relation detection"],"prefix":"10.1007","volume":"80","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8631-3758","authenticated-orcid":false,"given":"Fran\u00e7ois","family":"Plesse","sequence":"first","affiliation":[]},{"given":"Alexandru","family":"Ginsca","sequence":"additional","affiliation":[]},{"given":"Bertrand","family":"Delezoide","sequence":"additional","affiliation":[]},{"given":"Fran\u00e7oise","family":"Pr\u00eateux","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,8,4]]},"reference":[{"key":"9001_CR1","doi-asserted-by":"publisher","unstructured":"Chao YW, Wang Z, He Y, Wang J, Deng J (2015) HICO: A benchmark for recognizing human-object interactions in images. In: ICCV. https:\/\/doi.org\/10.1109\/ICCV.2015.122","DOI":"10.1109\/ICCV.2015.122"},{"key":"9001_CR2","doi-asserted-by":"publisher","unstructured":"Chao YW, Wang Z, Mihalcea R, Deng J (2015) Mining semantic affordances of visual object categories. In: CVPR. https:\/\/doi.org\/10.1109\/CVPR.2015.7299054","DOI":"10.1109\/CVPR.2015.7299054"},{"key":"9001_CR3","doi-asserted-by":"crossref","unstructured":"Cui Y, Zhou F, Lin Y, Belongie S (2016) Fine-grained Categorization and Dataset Bootstrapping using Deep Metric Learning with Humans in the Loop. In: CVPR","DOI":"10.1109\/CVPR.2016.130"},{"key":"9001_CR4","doi-asserted-by":"publisher","unstructured":"Dai B, Zhang Y, Lin D (2017) Detecting visual relationships with deep relational networks. In: CVPR. https:\/\/doi.org\/10.1109\/CVPR.2017.352","DOI":"10.1109\/CVPR.2017.352"},{"issue":"15","key":"9001_CR5","doi-asserted-by":"publisher","first-page":"9025","DOI":"10.1007\/s11042-015-2757-4","volume":"75","author":"M de Boer","year":"2016","unstructured":"de Boer M, Schutte K, Kraaij W (2016) Knowledge based query expansion in complex multimedia event detection. Multimed Tools Appl 75(15):9025\u20139043. https:\/\/doi.org\/10.1007\/s11042-015-2757-4","journal-title":"Multimed Tools Appl"},{"key":"9001_CR6","doi-asserted-by":"crossref","unstructured":"Deng J, Ding N, Jia Y, Frome A, Murphy K, Bengio S, Li Y, Neven H, Adam H (2014) Large-Scale Object classification using label relation graphs. In: European conference on computer vision","DOI":"10.1007\/978-3-319-10590-1_4"},{"key":"9001_CR7","doi-asserted-by":"crossref","unstructured":"Fang Y, Kuan K, Lin J, Tan C, Chandrasekhar V (2017) Object detection meets knowledge graphs. IJCAI, pp 1661\u20131667","DOI":"10.24963\/ijcai.2017\/230"},{"key":"9001_CR8","doi-asserted-by":"publisher","unstructured":"Fellbaum C (1998) Wordnet: An Electronic Lexical database, vol 71. Bradford Books. https:\/\/doi.org\/10.1139\/h11-025","DOI":"10.1139\/h11-025"},{"key":"9001_CR9","doi-asserted-by":"crossref","unstructured":"Girshick R (2015) Fast r-CNN. In: ICCV","DOI":"10.1109\/ICCV.2015.169"},{"key":"9001_CR10","doi-asserted-by":"crossref","unstructured":"Gkioxari G, Girshick R, Doll\u00e1r P, He K (2018) Detecting and recognizing Human-Object interactions. In: CVPR","DOI":"10.1109\/CVPR.2018.00872"},{"key":"9001_CR11","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: CVPR","DOI":"10.1109\/CVPR.2016.90"},{"key":"9001_CR12","unstructured":"Herzig R, Raboh M, Chechik G, Berant J, Globerson A (2018) Mapping images to scene graphs with Permutation-Invariant structured prediction. In: NIPS"},{"key":"9001_CR13","doi-asserted-by":"publisher","unstructured":"Hu Z, Ma X, Liu Z, Hovy E, Xing E (2016) Harnessing deep neural networks with logic rules. In: ACL. https:\/\/doi.org\/10.18653\/v1\/P16-1228","DOI":"10.18653\/v1\/P16-1228"},{"key":"9001_CR14","unstructured":"Johnson J, Douze M, J\u00e9gou H Billion-scale similarity search with GPUs"},{"key":"9001_CR15","unstructured":"Kaiser L, Nachum O, Roy A, Bengio S (2017) Learning to remember rare events. In: ICLR"},{"key":"9001_CR16","unstructured":"Koch G, Zemel R, Salakhutdinov R Siamese Neural Networks for One-shot Image Recognition. Technical report. https:\/\/www.cs.cmu.edu\/~rsalakhu\/papers\/oneshot1.pdf"},{"key":"9001_CR17","doi-asserted-by":"publisher","unstructured":"Krishna R, Zhu Y, Groth O, Johnson J, Hata K, Kravitz J, Chen S, Kalantidis Y, Li LJ, Shamma DA, Bernstein M, Fei-Fei L (2016) Visual genome: Connecting language and vision using crowdsourced dense image annotations. https:\/\/doi.org\/10.1007\/s11263-016-0981-7","DOI":"10.1007\/s11263-016-0981-7"},{"key":"9001_CR18","doi-asserted-by":"publisher","unstructured":"Li Y, Ouyang W, Wang X, Tang X (2017) Vip-CNN: Visual Phrase Guided Convolutional Neural Network. In: CVPR. https:\/\/doi.org\/10.1109\/CVPR.2017.766","DOI":"10.1109\/CVPR.2017.766"},{"key":"9001_CR19","doi-asserted-by":"crossref","unstructured":"Liang K, Guo Y, Chang H, Chen X (2018) Visual relationship detection with deep structural ranking. In: AAAI","DOI":"10.1609\/aaai.v32i1.12274"},{"key":"9001_CR20","doi-asserted-by":"crossref","unstructured":"Liang X, Lee L, Xing EP (2017) Deep Variation-structured Reinforcement Learning for Visual Relationship and Attribute Detection. In: CVPR. 10.1109\/CVPR.2017.469. arXiv:1703.03054","DOI":"10.1109\/CVPR.2017.469"},{"key":"9001_CR21","doi-asserted-by":"publisher","unstructured":"Long Y, Liu L, Shao L, Shen F, Ding G, Han J (2017) From zero-shot learning to conventional supervised classification: Unseen visual data synthesis. In: CVPR. https:\/\/doi.org\/10.1109\/CVPR.2017.653","DOI":"10.1109\/CVPR.2017.653"},{"key":"9001_CR22","doi-asserted-by":"publisher","unstructured":"Lu C, Krishna R, Bernstein M, Fei-Fei L (2016) Visual relationship detection with language priors. In: ECCV. https:\/\/doi.org\/10.1007\/978-3-319-46448-0_51","DOI":"10.1007\/978-3-319-46448-0_51"},{"key":"9001_CR23","unstructured":"Macqueen J (1967) Some methods for classification and analysis of multivariate observations. In: Fifth berkeley symposium on mathematical statistics and probability"},{"key":"9001_CR24","doi-asserted-by":"publisher","unstructured":"Marino K, Salakhutdinov R, Gupta A (2017) The more you know: Using knowledge graphs for image classification. In: CVPR. https:\/\/doi.org\/10.1109\/CVPR.2017.10","DOI":"10.1109\/CVPR.2017.10"},{"key":"9001_CR25","doi-asserted-by":"publisher","unstructured":"Mikolov T, Corrado G, Chen K, Dean J (2013) Efficient estimation of word representations in vector space. In: ICLR. https:\/\/doi.org\/10.1162\/153244303322533223","DOI":"10.1162\/153244303322533223"},{"key":"9001_CR26","unstructured":"Newell A, Deng J (2017) Pixels to graphs by associative embedding. In: NIPS"},{"key":"9001_CR27","doi-asserted-by":"crossref","unstructured":"Peyre J, Laptev I, Schmid C, Sivic J (2017) Weakly-supervised learning of visual relations. In: ICCV","DOI":"10.1109\/ICCV.2017.554"},{"key":"9001_CR28","doi-asserted-by":"crossref","unstructured":"Plesse F, Ginsca A, Delezoide B, Pr\u00eateux F (2020) Focusing visual relation detection on relevant relations with prior potentials. In: WACV","DOI":"10.1109\/WACV45572.2020.9093605"},{"key":"9001_CR29","doi-asserted-by":"crossref","unstructured":"Plesse F, Ginsca A, Delezoide B, Pr\u00eateux F (2018) Visual relationship detection based on guided proposals and semantic knowledge distillation. In: ICME","DOI":"10.1109\/ICME.2018.8486503"},{"key":"9001_CR30","doi-asserted-by":"publisher","unstructured":"Redmon J, Divvala S, Girshick R, Farhadi A (2016) You only look once: unified, Real-Time Object Detection. In: CVPR. https:\/\/doi.org\/10.1109\/CVPR.2016.91","DOI":"10.1109\/CVPR.2016.91"},{"key":"9001_CR31","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster r-CNN: Towards Real-Time object detection with region proposal networks. In: NIPS"},{"key":"9001_CR32","doi-asserted-by":"crossref","unstructured":"Sarullo A, Mu T (2019) On Class Imbalance and Background Filtering in Visual Relationship Detection","DOI":"10.1109\/IJCNN.2019.8851814"},{"key":"9001_CR33","doi-asserted-by":"crossref","unstructured":"Schroff F, Philbin J (2015) Facenet: A Unified Embedding for Face Recognition and Clustering. In: CVPR","DOI":"10.1109\/CVPR.2015.7298682"},{"key":"9001_CR34","doi-asserted-by":"publisher","unstructured":"Simonyan K, Zisserman A (2015) Very deep convolutional networks for Large-Scale image recognition. In: ICLR. https:\/\/doi.org\/10.1016\/j.infsof.2008.09.005","DOI":"10.1016\/j.infsof.2008.09.005"},{"key":"9001_CR35","unstructured":"Speer R, Havasi C (2012) Representing General Relational Knowledge in ConceptNet 5. In: LREC"},{"key":"9001_CR36","first-page":"2579","volume":"9","author":"L Van Der Maaten","year":"2008","unstructured":"Van Der Maaten L, Hinton G (2008) Visualizing Data using t-SNE. Journal of Machine Learning Research 9:2579\u20132605","journal-title":"Journal of Machine Learning Research"},{"key":"9001_CR37","unstructured":"Vinyals O, Deepmind G, Blundell C, Lillicrap T, Kavukcuoglu K, Wierstra D (2016) Matching networks for one shot learning. In: NIPS"},{"key":"9001_CR38","doi-asserted-by":"crossref","unstructured":"Wang X, Ye Y, Gupta A (2018) Zero-shot Recognition via Semantic Embeddings and Knowledge Graphs. In: CVPR","DOI":"10.1109\/CVPR.2018.00717"},{"key":"9001_CR39","unstructured":"Weinberger KQ, Blitzer J, Saul LK (2009) Distance metric learning for large margin nearest neighbor classification journal of machine learning research"},{"key":"9001_CR40","unstructured":"Woo S, Kim D, Daejeon K, Cho DE, So Kweon IE (2018) LinkNet: Relational Embedding for Scene Graph. In: NIPS. arXiv:1811.06410.pdf"},{"key":"9001_CR41","doi-asserted-by":"publisher","unstructured":"Xu D, Zhu Y, Choy CB, Fei-Fei L (2017) Scene graph generation by iterative message passing. In: CVPR. https:\/\/doi.org\/10.1109\/CVPR.2017.330","DOI":"10.1109\/CVPR.2017.330"},{"key":"9001_CR42","doi-asserted-by":"crossref","unstructured":"Yin G, Sheng L, Liu B, Yu N, Wang X, Shao J, Loy CC (2018) Zoom-Net: Mining Deep feature interactions for visual relationship recognition. In: ECCV","DOI":"10.1007\/978-3-030-01219-9_20"},{"key":"9001_CR43","doi-asserted-by":"crossref","unstructured":"Yu R, Li A, Morariu VI, Davis LS (2017) Visual relationship detection with internal and external linguistic knowledge distillation. In: ICCV","DOI":"10.1109\/ICCV.2017.121"},{"key":"9001_CR44","doi-asserted-by":"crossref","unstructured":"Zellers R, Yatskar M, Thomson S, Choi Y (2018) Neural motifs: Scene graph parsing with global context. In: CVPR","DOI":"10.1109\/CVPR.2018.00611"},{"key":"9001_CR45","doi-asserted-by":"crossref","unstructured":"Zhu Y, Jiang S, Li X (2017) Visual relationship detection with object spatial distribution. In: ICME","DOI":"10.1109\/ICME.2017.8019448"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-020-09001-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-020-09001-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-020-09001-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,5]],"date-time":"2022-11-05T18:14:08Z","timestamp":1667672048000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-020-09001-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,8,4]]},"references-count":45,"journal-issue":{"issue":"15","published-print":{"date-parts":[[2021,6]]}},"alternative-id":["9001"],"URL":"https:\/\/doi.org\/10.1007\/s11042-020-09001-6","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"type":"print","value":"1380-7501"},{"type":"electronic","value":"1573-7721"}],"subject":[],"published":{"date-parts":[[2020,8,4]]},"assertion":[{"value":"20 March 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 February 2020","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 May 2020","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 August 2020","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}