{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T10:29:08Z","timestamp":1763202548533,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":58,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,8,24]],"date-time":"2021-08-24T00:00:00Z","timestamp":1629763200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"GENCI-IDRIS","award":["2021-[AD011012273]"],"award-info":[{"award-number":["2021-[AD011012273]"]}]},{"name":"ANR","award":["CHAIRE IA BE4musIA"],"award-info":[{"award-number":["CHAIRE IA BE4musIA"]}]},{"name":"Clinical Medicine Plus X - Young Scholars Project Peking University the Fundamental Research Funds for the Central Universitie","award":["None"],"award-info":[{"award-number":["None"]}]},{"name":"the National Key R&D Program of China","award":["2017YFB1200700"],"award-info":[{"award-number":["2017YFB1200700"]}]},{"name":"Capital Health Development Scientific Research Project","award":["Grant 2020-1-4093"],"award-info":[{"award-number":["Grant 2020-1-4093"]}]},{"name":"Global Challenges Research Fund (GCRF)","award":["G004"],"award-info":[{"award-number":["G004"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,8,24]]},"DOI":"10.1145\/3460426.3463641","type":"proceedings-article","created":{"date-parts":[[2021,9,1]],"date-time":"2021-09-01T22:50:28Z","timestamp":1630536628000},"page":"367-375","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":19,"title":["Aligning Visual Prototypes with BERT Embeddings for Few-Shot Learning"],"prefix":"10.1145","author":[{"given":"Kun","family":"Yan","sequence":"first","affiliation":[{"name":"Peking University, Beijing, China"}]},{"given":"Zied","family":"Bouraoui","sequence":"additional","affiliation":[{"name":"CRIL - University of Artois &amp; CNRS, Lens , France"}]},{"given":"Ping","family":"Wang","sequence":"additional","affiliation":[{"name":"Peking University, Beijing, China"}]},{"given":"Shoaib","family":"Jameel","sequence":"additional","affiliation":[{"name":"University of Essex, Colchester, United Kingdom"}]},{"given":"Steven","family":"Schockaert","sequence":"additional","affiliation":[{"name":"Cardiff University, Cardiff, United Kingdom"}]}],"member":"320","published-online":{"date-parts":[[2021,9]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11992"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00051"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00115"},{"key":"e_1_3_2_1_4_1","volume-title":"Yu-Chiang Frank Wang, and Jia-Bin Huang","author":"Chen Wei-Yu","year":"2019","unstructured":"Wei-Yu Chen , Yen-Cheng Liu , Zsolt Kira , Yu-Chiang Frank Wang, and Jia-Bin Huang . 2019 . A Closer Look at Few-shot Classification. In 7Proc. ICLR . Wei-Yu Chen, Yen-Cheng Liu, Zsolt Kira, Yu-Chiang Frank Wang, and Jia-Bin Huang. 2019. A Closer Look at Few-shot Classification. In 7Proc. ICLR ."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"e_1_3_2_1_6_1","volume-title":"Proc. NAACL-HLT .","author":"Devlin Jacob","year":"2019","unstructured":"Jacob Devlin , Ming-Wei Chang , Kenton Lee , and Kristina Toutanova . 2019 . BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding . In Proc. NAACL-HLT . Jacob Devlin, Ming-Wei Chang, Kenton Lee, and Kristina Toutanova. 2019. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In Proc. NAACL-HLT ."},{"key":"e_1_3_2_1_7_1","volume-title":"Proc. ICML . 1126--1135","author":"Finn Chelsea","year":"2017","unstructured":"Chelsea Finn , Pieter Abbeel , and Sergey Levine . 2017 . Model-Agnostic Meta-Learning for Fast Adaptation of Deep Networks . In Proc. ICML . 1126--1135 . Chelsea Finn, Pieter Abbeel, and Sergey Levine. 2017. Model-Agnostic Meta-Learning for Fast Adaptation of Deep Networks. In Proc. ICML . 1126--1135."},{"key":"e_1_3_2_1_8_1","volume-title":"Proc. NIPS . 2121--2129","author":"Frome Andrea","year":"2013","unstructured":"Andrea Frome , Gregory S. Corrado , Jonathon Shlens , Samy Bengio , Jeffrey Dean , Marc'Aurelio Ranzato , and Tomas Mikolov . 2013 . DeViSE: A Deep Visual-Semantic Embedding Model . In Proc. NIPS . 2121--2129 . Andrea Frome, Gregory S. Corrado, Jonathon Shlens, Samy Bengio, Jeffrey Dean, Marc'Aurelio Ranzato, and Tomas Mikolov. 2013. DeViSE: A Deep Visual-Semantic Embedding Model. In Proc. NIPS . 2121--2129."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00459"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00855"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.328"},{"key":"e_1_3_2_1_12_1","volume-title":"Proc. FLAIRS .","author":"He Han","year":"2020","unstructured":"Han He and Jinho Choi . 2020 . Establishing strong baselines for the new decade: Sequence tagging, syntactic and semantic parsing with BERT . In Proc. FLAIRS . Han He and Jinho Choi. 2020. Establishing strong baselines for the new decade: Sequence tagging, syntactic and semantic parsing with BERT. In Proc. FLAIRS ."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_1_14_1","volume-title":"Proc. NeurIPS . 4005--4016","author":"Hou Ruibing","year":"2019","unstructured":"Ruibing Hou , Hong Chang , Bingpeng Ma , Shiguang Shan , and Xilin Chen . 2019 . Cross Attention Network for Few-shot Classification . In Proc. NeurIPS . 4005--4016 . Ruibing Hou, Hong Chang, Bingpeng Ma, Shiguang Shan, and Xilin Chen. 2019. Cross Attention Network for Few-shot Classification. In Proc. NeurIPS . 4005--4016."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"e_1_3_2_1_16_1","volume-title":"Proc. ICML. 448--456","author":"Ioffe Sergey","year":"2015","unstructured":"Sergey Ioffe and Christian Szegedy . 2015 . Batch Normalization: Accelerating Deep Network Training by Reducing Internal Covariate Shift . In Proc. ICML. 448--456 . Sergey Ioffe and Christian Szegedy. 2015. Batch Normalization: Accelerating Deep Network Training by Reducing Internal Covariate Shift. In Proc. ICML. 448--456."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00010"},{"key":"e_1_3_2_1_18_1","volume-title":"Kipf and Max Welling","author":"Thomas","year":"2017","unstructured":"Thomas N. Kipf and Max Welling . 2017 . Semi-Supervised Classification with Graph Convolutional Networks. In Proc. ICLR . Thomas N. Kipf and Max Welling. 2017. Semi-Supervised Classification with Graph Convolutional Networks. In Proc. ICLR ."},{"key":"e_1_3_2_1_19_1","volume-title":"ICML Workshop","volume":"2","author":"Koch Gregory","year":"2015","unstructured":"Gregory Koch , Richard Zemel , and Ruslan Salakhutdinov . 2015 . Siamese neural networks for one-shot image recognition . In ICML Workshop , Vol. 2 . Lille. Gregory Koch, Richard Zemel, and Ruslan Salakhutdinov. 2015. Siamese neural networks for one-shot image recognition. In ICML Workshop , Vol. 2. Lille."},{"key":"e_1_3_2_1_20_1","volume-title":"Proc. NIPS . 1097--1105","author":"Krizhevsky Alex","year":"2012","unstructured":"Alex Krizhevsky , Ilya Sutskever , and Geoffrey E Hinton . 2012 . Imagenet classification with deep convolutional neural networks . In Proc. NIPS . 1097--1105 . Alex Krizhevsky, Ilya Sutskever, and Geoffrey E Hinton. 2012. Imagenet classification with deep convolutional neural networks. In Proc. NIPS . 1097--1105."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01091"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01259"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00009"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00743"},{"key":"e_1_3_2_1_25_1","volume-title":"Meta-sgd: Learning to learn quickly for few-shot learning. arXiv preprint arXiv:1707.09835","author":"Li Zhenguo","year":"2017","unstructured":"Zhenguo Li , Fengwei Zhou , Fei Chen , and Hang Li . 2017 . Meta-sgd: Learning to learn quickly for few-shot learning. arXiv preprint arXiv:1707.09835 (2017). Zhenguo Li, Fengwei Zhou, Fei Chen, and Hang Li. 2017. Meta-sgd: Learning to learn quickly for few-shot learning. arXiv preprint arXiv:1707.09835 (2017)."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00948"},{"key":"e_1_3_2_1_27_1","volume-title":"Proc. NeurIPS. 13--23","author":"Lu Jiasen","year":"2019","unstructured":"Jiasen Lu , Dhruv Batra , Devi Parikh , and Stefan Lee . 2019 . ViLBERT: Pretraining Task-Agnostic Visiolinguistic Representations for Vision-and-Language Tasks . In Proc. NeurIPS. 13--23 . Jiasen Lu, Dhruv Batra, Devi Parikh, and Stefan Lee. 2019. ViLBERT: Pretraining Task-Agnostic Visiolinguistic Representations for Vision-and-Language Tasks. In Proc. NeurIPS. 13--23."},{"key":"e_1_3_2_1_28_1","unstructured":"Tomas Mikolov Ilya Sutskever Kai Chen Greg S Corrado and Jeff Dean. 2013. Distributed representations of words and phrases and their compositionality. In Advances in neural information processing systems. 3111--3119.  Tomas Mikolov Ilya Sutskever Kai Chen Greg S Corrado and Jeff Dean. 2013. Distributed representations of words and phrases and their compositionality. In Advances in neural information processing systems. 3111--3119."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58542-6_29"},{"key":"e_1_3_2_1_30_1","volume-title":"On first-order meta-learning algorithms. arXiv preprint arXiv:1803.02999","author":"Nichol Alex","year":"2018","unstructured":"Alex Nichol , Joshua Achiam , and John Schulman . 2018. On first-order meta-learning algorithms. arXiv preprint arXiv:1803.02999 ( 2018 ). Alex Nichol, Joshua Achiam, and John Schulman. 2018. On first-order meta-learning algorithms. arXiv preprint arXiv:1803.02999 (2018)."},{"key":"e_1_3_2_1_31_1","volume-title":"Proc. NIPS . 719--729","author":"Oreshkin Boris N.","year":"2018","unstructured":"Boris N. Oreshkin , Pau Rodr'i guez L\u00f3 pez, and Alexandre Lacoste . 2018 . TADAM: Task dependent adaptive metric for improved few-shot learning . In Proc. NIPS . 719--729 . Boris N. Oreshkin, Pau Rodr'i guez L\u00f3 pez, and Alexandre Lacoste. 2018. TADAM: Task dependent adaptive metric for improved few-shot learning. In Proc. NIPS . 719--729."},{"key":"e_1_3_2_1_32_1","volume-title":"Manning","author":"Pennington Jeffrey","year":"2014","unstructured":"Jeffrey Pennington , Richard Socher , and Christopher D . Manning . 2014 . GloVe: Global Vectors for Word Representation. In Proc. EMNLP. 1532--1543. Jeffrey Pennington, Richard Socher, and Christopher D. Manning. 2014. GloVe: Global Vectors for Word Representation. In Proc. EMNLP. 1532--1543."},{"key":"e_1_3_2_1_33_1","volume-title":"Proc. NAACL-HLT. 1267--1273","author":"Pilehvar Mohammad Taher","year":"2019","unstructured":"Mohammad Taher Pilehvar and Jose Camacho-Collados . 2019 . WiC: the Word-in-Context Dataset for Evaluating Context-Sensitive Meaning Representations . In Proc. NAACL-HLT. 1267--1273 . Mohammad Taher Pilehvar and Jose Camacho-Collados. 2019. WiC: the Word-in-Context Dataset for Evaluating Context-Sensitive Meaning Representations. In Proc. NAACL-HLT. 1267--1273."},{"key":"e_1_3_2_1_34_1","volume-title":"Proc. ICLR .","author":"Ravi Sachin","year":"2017","unstructured":"Sachin Ravi and Hugo Larochelle . 2017 . Optimization as a Model for Few-Shot Learning . In Proc. ICLR . Sachin Ravi and Hugo Larochelle. 2017. Optimization as a Model for Few-Shot Learning. In Proc. ICLR ."},{"key":"e_1_3_2_1_35_1","volume-title":"Zemel","author":"Ren Mengye","year":"2018","unstructured":"Mengye Ren , Eleni Triantafillou , Sachin Ravi , Jake Snell , Kevin Swersky , Joshua B. Tenenbaum , Hugo Larochelle , and Richard S . Zemel . 2018 . Meta-Learning for Semi-Supervised Few-Shot Classification. In Proc. ICLR . Mengye Ren, Eleni Triantafillou, Sachin Ravi, Jake Snell, Kevin Swersky, Joshua B. Tenenbaum, Hugo Larochelle, and Richard S. Zemel. 2018. Meta-Learning for Semi-Supervised Few-Shot Classification. In Proc. ICLR ."},{"key":"e_1_3_2_1_36_1","volume-title":"Proc. ICLR .","author":"Rusu Andrei A.","year":"2019","unstructured":"Andrei A. Rusu , Dushyant Rao , Jakub Sygnowski , Oriol Vinyals , Razvan Pascanu , Simon Osindero , and Raia Hadsell . 2019 . Meta-Learning with Latent Embedding Optimization . In Proc. ICLR . Andrei A. Rusu, Dushyant Rao, Jakub Sygnowski, Oriol Vinyals, Razvan Pascanu, Simon Osindero, and Raia Hadsell. 2019. Meta-Learning with Latent Embedding Optimization. In Proc. ICLR ."},{"key":"e_1_3_2_1_37_1","volume-title":"Proc. ICLR .","author":"Satorras Victor Garcia","year":"2018","unstructured":"Victor Garcia Satorras and Joan Bruna Estrach . 2018 . Few-Shot Learning with Graph Neural Networks . In Proc. ICLR . Victor Garcia Satorras and Joan Bruna Estrach. 2018. Few-Shot Learning with Graph Neural Networks. In Proc. ICLR ."},{"key":"e_1_3_2_1_38_1","volume-title":"Adaptive Subspaces for Few-Shot Learning. In 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2020","author":"Simon Christian","year":"2020","unstructured":"Christian Simon , Piotr Koniusz , Richard Nock , and Mehrtash Harandi . 2020 . Adaptive Subspaces for Few-Shot Learning. In 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2020 , Seattle, WA, USA, June 13--19 , 2020 . 4135--4144. Christian Simon, Piotr Koniusz, Richard Nock, and Mehrtash Harandi. 2020. Adaptive Subspaces for Few-Shot Learning. In 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2020, Seattle, WA, USA, June 13--19, 2020 . 4135--4144."},{"key":"e_1_3_2_1_39_1","volume-title":"Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556","author":"Simonyan Karen","year":"2014","unstructured":"Karen Simonyan and Andrew Zisserman . 2014. Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 ( 2014 ). Karen Simonyan and Andrew Zisserman. 2014. Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 (2014)."},{"key":"e_1_3_2_1_40_1","volume-title":"Zemel","author":"Snell Jake","year":"2017","unstructured":"Jake Snell , Kevin Swersky , and Richard S . Zemel . 2017 . Prototypical Networks for Few-shot Learning. In Proc. NIPS. 4077--4087. Jake Snell, Kevin Swersky, and Richard S. Zemel. 2017. Prototypical Networks for Few-shot Learning. In Proc. NIPS. 4077--4087."},{"key":"e_1_3_2_1_41_1","volume-title":"Proc. ICLR .","author":"Su Weijie","year":"2020","unstructured":"Weijie Su , Xizhou Zhu , Yue Cao , Bin Li , Lewei Lu , Furu Wei , and Jifeng Dai . 2020 . VL-BERT: Pre-training of Generic Visual-Linguistic Representations . In Proc. ICLR . Weijie Su, Xizhou Zhu, Yue Cao, Bin Li, Lewei Lu, Furu Wei, and Jifeng Dai. 2020. VL-BERT: Pre-training of Generic Visual-Linguistic Representations. In Proc. ICLR ."},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00049"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00131"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1514"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58568-6_16"},{"key":"e_1_3_2_1_47_1","volume-title":"Proc. NIPS. 5998--6008","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani , Noam Shazeer , Niki Parmar , Jakob Uszkoreit , Llion Jones , Aidan N. Gomez , Lukasz Kaiser , and Illia Polosukhin . 2017 . Attention is All you Need . In Proc. NIPS. 5998--6008 . Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N. Gomez, Lukasz Kaiser, and Illia Polosukhin. 2017. Attention is All you Need. In Proc. NIPS. 5998--6008."},{"key":"e_1_3_2_1_48_1","volume-title":"Proc. NIPS. 3630--3638","author":"Vinyals Oriol","year":"2016","unstructured":"Oriol Vinyals , Charles Blundell , Tim Lillicrap , Koray Kavukcuoglu , and Daan Wierstra . 2016 . Matching Networks for One Shot Learning . In Proc. NIPS. 3630--3638 . Oriol Vinyals, Charles Blundell, Tim Lillicrap, Koray Kavukcuoglu, and Daan Wierstra. 2016. Matching Networks for One Shot Learning. In Proc. NIPS. 3630--3638."},{"key":"e_1_3_2_1_49_1","volume-title":"Technical Report CNS-TR-2011-001. California Institute of Technology.","author":"Wah C.","year":"2011","unstructured":"C. Wah , S. Branson , P. Welinder , P. Perona , and S. Belongie . 2011 . The Caltech-UCSD Birds-200--2011 Dataset . Technical Report CNS-TR-2011-001. California Institute of Technology. C. Wah, S. Branson, P. Welinder, P. Perona, and S. Belongie. 2011. The Caltech-UCSD Birds-200--2011 Dataset. Technical Report CNS-TR-2011-001. California Institute of Technology."},{"key":"e_1_3_2_1_50_1","volume-title":"SimpleShot: Revisiting Nearest-Neighbor Classification for Few-Shot Learning. CoRR","author":"Wang Yan","year":"2019","unstructured":"Yan Wang , Wei-Lun Chao , Kilian Q. Weinberger , and Laurens van der Maaten . 2019. SimpleShot: Revisiting Nearest-Neighbor Classification for Few-Shot Learning. CoRR , Vol. abs\/ 1911 .04623 ( 2019 ). Yan Wang, Wei-Lun Chao, Kilian Q. Weinberger, and Laurens van der Maaten. 2019. SimpleShot: Revisiting Nearest-Neighbor Classification for Few-Shot Learning. CoRR , Vol. abs\/1911.04623 (2019)."},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00760"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.634"},{"key":"e_1_3_2_1_53_1","volume-title":"Pinheiro","author":"Xing Chen","year":"2019","unstructured":"Chen Xing , Negar Rostamzadeh , Boris N. Oreshkin , and Pedro O . Pinheiro . 2019 . Adaptive Cross-Modal Few-shot Learning. In Proc. NIPS. 4848--4858. Chen Xing, Negar Rostamzadeh, Boris N. Oreshkin, and Pedro O. Pinheiro. 2019. Adaptive Cross-Modal Few-shot Learning. In Proc. NIPS. 4848--4858."},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33019079"},{"key":"e_1_3_2_1_55_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00883"},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01222"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.321"},{"key":"e_1_3_2_1_58_1","volume-title":"Proc. NIPS . 2371--2380","author":"Zhang Ruixiang","year":"2018","unstructured":"Ruixiang Zhang , Tong Che , Zoubin Ghahramani , Yoshua Bengio , and Yangqiu Song . 2018 . MetaGAN: An Adversarial Approach to Few-Shot Learning . In Proc. NIPS . 2371--2380 . Ruixiang Zhang, Tong Che, Zoubin Ghahramani, Yoshua Bengio, and Yangqiu Song. 2018. MetaGAN: An Adversarial Approach to Few-Shot Learning. In Proc. NIPS . 2371--2380."}],"event":{"name":"ICMR '21: International Conference on Multimedia Retrieval","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Taipei Taiwan","acronym":"ICMR '21"},"container-title":["Proceedings of the 2021 International Conference on Multimedia Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3460426.3463641","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3460426.3463641","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:17:04Z","timestamp":1750191424000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3460426.3463641"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,8,24]]},"references-count":58,"alternative-id":["10.1145\/3460426.3463641","10.1145\/3460426"],"URL":"https:\/\/doi.org\/10.1145\/3460426.3463641","relation":{},"subject":[],"published":{"date-parts":[[2021,8,24]]},"assertion":[{"value":"2021-09-01","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}