{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:21:26Z","timestamp":1750220486417,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":52,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,10,17]],"date-time":"2021-10-17T00:00:00Z","timestamp":1634428800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61972326"],"award-info":[{"award-number":["61972326"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,10,17]]},"DOI":"10.1145\/3474085.3475530","type":"proceedings-article","created":{"date-parts":[[2021,10,18]],"date-time":"2021-10-18T06:35:51Z","timestamp":1634538951000},"page":"3807-3815","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Towards Accurate Localization by Instance Search"],"prefix":"10.1145","author":[{"given":"Yi-Geng","family":"Hong","sequence":"first","affiliation":[{"name":"Xiamen University, Xiamen, China"}]},{"given":"Hui-Chu","family":"Xiao","sequence":"additional","affiliation":[{"name":"Xiamen University, Xiamen, China"}]},{"given":"Wan-Lei","family":"Zhao","sequence":"additional","affiliation":[{"name":"Xiamen University, Xiamen, China"}]}],"member":"320","published-online":{"date-parts":[[2021,10,17]]},"reference":[{"volume-title":"Fully-Convolutional Siamese Networks for Object Tracking. In ECCV Workshops. 850--865","author":"Bertinetto Luca","key":"e_1_3_2_1_1_1"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"crossref","unstructured":"H. Bilen and A. Vedaldi. 2016. Weakly Supervised Deep Detection Networks. In CVPR. 2846--2854.  H. Bilen and A. Vedaldi. 2016. Weakly Supervised Deep Detection Networks. In CVPR. 2846--2854.","DOI":"10.1109\/CVPR.2016.311"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.5555\/2987189.2987282"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/3343031.3351005"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2020.2987161"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2535231"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-009-0275-4"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"crossref","unstructured":"Heng Fan Liting Lin Fan Yang Peng Chu Ge Deng Sijia Yu Hexin Bai Yong Xu Chunyuan Liao and Haibin Ling. 2019. LaSOT: A High-Quality Benchmark for Large-Scale Single Object Tracking. In CVPR.  Heng Fan Liting Lin Fan Yang Peng Chu Ge Deng Sijia Yu Hexin Bai Yong Xu Chunyuan Liao and Haibin Ling. 2019. LaSOT: A High-Quality Benchmark for Large-Scale Single Object Tracking. In CVPR.","DOI":"10.1109\/CVPR.2019.00552"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","unstructured":"Q. Fan W. Zhuo C. K. Tang and Y. W. Tai. 2020. Few-Shot Object Detection With Attention-RPN and Multi-Relation Detector. In CVPR. 4012--4021.  Q. Fan W. Zhuo C. K. Tang and Y. W. Tai. 2020. Few-Shot Object Detection With Attention-RPN and Multi-Relation Detector. In CVPR. 4012--4021.","DOI":"10.1109\/CVPR42600.2020.00407"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1023\/B:VISI.0000022288.19776.77"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2844175"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"crossref","unstructured":"K. He X. Zhang S. Ren and J. Sun. 2016. Deep Residual Learning for Image Recognition. In CVPR. 770--778.  K. He X. Zhang S. Ren and J. Sun. 2016. Deep Residual Learning for Image Recognition. In CVPR. 770--778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.5555\/3454287.3454532"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"crossref","unstructured":"Jie Hu Li Shen and Gang Sun. 2018. Squeeze-and-Excitation Networks. In CVPR.  Jie Hu Li Shen and Gang Sun. 2018. Squeeze-and-Excitation Networks. In CVPR.","DOI":"10.1109\/CVPR.2018.00745"},{"key":"e_1_3_2_1_15_1","unstructured":"L. Huang X. Zhao and K. Huang. 2019. GOT-10k: A Large High-Diversity Benchmark for Generic Object Tracking in the Wild. TPAMI (2019) 1--1.  L. Huang X. Zhao and K. Huang. 2019. GOT-10k: A Large High-Diversity Benchmark for Generic Object Tracking in the Wild. TPAMI (2019) 1--1."},{"volume-title":"Region Manifolds: Recovering Small Objects with Compact CNN Representations. In CVPR. 926--935.","year":"2017","author":"Iscen A.","key":"e_1_3_2_1_16_1"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"crossref","unstructured":"Albert Jimenez Jose M. Alvarez and Xavier Gir\u00f3-i-Nieto. 2017. Class Weighted Convolutional Features for Visual Instance Search. In BMVC.  Albert Jimenez Jose M. Alvarez and Xavier Gir\u00f3-i-Nieto. 2017. Class Weighted Convolutional Features for Visual Instance Search. In BMVC.","DOI":"10.5244\/C.31.144"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"crossref","unstructured":"Yannis Kalantidis Clayton Mellina and Simon Osindero. 2016. Cross-Dimensional Weighting for Aggregated Deep Convolutional Features. In ECCV. 685--701.  Yannis Kalantidis Clayton Mellina and Simon Osindero. 2016. Cross-Dimensional Weighting for Aggregated Deep Convolutional Features. In ECCV. 685--701.","DOI":"10.1007\/978-3-319-46604-0_48"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"crossref","unstructured":"B. Kang Z. Liu X. Wang F. Yu J. Feng and T. Darrell. 2019. Few-Shot Object Detection via Feature Reweighting. In ICCV. 8419--8428.  B. Kang Z. Liu X. Wang F. Yu J. Feng and T. Darrell. 2019. Few-Shot Object Detection via Feature Reweighting. In ICCV. 8419--8428.","DOI":"10.1109\/ICCV.2019.00851"},{"key":"e_1_3_2_1_20_1","unstructured":"Jaeyoon Kim and Sung-Eui Yoon. 2018. Regional Attention Based Deep Feature for Image Retrieval. In BMVC. 209.  Jaeyoon Kim and Sung-Eui Yoon. 2018. Regional Attention Based Deep Feature for Image Retrieval. In BMVC. 209."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"crossref","unstructured":"Bo Li Wei Wu Qiang Wang Fangyi Zhang Junliang Xing and Junjie Yan. 2019. SiamRPN: Evolution of Siamese Visual Tracking With Very Deep Networks. In CVPR.  Bo Li Wei Wu Qiang Wang Fangyi Zhang Junliang Xing and Junjie Yan. 2019. SiamRPN: Evolution of Siamese Visual Tracking With Very Deep Networks. In CVPR.","DOI":"10.1109\/CVPR.2019.00441"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"crossref","unstructured":"Bo Li Junjie Yan Wei Wu Zheng Zhu and Xiaolin Hu. 2018. High Performance Visual Tracking With Siamese Region Proposal Network. In CVPR.  Bo Li Junjie Yan Wei Wu Zheng Zhu and Xiaolin Hu. 2018. High Performance Visual Tracking With Siamese Region Proposal Network. In CVPR.","DOI":"10.1109\/CVPR.2018.00935"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2019.11.029"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"crossref","unstructured":"Tsung-Yi Lin Michael Maire Serge Belongie James Hays Pietro Perona Deva Ramanan Piotr Doll\u00e1r and C. Lawrence Zitnick. 2014. Microsoft COCO: Common Objects in Context. In ECCV. 740--755.  Tsung-Yi Lin Michael Maire Serge Belongie James Hays Pietro Perona Deva Ramanan Piotr Doll\u00e1r and C. Lawrence Zitnick. 2014. Microsoft COCO: Common Objects in Context. In ECCV. 740--755.","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.5555\/302528.302753"},{"volume-title":"Saliency Weighted Convolutional Features for Instance Search. In 2018 International Conference on Content-Based Multimedia Indexing (CBMI). 1--6.","year":"2018","author":"Mohedano E.","key":"e_1_3_2_1_26_1"},{"volume-title":"DLWL: Improving Detection for Lowshot Classes With Weakly Labelled Data. In CVPR.","year":"2020","author":"Ramanathan Vignesh","key":"e_1_3_2_1_27_1"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"crossref","unstructured":"E. Real J. Shlens S. Mazzocchi X. Pan and V. Vanhoucke. 2017. YouTube-Bounding Boxes: A Large High-Precision Human-Annotated Data Set for Object Detection in Video. In CVPR. 7464--7473.  E. Real J. Shlens S. Mazzocchi X. Pan and V. Vanhoucke. 2017. YouTube-Bounding Boxes: A Large High-Precision Human-Annotated Data Set for Object Detection in Video. In CVPR. 7464--7473.","DOI":"10.1109\/CVPR.2017.789"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"crossref","unstructured":"J. Redmon S. Divvala R. Girshick and A. Farhadi. 2016. You Only Look Once: Unified Real-Time Object Detection. In CVPR. 779--788.  J. Redmon S. Divvala R. Girshick and A. Farhadi. 2016. You Only Look Once: Unified Real-Time Object Detection. In CVPR. 779--788.","DOI":"10.1109\/CVPR.2016.91"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2456908"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"volume-title":"Faster R-CNN Features for Instance Search. In CVPR Workshops.","year":"2016","author":"Salvador Amaia","key":"e_1_3_2_1_33_1"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2804907"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.230"},{"volume-title":"FSCE: Few-Shot Object Detection via Contrastive Proposal Encoding. arxiv: 2103.05950 [cs.CV]","year":"2021","author":"Sun Bo","key":"e_1_3_2_1_36_1"},{"key":"e_1_3_2_1_37_1","first-page":"176","article-title":"PCL","volume":"42","author":"Tang P.","year":"2020","journal-title":"Proposal Cluster Learning for Weakly Supervised Object Detection. TPAMI"},{"volume-title":"Particular Object Retrieval with Integral Max-Pooling of CNN Activations. arXiv preprint arXiv:1511.05879","year":"2015","author":"Tolias Giorgos","key":"e_1_3_2_1_38_1"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/2700292"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"crossref","unstructured":"Xiaolong Wang Ross Girshick Abhinav Gupta and Kaiming He. 2018. Non-Local Neural Networks. In CVPR.  Xiaolong Wang Ross Girshick Abhinav Gupta and Kaiming He. 2018. Non-Local Neural Networks. In CVPR.","DOI":"10.1109\/CVPR.2018.00813"},{"key":"e_1_3_2_1_41_1","first-page":"9919","article-title":"Frustratingly Simple Few-Shot Object Detection","volume":"119","author":"Wang Xin","year":"2020","journal-title":"ICML"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"crossref","unstructured":"Y. Wang D. Ramanan and M. Hebert. 2019. Meta-Learning to Detect Rare Objects. In ICCV. 9924--9933.  Y. Wang D. Ramanan and M. Hebert. 2019. Meta-Learning to Detect Rare Objects. In ICCV. 9924--9933.","DOI":"10.1109\/ICCV.2019.01002"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2018.10.022"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"crossref","unstructured":"Jiaxi Wu Songtao Liu Di Huang and Yunhong Wang. 2020 a. Multi-scale Positive Sample Refinement for Few-Shot Object Detection. In ECCV. 456--472.  Jiaxi Wu Songtao Liu Di Huang and Yunhong Wang. 2020 a. Multi-scale Positive Sample Refinement for Few-Shot Object Detection. In ECCV. 456--472.","DOI":"10.1007\/978-3-030-58517-4_27"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413832"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2014.2388226"},{"volume-title":"Deeply Activated Salient Region for Instance Search. arxiv","year":"2002","author":"Xiao Hui-Chu","key":"e_1_3_2_1_47_1"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"crossref","unstructured":"X. Yan Z. Chen A. Xu X. Wang X. Liang and L. Lin. 2019. Meta R-CNN: Towards General Solver for Instance-Level Low-Shot Learning. In ICCV. 9576--9585.  X. Yan Z. Chen A. Xu X. Wang X. Liang and L. Lin. 2019. Meta R-CNN: Towards General Solver for Instance-Level Low-Shot Learning. In ICCV. 9576--9585.","DOI":"10.1109\/ICCV.2019.00967"},{"volume-title":"Instance Search via Instance Level Segmentation and Feature Representation. arxiv","year":"1806","author":"Zhan Yu","key":"e_1_3_2_1_49_1"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-018-1112-4"},{"key":"e_1_3_2_1_51_1","unstructured":"Chenchen Zhu Fangyi Chen Uzair Ahmed and Marios Savvides. 2021. Semantic Relation Reasoning for Shot-Stable Few-Shot Object Detection. arxiv: 2103.01903 [cs.CV]  Chenchen Zhu Fangyi Chen Uzair Ahmed and Marios Savvides. 2021. Semantic Relation Reasoning for Shot-Stable Few-Shot Object Detection. arxiv: 2103.01903 [cs.CV]"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"crossref","unstructured":"Zheng Zhu Qiang Wang Bo Li Wei Wu Junjie Yan and Weiming Hu. 2018. Distractor-aware Siamese Networks for Visual Object Tracking. In ECCV.  Zheng Zhu Qiang Wang Bo Li Wei Wu Junjie Yan and Weiming Hu. 2018. Distractor-aware Siamese Networks for Visual Object Tracking. In ECCV.","DOI":"10.1007\/978-3-030-01240-3_7"}],"event":{"name":"MM '21: ACM Multimedia Conference","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Virtual Event China","acronym":"MM '21"},"container-title":["Proceedings of the 29th ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474085.3475530","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3474085.3475530","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:49:10Z","timestamp":1750193350000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474085.3475530"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,10,17]]},"references-count":52,"alternative-id":["10.1145\/3474085.3475530","10.1145\/3474085"],"URL":"https:\/\/doi.org\/10.1145\/3474085.3475530","relation":{},"subject":[],"published":{"date-parts":[[2021,10,17]]},"assertion":[{"value":"2021-10-17","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}