{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,11]],"date-time":"2026-01-11T01:02:00Z","timestamp":1768093320029,"version":"3.49.0"},"reference-count":48,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2022,7,27]],"date-time":"2022-07-27T00:00:00Z","timestamp":1658880000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,7,27]],"date-time":"2022-07-27T00:00:00Z","timestamp":1658880000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Sci. China Inf. Sci."],"published-print":{"date-parts":[[2022,8]]},"DOI":"10.1007\/s11432-021-3396-7","type":"journal-article","created":{"date-parts":[[2022,7,30]],"date-time":"2022-07-30T09:02:47Z","timestamp":1659171767000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":18,"title":["Fast target-aware learning for few-shot video object segmentation"],"prefix":"10.1007","volume":"65","author":[{"given":"Yadang","family":"Chen","sequence":"first","affiliation":[]},{"given":"Chuanyan","family":"Hao","sequence":"additional","affiliation":[]},{"given":"Zhi-Xin","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Enhua","family":"Wu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,7,27]]},"reference":[{"key":"3396_CR1","doi-asserted-by":"publisher","first-page":"132201","DOI":"10.1007\/s11432-019-2878-y","volume":"64","author":"W M Wu","year":"2021","unstructured":"Wu W M, Wang Q, Yuan C Z, et al. Rapid dynamical pattern recognition for sampling sequences. Sci China Inf Sci, 2021, 64: 132201","journal-title":"Sci China Inf Sci"},{"key":"3396_CR2","doi-asserted-by":"publisher","first-page":"140307","DOI":"10.1007\/s11432-019-2784-4","volume":"63","author":"Y F Gu","year":"2020","unstructured":"Gu Y F, Liu H, Wang T F, et al. Deep feature extraction and motion representation for satellite video scene classification. Sci China Inf Sci, 2020, 63: 140307","journal-title":"Sci China Inf Sci"},{"key":"3396_CR3","doi-asserted-by":"publisher","first-page":"092103","DOI":"10.1007\/s11432-015-0957-4","volume":"59","author":"Y D Chen","year":"2016","unstructured":"Chen Y D, Hao C Y, Wu W, et al. Robust dense reconstruction by range merging based on confidence estimation. Sci China Inf Sci, 2016, 59: 092103","journal-title":"Sci China Inf Sci"},{"key":"3396_CR4","doi-asserted-by":"crossref","unstructured":"Perazzi F, Khoreva A, Benenson R, et al. Learning video object segmentation from static images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2017","DOI":"10.1109\/CVPR.2017.372"},{"key":"3396_CR5","doi-asserted-by":"crossref","unstructured":"Caelles S, Maninis K K, Pont-Tuset J, et al. One-shot video object segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2017. 5320\u20135329","DOI":"10.1109\/CVPR.2017.565"},{"key":"3396_CR6","doi-asserted-by":"crossref","unstructured":"Lu X K, Wang W G, Shen J B, et al. Learning video object segmentation from unlabeled videos. In: Proceedings of the 2020 IEEE Conference on Computer Vision and Pattern Recognition, 2020. 8957\u20138967","DOI":"10.1109\/CVPR42600.2020.00898"},{"key":"3396_CR7","doi-asserted-by":"crossref","unstructured":"Luiten J, Voigtlaender P, Leibe B. PReMVOS: proposal-generation, refinement and merging for video object segmentation. In: Proceedings of the 2018 DAVIS Challenge on Video Object Segmentation-CVPR Workshops, 2018","DOI":"10.1007\/978-3-030-20870-7_35"},{"key":"3396_CR8","doi-asserted-by":"publisher","first-page":"1515","DOI":"10.1109\/TPAMI.2018.2838670","volume":"41","author":"K K Maninis","year":"2019","unstructured":"Maninis K K, Caelles S, Chen Y, et al. Video object segmentation without temporal information. IEEE Trans Pattern Anal Mach Intell, 2019, 41: 1515\u20131530","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"3396_CR9","doi-asserted-by":"publisher","first-page":"1175","DOI":"10.1007\/s11263-019-01164-6","volume":"127","author":"A Khoreva","year":"2019","unstructured":"Khoreva A, Benenson R, Ilg E, et al. Lucid data dreaming for video object segmentation. Int J Comput Vis, 2019, 127: 1175\u20131197","journal-title":"Int J Comput Vis"},{"key":"3396_CR10","doi-asserted-by":"crossref","unstructured":"Oh S W, Lee J, Sunkavalli K, et al. Fast video object segmentation by reference-guided mask propagation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2018. 7376\u20137385","DOI":"10.1109\/CVPR.2018.00770"},{"key":"3396_CR11","doi-asserted-by":"crossref","unstructured":"Xiao H, Feng J, Lin G, et al. MoNet: deep motion exploitation for video object segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2018. 1140\u20131148","DOI":"10.1109\/CVPR.2018.00125"},{"key":"3396_CR12","doi-asserted-by":"crossref","unstructured":"Johnander J, Danelljan M, Brissman E, et al. A generative appearance model for end-to-end video object segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2019. 8945\u20138954","DOI":"10.1109\/CVPR.2019.00916"},{"key":"3396_CR13","doi-asserted-by":"crossref","unstructured":"Xie H Z, Yao H X, Zhou S C, et al. Efficient regional memory network for video object segmentation. 2021. ArXiv:2103.12934","DOI":"10.1109\/CVPR46437.2021.00134"},{"key":"3396_CR14","doi-asserted-by":"crossref","unstructured":"Hu Y T, Huang J B, Schwing A G. VideoMatch: matching based video object segmentation. In: Proceedings of the 2018 European Conference on Computer Vision, 2018","DOI":"10.1007\/978-3-030-01237-3_4"},{"key":"3396_CR15","doi-asserted-by":"crossref","unstructured":"Voigtlaender P, Chai Y, Schroff F, et al. FEELVOS: fast end-to-end embedding learning for video object segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2019. 9473\u20139482","DOI":"10.1109\/CVPR.2019.00971"},{"key":"3396_CR16","doi-asserted-by":"crossref","unstructured":"Lin H, Qi X, Jia J. AGSS-VOS: attention guided single-shot video object segmentation. In: Proceedings of the IEEE International Conference on Computer Vision, 2019. 3948\u20133956","DOI":"10.1109\/ICCV.2019.00405"},{"key":"3396_CR17","doi-asserted-by":"crossref","unstructured":"Yang Z X, Wei Y C, Yang Y. Collaborative video object segmentation by foreground-background integration. In: Proceedings of the European Conference on Computer Vision, 2020","DOI":"10.1007\/978-3-030-58558-7_20"},{"key":"3396_CR18","unstructured":"Vaswani A, Shazeera N, Parmar N, et al. Attention is all you need. In: Proceedings of the 31st International Conference on Neural Information Processing Systems, 2017. 6000\u20136010"},{"key":"3396_CR19","doi-asserted-by":"crossref","unstructured":"Oh S W, Lee J, Xu N, et al. Video object segmentation using space-time memory networks. In: Proceedings of the IEEE International Conference on Computer Vision, 2019. 9225\u20139234","DOI":"10.1109\/ICCV.2019.00932"},{"key":"3396_CR20","doi-asserted-by":"crossref","unstructured":"Li Y, Shen Z R, Shan Y. Fast video object segmentation using the global context module. In: Proceedings of the European Conference on Computer Vision, 2020","DOI":"10.1007\/978-3-030-58607-2_43"},{"key":"3396_CR21","unstructured":"Liang Y Q, Li X, Jafari N, et al. Video object segmentation with adaptive feature bank and uncertain-region refinement. In: Proceedings of the Conference on Neural Information Processing Systems, 2020"},{"key":"3396_CR22","doi-asserted-by":"crossref","unstructured":"Wang H C, Jiang X L, Ren H B, et al. SwiftNet: real-time video object segmentation. 2021. ArXiv:2102.04604","DOI":"10.1109\/CVPR46437.2021.00135"},{"key":"3396_CR23","doi-asserted-by":"crossref","unstructured":"Hu L, Zhang P, Zhang B, et al. Learning position and target consistency for memory-based video object segmentation. 2021. ArXiv:2104.04329","DOI":"10.1109\/CVPR46437.2021.00413"},{"key":"3396_CR24","doi-asserted-by":"crossref","unstructured":"Duke B, Ahmed A, Wolf C, et al. SSTVOS: sparse spatiotemporal transformers for video object segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2021","DOI":"10.1109\/CVPR46437.2021.00585"},{"key":"3396_CR25","doi-asserted-by":"publisher","first-page":"1934","DOI":"10.1109\/TMM.2018.2890361","volume":"21","author":"Y D Chen","year":"2019","unstructured":"Chen Y D, Hao C Y, Liu A X, et al. Multilevel model for video object segmentation based on supervision optimization. IEEE Trans Multimedia, 2019, 21: 1934\u20131945","journal-title":"IEEE Trans Multimedia"},{"key":"3396_CR26","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1016\/j.neucom.2020.03.020","volume":"401","author":"C Y Hao","year":"2020","unstructured":"Hao C Y, Chen Y D, Yang Z X, et al. Higher-order potentials for video object segmentation in bilateral space. Neurocomputing, 2020, 401: 28\u201335","journal-title":"Neurocomputing"},{"key":"3396_CR27","first-page":"1","volume":"15","author":"Y D Chen","year":"2019","unstructured":"Chen Y D, Hao C Y, Liu A X, et al. Appearance-consistent video object segmentation based on a multinomial event model. ACM Trans Multimedia Comput Commun Appl, 2019, 15: 1\u201315","journal-title":"ACM Trans Multimedia Comput Commun Appl"},{"key":"3396_CR28","unstructured":"Pont-Tuset J, Perazzi F, Caelles S, et al. The 2017 DAVIS challenge on video object segmentation. 2017. ArXiv:1704.00675"},{"key":"3396_CR29","doi-asserted-by":"crossref","unstructured":"Xu N, Yang L J, Fan Y C, et al. YouTube-VOS: a large-scale video object segmentation benchmark. 2018. ArXiv:1809.03327","DOI":"10.1007\/978-3-030-01228-1_36"},{"key":"3396_CR30","doi-asserted-by":"crossref","unstructured":"Voigtlaender P, Leibe B. Online adaptation of convolutional neural networks for video object segmentation. In: Proceedings of the British Machine Vision Conference, 2017","DOI":"10.5244\/C.31.116"},{"key":"3396_CR31","doi-asserted-by":"crossref","unstructured":"Li X X, Loy C C. Video object segmentation with joint re-identification and attention-aware mask propagation. In: Proceedings of the European Conference on Computer Vision, 2018","DOI":"10.1007\/978-3-030-01219-9_6"},{"key":"3396_CR32","doi-asserted-by":"crossref","unstructured":"Griffin B A, Corso J J. BubbleNets: learning to select the guidance frame in video object segmentation by deep sorting frames. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2019. 8906\u20138915","DOI":"10.1109\/CVPR.2019.00912"},{"key":"3396_CR33","doi-asserted-by":"crossref","unstructured":"Tian Z, He T, Shen C. Decoders matter for semantic segmentation: data-dependent decoding enables flexible feature aggregation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2019. 3121\u20133130","DOI":"10.1109\/CVPR.2019.00324"},{"key":"3396_CR34","doi-asserted-by":"crossref","unstructured":"Bao L C, Wu B Y, Liu W. CNN in MRF: video object segmentation via inference in a CNN-based higher-order spatio-temporal MRF. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2018","DOI":"10.1109\/CVPR.2018.00626"},{"key":"3396_CR35","doi-asserted-by":"crossref","unstructured":"Zhang Y, Wu Z, Peng H, et al. A transductive approach for video object segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2020. 6947\u20136956","DOI":"10.1109\/CVPR42600.2020.00698"},{"key":"3396_CR36","doi-asserted-by":"crossref","unstructured":"Zhang K H, Wang L, Liu D, et al. Dual temporal memory network for efficient video object segmentation. 2020. ArXiv:2003.06125","DOI":"10.1145\/3394171.3413942"},{"key":"3396_CR37","doi-asserted-by":"crossref","unstructured":"Chen Y, Pont-Tuset J, Montes A, et al. Blazingly fast video object segmentation with pixel-wise metric learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2018. 1189\u20131198","DOI":"10.1109\/CVPR.2018.00130"},{"key":"3396_CR38","unstructured":"Hospedales T, Antoniou A, Micaelli P, et al. Meta-learning in neural networks: a survey. 2020. ArXiv:2004.05439"},{"key":"3396_CR39","doi-asserted-by":"crossref","unstructured":"Yang L, Wang Y, Xiong X, et al. Efficient video object segmentation via network modulation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2018. 6499\u20136507","DOI":"10.1109\/CVPR.2018.00680"},{"key":"3396_CR40","first-page":"1","volume":"12","author":"L L Tang","year":"2020","unstructured":"Tang L L, Chen K, Wu C, et al. Improving semantic analysis on point clouds via auxiliary supervision of local geometric priors. IEEE Trans Cybern, 2020, 12: 1\u201311","journal-title":"IEEE Trans Cybern"},{"key":"3396_CR41","doi-asserted-by":"crossref","unstructured":"Robinson A, Lawin A J, Danelljan M, et al. Learning fast and robust target models for video object segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2020. 7404\u20137413","DOI":"10.1109\/CVPR42600.2020.00743"},{"key":"3396_CR42","doi-asserted-by":"crossref","unstructured":"Bhat G, Lawin F G, Danelljan M, et al. Learning what to learn for video object segmentation. In: Proceedings of the European Conference on Computer Vision, 2020","DOI":"10.1007\/978-3-030-58536-5_46"},{"key":"3396_CR43","doi-asserted-by":"crossref","unstructured":"Behl H S, Najafi M, Arnab A, et al. Meta learning deep visual words for fast video object segmentation. In: Proceedings of the Conference on Neural Information Processing Systems Machine Learning for Autonomous Driving Workshop, 2019","DOI":"10.1109\/IROS45743.2020.9341737"},{"key":"3396_CR44","doi-asserted-by":"crossref","unstructured":"Pinheiro P, Lin T Y, Collobert R, et al. Learning to refine object segments. In: Proceedings of the European Conference on Computer Vision, 2016. 75\u201391","DOI":"10.1007\/978-3-319-46448-0_5"},{"key":"3396_CR45","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1109\/TPAMI.2017.2699184","volume":"40","author":"L C Chen","year":"2018","unstructured":"Chen L C, Papandreou G, Kokkinos I, et al. DeepLab: semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected CRFs. IEEE Trans Pattern Anal Mach Intell, 2018, 40: 834\u2013848","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"3396_CR46","doi-asserted-by":"crossref","unstructured":"He K M, Zhang X, Ren S Q, et al. Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2016. 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"3396_CR47","unstructured":"Finn C, Abbeel P, Levine S. Model-agnostic meta-learning for fast adaptation of deep networks. In: Proceedings of the Machine Learning Research, 2017. 1126\u20131135"},{"key":"3396_CR48","doi-asserted-by":"crossref","unstructured":"He K M, Zhang X, Ren S Q, et al. Delving deep into rectifiers: surpassing human-level performance on ImageNet classification. In: Proceedings of the IEEE International Conference on Computer Vision, 2015. 1026\u20131034","DOI":"10.1109\/ICCV.2015.123"}],"container-title":["Science China Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-021-3396-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11432-021-3396-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-021-3396-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,30]],"date-time":"2024-09-30T07:23:23Z","timestamp":1727681003000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11432-021-3396-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,7,27]]},"references-count":48,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2022,8]]}},"alternative-id":["3396"],"URL":"https:\/\/doi.org\/10.1007\/s11432-021-3396-7","relation":{},"ISSN":["1674-733X","1869-1919"],"issn-type":[{"value":"1674-733X","type":"print"},{"value":"1869-1919","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,7,27]]},"assertion":[{"value":"12 July 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 October 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 December 2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 July 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"182104"}}