{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T12:40:53Z","timestamp":1772800853667,"version":"3.50.1"},"reference-count":92,"publisher":"Springer Science and Business Media LLC","issue":"19","license":[{"start":{"date-parts":[[2022,5,20]],"date-time":"2022-05-20T00:00:00Z","timestamp":1653004800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,5,20]],"date-time":"2022-05-20T00:00:00Z","timestamp":1653004800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100010909","name":"Young Scientists Fund","doi-asserted-by":"publisher","award":["51807003"],"award-info":[{"award-number":["51807003"]}],"id":[{"id":"10.13039\/501100010909","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Comput &amp; Applic"],"published-print":{"date-parts":[[2022,10]]},"DOI":"10.1007\/s00521-022-07330-1","type":"journal-article","created":{"date-parts":[[2022,5,20]],"date-time":"2022-05-20T23:02:47Z","timestamp":1653087767000},"page":"16861-16877","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["Spatiotemporal context-aware network for video salient object detection"],"prefix":"10.1007","volume":"34","author":[{"given":"Tianyou","family":"Chen","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2462-4996","authenticated-orcid":false,"given":"Jin","family":"Xiao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaoguang","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guofeng","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shaojie","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,5,20]]},"reference":[{"key":"7330_CR1","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1109\/TIP.2018.2843680","volume":"27","author":"W Qiu","year":"2018","unstructured":"Qiu W, Gao X, Han B (2018) Eye fixation assisted video saliency detection via total variation-based pairwise interaction. IEEE Trans Image Process 27:10. https:\/\/doi.org\/10.1109\/TIP.2018.2843680","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR2","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1109\/TIP.2018.2849860","volume":"27","author":"TN Le","year":"2018","unstructured":"Le TN, Sugimoto A (2018) Video salient object detection using spatiotemporal deep features. IEEE Trans Image Process 27:10. https:\/\/doi.org\/10.1109\/TIP.2018.2849860","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR3","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2011.2125450","author":"W Kim","year":"2011","unstructured":"Kim W, Jung C, Kim C (2011) Spatiotemporal saliency detection and its applications in static and dynamic scenes. IEEE Trans Circuits Syst Video Technol. https:\/\/doi.org\/10.1109\/TCSVT.2011.2125450","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"7330_CR4","doi-asserted-by":"publisher","unstructured":"Hu YT, Bin Huang J, Schwing AG (2018) Unsupervised video object segmentation using motion saliency-guided spatio-temporal propagation. Lecture notes in computer science (including subseries lecture notes in artificial intelligence and lecture notes in bioinformatics), vol 11205 LNCS. https:\/\/doi.org\/10.1007\/978-3-030-01246-5_48","DOI":"10.1007\/978-3-030-01246-5_48"},{"key":"7330_CR5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00783","author":"S Gorji","year":"2018","unstructured":"Gorji S, Clark JJ (2018) Going from image to video saliency: augmenting image salience with dynamic attentional push. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2018.00783","journal-title":"CVPR"},{"key":"7330_CR6","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2839523","author":"C Chen","year":"2018","unstructured":"Chen C, Li S, Qin H, Pan Z, Yang G (2018) Bilevel feature learning for video saliency detection. IEEE Trans Multimed. https:\/\/doi.org\/10.1109\/TMM.2018.2839523","journal-title":"IEEE Trans Multimed"},{"key":"7330_CR7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.47","author":"N Xu","year":"2016","unstructured":"Xu N, Price B, Cohen S, Yang J, Huang T (2016) Deep interactive object selection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2016.47","journal-title":"CVPR"},{"key":"7330_CR8","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2013.2282897","author":"H Hadizadeh","year":"2014","unstructured":"Hadizadeh H, Bajic IV (2014) Saliency-aware video compression. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2013.2282897","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR9","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2009.2030969","author":"C Guo","year":"2010","unstructured":"Guo C, Zhang L (2010) A novel multiresolution spatiotemporal saliency detection model and its applications in image and video compression. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2009.2030969","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.111","author":"Y Pan","year":"2017","unstructured":"Pan Y, Yao T, Li H, Mei T (2017) Video captioning with transferred semantic attributes. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2017.111","journal-title":"CVPR"},{"key":"7330_CR11","doi-asserted-by":"publisher","unstructured":"Xu N et al (2018) YouTube-VOS: sequence-to-sequence video object segmentation. In: Lecture notes in computer science (including subseries lecture notes in artificial intelligence and lecture notes in bioinformatics), vol 11209 LNCS. https:\/\/doi.org\/10.1007\/978-3-030-01228-1_36.","DOI":"10.1007\/978-3-030-01228-1_36"},{"key":"7330_CR12","doi-asserted-by":"publisher","unstructured":"Wang W, Shen J, Porikli F (2015) Saliency-aware geodesic video object segmentation. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition, vol 07-12-June-2015. https:\/\/doi.org\/10.1109\/CVPR.2015.7298961","DOI":"10.1109\/CVPR.2015.7298961"},{"key":"7330_CR13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.79","author":"Z Zhang","year":"2016","unstructured":"Zhang Z, Fidler S, Urtasun R (2016) Instance-level segmentation for autonomous driving with deep densely connected MRFs. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2016.79","journal-title":"CVPR"},{"key":"7330_CR14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.407","author":"C Yang","year":"2013","unstructured":"Yang C, Zhang L, Lu H, Ruan X, Yang MH (2013) Saliency detection via graph-based manifold ranking. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2013.407","journal-title":"CVPR"},{"key":"7330_CR15","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2662005","author":"W Wang","year":"2018","unstructured":"Wang W, Shen J, Yang R, Porikli F (2018) Saliency-aware video object segmentation. IEEE Trans Pattern Anal Mach Intel. https:\/\/doi.org\/10.1109\/TPAMI.2017.2662005","journal-title":"IEEE Trans Pattern Anal Mach Intel"},{"key":"7330_CR16","doi-asserted-by":"publisher","unstructured":"Wang W, Shen J, Guo F, Cheng MM, Borji A (2018) Revisiting video saliency: a large-scale benchmark and a new model. https:\/\/doi.org\/10.1109\/CVPR.2018.00514.","DOI":"10.1109\/CVPR.2018.00514"},{"key":"7330_CR17","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2787612","author":"W Wang","year":"2018","unstructured":"Wang W, Shen J (2018) Deep visual attention prediction. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2017.2787612","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR18","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2015.2460013","author":"W Wang","year":"2015","unstructured":"Wang W, Shen J, Shao L (2015) Consistent video saliency using local gradient flow optimization and global refinement. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2015.2460013","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR19","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2017.2761361","author":"F Guo","year":"2018","unstructured":"Guo F et al (2018) Video saliency detection using object proposals. IEEE Trans Cybern. https:\/\/doi.org\/10.1109\/TCYB.2017.2761361","journal-title":"IEEE Trans Cybern"},{"key":"7330_CR20","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2336549","author":"Y Fang","year":"2014","unstructured":"Fang Y, Wang Z, Lin W, Fang Z (2014) Video saliency incorporating spatiotemporal cues and uncertainty weighting. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2014.2336549","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR21","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3068644","author":"C Chen","year":"2021","unstructured":"Chen C, Wang G, Peng C, Fang Y, Zhang D, Qin H (2021) Exploring rich and efficient spatial temporal interactions for real-time video salient object detection. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2021.3068644","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR22","doi-asserted-by":"publisher","unstructured":"Wu Z, Su L, Huang Q (2019) Cascaded partial decoder for fast and accurate salient object detection. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition, vol 2019-June. https:\/\/doi.org\/10.1109\/CVPR.2019.00403","DOI":"10.1109\/CVPR.2019.00403"},{"key":"7330_CR23","doi-asserted-by":"publisher","unstructured":"Zhao J, Liu JJ, Fan DP, Cao Y, Yang J, Cheng MM (2019) EGNet: edge guidance network for salient object detection. In: Proceedings of the IEEE international conference on computer vision, vol 2019-October. https:\/\/doi.org\/10.1109\/ICCV.2019.00887","DOI":"10.1109\/ICCV.2019.00887"},{"key":"7330_CR24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00404","author":"JJ Liu","year":"2019","unstructured":"Liu JJ, Hou Q, Cheng MM, Feng J, Jiang J (2019) A simple pooling-based design for real-time salient object detection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2019.00404","journal-title":"CVPR"},{"key":"7330_CR25","doi-asserted-by":"crossref","unstructured":"Li S, Sui X, Luo X, Xu X, Liu Y, Goh R (2021) Medical image segmentation using squeeze-and-expansion transformers [Online]. Available: http:\/\/arxiv.org\/abs\/2105.09511","DOI":"10.24963\/ijcai.2021\/112"},{"key":"7330_CR26","unstructured":"Mao Y et al (2021) Transformer transforms salient object detection and camouflaged object detection 14(8):1\u201315, [Online]. Available: http:\/\/arxiv.org\/abs\/2104.10127"},{"key":"7330_CR27","unstructured":"Vaswani A et al (2017) Attention is all you need. Advances in neural information processing systems, vol. 2017-December"},{"key":"7330_CR28","unstructured":"Chen J et al (2021) TransUNet: transformers make strong encoders for medical image segmentation, pp 1\u201313, [Online]. Available: http:\/\/arxiv.org\/abs\/2102.04306"},{"key":"7330_CR29","unstructured":"Dosovitskiy A et al (2021) An image is worth 16\u2009\u00d7\u200916 words: transformers for image recognition at scale. ICLR"},{"key":"7330_CR30","doi-asserted-by":"publisher","unstructured":"Li H, Chen G, Li G, Yu Y (2019) Motion guided attention for video salient object detection. In: Proceedings of the IEEE international conference on computer vision, vol 2019-October. https:\/\/doi.org\/10.1109\/ICCV.2019.00737","DOI":"10.1109\/ICCV.2019.00737"},{"key":"7330_CR31","doi-asserted-by":"publisher","unstructured":"Ren S, Han C, Yang X, Han G, He S (2020) TENet: triple excitation network for video salient object detection. Lecture notes in computer science (including subseries lecture notes in artificial intelligence and lecture notes in bioinformatics), vol 12350 LNCS. https:\/\/doi.org\/10.1007\/978-3-030-58558-7_13","DOI":"10.1007\/978-3-030-58558-7_13"},{"key":"7330_CR32","doi-asserted-by":"publisher","unstructured":"Song H, Wang W, Zhao S, Shen J, Lam KM (2018) Pyramid dilated deeper ConvLSTM for video salient object detection. In: Lecture notes in computer science (including subseries lecture notes in artificial intelligence and lecture notes in bioinformatics), vol 11215 LNCS, https:\/\/doi.org\/10.1007\/978-3-030-01252-6_44","DOI":"10.1007\/978-3-030-01252-6_44"},{"key":"7330_CR33","doi-asserted-by":"publisher","unstructured":"Fan DP, Wang W, Cheng MM, Shen J (2019) Shifting more attention to video salient object detection. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition, vol. 2019-June. https:\/\/doi.org\/10.1109\/CVPR.2019.00875","DOI":"10.1109\/CVPR.2019.00875"},{"key":"7330_CR34","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6633","author":"Z Chen","year":"2020","unstructured":"Chen Z, Xu Q, Cong R, Huang Q (2020) Global context-aware progressive aggregation network for salient object detection. AAAI. https:\/\/doi.org\/10.1609\/aaai.v34i07.6633","journal-title":"AAAI"},{"key":"7330_CR35","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr42600.2020.00943","author":"Y Pang","year":"2020","unstructured":"Pang Y, Zhao X, Zhang L, Lu H (2020) Multi-scale interactive network for salient object detection. CVPR. https:\/\/doi.org\/10.1109\/cvpr42600.2020.00943","journal-title":"CVPR"},{"key":"7330_CR36","unstructured":"Klein DA, Frintrop S (2021) Center-surround divergence of feature statistics for salient object detection. ICCV"},{"key":"7330_CR37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.271","author":"H Jiang","year":"2013","unstructured":"Jiang H, Wang J, Yuan Z, Wu Y, Zheng N, Li S (2013) Salient object detection: a discriminative regional feature integration approach. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2013.271","journal-title":"CVPR"},{"key":"7330_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2017.11.024","author":"J Liang","year":"2018","unstructured":"Liang J, Zhou J, Tong L, Bai X, Wang B (2018) Material based salient object detection from hyperspectral images. Pattern Recognit. https:\/\/doi.org\/10.1016\/j.patcog.2017.11.024","journal-title":"Pattern Recognit"},{"key":"7330_CR39","unstructured":"Shijian L, Joo-Hwee L (2012) Saliency modeling from image histograms. ECCV"},{"key":"7330_CR40","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.158","author":"S Lu","year":"2014","unstructured":"Lu S, Tan C, Lim JH (2014) Robust and efficient saliency modeling from image co-occurrence histograms. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2013.158","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"7330_CR41","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2016.10.025","author":"J Zhang","year":"2017","unstructured":"Zhang J, Ehinger KA, Wei H, Zhang K, Yang J (2017) A novel graph-based optimization framework for salient object detection. Pattern Recognit. https:\/\/doi.org\/10.1016\/j.patcog.2016.10.025","journal-title":"Pattern Recognit"},{"key":"7330_CR42","doi-asserted-by":"publisher","unstructured":"Wang T, Borji A, Zhang L, Zhang P, Lu H (2017) A stagewise refinement model for detecting salient objects in images. In: Proceedings of the IEEE international conference on computer vision, vol 2017-October. https:\/\/doi.org\/10.1109\/ICCV.2017.433","DOI":"10.1109\/ICCV.2017.433"},{"key":"7330_CR43","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2021.04.078","author":"T Chen","year":"2021","unstructured":"Chen T, Hu X, Xiao J, Zhang G (2021) BPFINet: boundary-aware progressive feature integration network for salient object detection. Neurocomputing. https:\/\/doi.org\/10.1016\/j.neucom.2021.04.078","journal-title":"Neurocomputing"},{"key":"7330_CR44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00320","author":"T Zhao","year":"2019","unstructured":"Zhao T, Wu X (2019) Pyramid feature attention network for saliency detection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2019.00320","journal-title":"CVPR"},{"key":"7330_CR45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00766","author":"X Qin","year":"2019","unstructured":"Qin X, Zhang Z, Huang C, Gao C, Dehghan M, Jagersand M (2019) Basnet: Boundary-aware salient object detection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2019.00766","journal-title":"CVPR"},{"key":"7330_CR46","doi-asserted-by":"publisher","unstructured":"Feng M, Lu H, Ding E (2019) Attentive feedback network for boundary-aware salient object detection. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition, vol. 2019-June. https:\/\/doi.org\/10.1109\/CVPR.2019.00172","DOI":"10.1109\/CVPR.2019.00172"},{"key":"7330_CR47","doi-asserted-by":"publisher","first-page":"8652","DOI":"10.1109\/TIP.2020.3017352","volume":"29","author":"JJ Liu","year":"2020","unstructured":"Liu JJ, Hou Q, Cheng MM (2020) Dynamic feature integration for simultaneous detection of salient object, edge, and skeleton. IEEE Trans Image Process 29:8652\u20138667. https:\/\/doi.org\/10.1109\/TIP.2020.3017352","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR48","doi-asserted-by":"publisher","unstructured":"Chen Z, Xu Q, Cong R, Huang Q (2020) Global context-aware progressive aggregation network for salient object detection. https:\/\/doi.org\/10.1609\/aaai.v34i07.6633","DOI":"10.1609\/aaai.v34i07.6633"},{"key":"7330_CR49","doi-asserted-by":"crossref","unstructured":"Zhao X, Pang Y, Zhang L, Lu H, Zhang L (2020) Suppress and balance: a simple gated network for salient object detection. ECCV","DOI":"10.1109\/CVPR42600.2020.00943"},{"key":"7330_CR50","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00736","author":"Z Wu","year":"2019","unstructured":"Wu Z, Su L, Huang Q (2019) Stacked cross refinement network for edge-aware salient object detection. ICCV. https:\/\/doi.org\/10.1109\/ICCV.2019.00736","journal-title":"ICCV"},{"key":"7330_CR51","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6916","author":"J Wei","year":"2020","unstructured":"Wei J, Wang S, Huang Q (2020) F3Net: fusion, feedback and focus for salient object detection. AAAI. https:\/\/doi.org\/10.1609\/aaai.v34i07.6916","journal-title":"AAAI"},{"key":"7330_CR52","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2019.2941017","author":"L Zhu","year":"2020","unstructured":"Zhu L et al (2020) Aggregating attentional dilated features for salient object detection. IEEE Trans Circ Syst Video Technol. https:\/\/doi.org\/10.1109\/TCSVT.2019.2941017","journal-title":"IEEE Trans Circ Syst Video Technol"},{"key":"7330_CR53","doi-asserted-by":"publisher","DOI":"10.1109\/tcsvt.2020.2980853","author":"Z Tu","year":"2020","unstructured":"Tu Z, Ma Y, Li C, Li C, Tang J, Luo B (2020) Edge-guided non-local fully convolutional network for salient object detection. IEEE Trans Circuits Syst Video Technol. https:\/\/doi.org\/10.1109\/tcsvt.2020.2980853","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"7330_CR54","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2008.4587715","author":"C Guo","year":"2008","unstructured":"Guo C, Ma Q, Zhang L (2008) Spatio-temporal saliency detection using phase spectrum of quaternion fourier transform. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2008.4587715","journal-title":"CVPR"},{"key":"7330_CR55","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2015.2425544","author":"H Kim","year":"2015","unstructured":"Kim H, Kim Y, Sim JY, Kim CS (2015) Spatiotemporal saliency detection for video sequences based on random walk with restart. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2015.2425544","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR56","doi-asserted-by":"publisher","unstructured":"Zhang P, Wang D, Lu H, Wang H, Ruan X (2017) Amulet: aggregating multi-level convolutional features for salient object detection. In: Proceedings of the IEEE international conference on computer vision, vol. 2017-October. https:\/\/doi.org\/10.1109\/ICCV.2017.31","DOI":"10.1109\/ICCV.2017.31"},{"key":"7330_CR57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.698","author":"Z Luo","year":"2017","unstructured":"Luo Z, Mishra A, Achkar A, Eichel J, Li S, Jodoin PM (2017) Non-local deep features for salient object detection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2017.698","journal-title":"CVPR"},{"key":"7330_CR58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00326","author":"N Liu","year":"2018","unstructured":"Liu N, Han J, Yang MH (2018) PiCANet: learning pixel-wise contextual attention for saliency detection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2018.00326","journal-title":"CVPR"},{"key":"7330_CR59","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00081","author":"X Zhang","year":"2018","unstructured":"Zhang X, Wang T, Qi J, Lu H, Wang G (2018) Progressive attention guided recurrent network for salient object detection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2018.00081","journal-title":"CVPR"},{"key":"7330_CR60","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6892","author":"B Wang","year":"2020","unstructured":"Wang B, Chen Q, Zhou M, Zhang Z, Jin X, Gai K (2020) Progressive feature polishing network for salient object detection. AAAI. https:\/\/doi.org\/10.1609\/aaai.v34i07.6892","journal-title":"AAAI"},{"key":"7330_CR61","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2754941","author":"W Wang","year":"2018","unstructured":"Wang W, Shen J, Shao L (2018) Video salient object detection via fully convolutional networks. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2017.2754941","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR62","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00342","author":"G Li","year":"2018","unstructured":"Li G, Xie Y, Wei T, Wang K, Lin L (2018) Flow guided recurrent neural encoder for video salient object detection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2018.00342","journal-title":"CVPR"},{"key":"7330_CR63","doi-asserted-by":"publisher","unstructured":"Dosovitskiy A et al (2015) FlowNet: learning optical flow with convolutional networks. ICCV. https:\/\/doi.org\/10.1109\/ICCV.2015.316.","DOI":"10.1109\/ICCV.2015.316"},{"key":"7330_CR64","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6718","author":"Y Gu","year":"2020","unstructured":"Gu Y, Wang L, Wang Z, Liu Y, Cheng MM, Lu SP (2020) Pyramid constrained self-attention network for fast video salient object detection. AAAI. https:\/\/doi.org\/10.1609\/aaai.v34i07.6718","journal-title":"AAAI"},{"key":"7330_CR65","unstructured":"Zheng S et al (2020) Rethinking semantic segmentation from a sequence-to-sequence perspective with transformers. CoRR, vol. abs\/2012.15840, [Online]. Available: http:\/\/arxiv.org\/abs\/2012.15840"},{"key":"7330_CR66","doi-asserted-by":"crossref","unstructured":"Wang W et al (2021) Pyramid vision transformer: a versatile backbone for dense prediction without convolutions, [Online]. Available: http:\/\/arxiv.org\/abs\/2102.12122","DOI":"10.1109\/ICCV48922.2021.00061"},{"key":"7330_CR67","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90","author":"K He","year":"2016","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2016.90","journal-title":"CVPR"},{"key":"7330_CR68","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2815688","author":"Q Hou","year":"2019","unstructured":"Hou Q, Cheng MM, Hu X, Borji A, Tu Z, Torr PHS (2019) Deeply supervised salient object detection with short connections. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2018.2815688","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"7330_CR69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00187","author":"L Zhang","year":"2018","unstructured":"Zhang L, Dai J, Lu H, He Y, Wang G (2018) A bi-directional message passing model for salient object detection. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2018.00187","journal-title":"CVPR"},{"issue":"4","key":"7330_CR70","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang Z, Bovik AC, Sheikh HR, Simoncelli EP (2004) Image quality assessment: from error visibility to structural similarity. IEEE Trans Image Process 13(4):600\u2013612. https:\/\/doi.org\/10.1109\/TIP.2003.819861","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR71","doi-asserted-by":"publisher","unstructured":"Mattyus G, Luo W, Urtasun R (2017) DeepRoadMapper: extracting road topology from aerial images. In: Proceedings of the IEEE international conference on computer vision, vol. 2017-October. https:\/\/doi.org\/10.1109\/ICCV.2017.372","DOI":"10.1109\/ICCV.2017.372"},{"key":"7330_CR72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.404","author":"L Wang","year":"2017","unstructured":"Wang L et al (2017) Learning to detect salient objects with image-level supervision. CVPR. https:\/\/doi.org\/10.1109\/CVPR.2017.404","journal-title":"CVPR"},{"key":"7330_CR73","doi-asserted-by":"publisher","unstructured":"Brox T, Malik J (2010) Object segmentation by long term analysis of point trajectories. Lecture notes in computer science (including subseries lecture notes in artificial intelligence and lecture notes in bioinformatics), vol 6315 LNCS, no Part 5, https:\/\/doi.org\/10.1007\/978-3-642-15555-0_21","DOI":"10.1007\/978-3-642-15555-0_21"},{"key":"7330_CR74","doi-asserted-by":"publisher","unstructured":"Perazzi F, Pont-Tuset J, McWilliams B, Van Gool L, Gross M, Sorkine-Hornung A (2016) A benchmark dataset and evaluation methodology for video object segmentation. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition, vol. 2016-December. https:\/\/doi.org\/10.1109\/CVPR.2016.85.","DOI":"10.1109\/CVPR.2016.85"},{"key":"7330_CR75","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2762594","author":"J Li","year":"2018","unstructured":"Li J, Xia C, Chen X (2018) A benchmark dataset and saliency-guided stacked autoencoders for video-based salient object detection. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2017.2762594","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR76","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.273","author":"F Li","year":"2013","unstructured":"Li F, Kim T, Humayun A, Tsai D, Rehg JM (2013) Video segmentation by tracking many figure-ground segments. ICCV. https:\/\/doi.org\/10.1109\/ICCV.2013.273","journal-title":"ICCV"},{"key":"7330_CR77","doi-asserted-by":"crossref","unstructured":"Fan DP, Zhai Y, Borji A, Yang J, Shao L (2020) BBS-Net: RGB-D salient object detection with a bifurcated backbone strategy network. ECCV","DOI":"10.1007\/978-3-030-58610-2_17"},{"key":"7330_CR78","unstructured":"Kingma DP, Ba JL (2015) Adam: a method for stochastic optimization"},{"key":"7330_CR79","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2016.2631900","author":"T Xi","year":"2017","unstructured":"Xi T, Zhao W, Wang H, Lin W (2017) Salient object detection with spatiotemporal background priors for video. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2016.2631900","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR80","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2016.2595324","author":"Z Liu","year":"2017","unstructured":"Liu Z, Li J, Ye L, Sun G, Shen L (2017) Saliency Detection for unconstrained videos using superpixel-level graph and spatiotemporal propagation. IEEE Trans Circ Sys Video Technol. https:\/\/doi.org\/10.1109\/TCSVT.2016.2595324","journal-title":"IEEE Trans Circ Sys Video Technol"},{"key":"7330_CR81","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2670143","author":"C Chen","year":"2017","unstructured":"Chen C, Li S, Wang Y, Qin H, Hao A (2017) Video Saliency detection via spatial-temporal fusion and low-rank coherency diffusion. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2017.2670143","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR82","doi-asserted-by":"publisher","unstructured":"Li S, Seybold B, Vorobyov A, Lei X, Kuo CCJ (2018) Unsupervised video object segmentation with motion-based bilateral networks. Lecture notes in computer science (including subseries lecture notes in artificial intelligence and lecture notes in bioinformatics), vol 11207 LNCS, https:\/\/doi.org\/10.1007\/978-3-030-01219-9_13","DOI":"10.1007\/978-3-030-01219-9_13"},{"key":"7330_CR83","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2018.2859773","author":"Y Tang","year":"2019","unstructured":"Tang Y, Zou W, Jin Z, Chen Y, Hua Y, Li X (2019) Weakly supervised salient object detection with spatiotemporal cascade neural networks. IEEE Trans Circ Syst Video Technol. https:\/\/doi.org\/10.1109\/TCSVT.2018.2859773","journal-title":"IEEE Trans Circ Syst Video Technol"},{"key":"7330_CR84","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2018.2813165","author":"Y Chen","year":"2018","unstructured":"Chen Y, Zou W, Tang Y, Li X, Xu C, Komodakis N (2018) SCOM: spatiotemporal constrained optimization for salient object detection. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2018.2813165","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR85","doi-asserted-by":"publisher","unstructured":"Wang W et al (2019) Learning unsupervised video object segmentation through visual attention. In: Proceedings of the IEEE computer society conference on computer vision and pattern recognition, vol. 2019-June. https:\/\/doi.org\/10.1109\/CVPR.2019.00318","DOI":"10.1109\/CVPR.2019.00318"},{"key":"7330_CR86","doi-asserted-by":"crossref","unstructured":"Zhao W, Zhang J, Li L, Barnes N, Liu N, Han J (2021) Weakly supervised video salient object detection. In: Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 16826\u201316835","DOI":"10.1109\/CVPR46437.2021.01655"},{"key":"7330_CR87","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2699184","author":"LC Chen","year":"2018","unstructured":"Chen LC, Papandreou G, Kokkinos I, Murphy K, Yuille AL (2018) DeepLab: semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected CRFs. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2017.2699184","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"7330_CR88","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3049959","author":"Z Zhang","year":"2021","unstructured":"Zhang Z, Lin Z, Xu J, Da Jin W, Lu SP, Fan DP (2021) Bilateral attention network for RGB-D salient object detection. IEEE Trans Image Process. https:\/\/doi.org\/10.1109\/TIP.2021.3049959","journal-title":"IEEE Trans Image Process"},{"key":"7330_CR89","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-59725-2_26","author":"DP Fan","year":"2020","unstructured":"Fan DP et al (2020) PraNet: parallel reverse attention network for polyp segmentation. MICCAI. https:\/\/doi.org\/10.1007\/978-3-030-59725-2_26","journal-title":"MICCAI"},{"key":"7330_CR90","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3085766","author":"DP Fan","year":"2021","unstructured":"Fan DP, Ji GP, Cheng MM, Shao L (2021) Concealed object detection. IEEE Trans Pattern Anal Mach Intell. https:\/\/doi.org\/10.1109\/TPAMI.2021.3085766","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"7330_CR91","unstructured":"Howard A et al (2019) Searching for MobileNetV3, CoRR, vol. abs\/1905.02244. Available: http:\/\/arxiv.org\/abs\/1905.02244"},{"key":"7330_CR92","unstructured":"Simonyan K, Zisserman A (2015) Very deep convolutional networks for large-scale image recognition. ICLR"}],"container-title":["Neural Computing and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-022-07330-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00521-022-07330-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00521-022-07330-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,22]],"date-time":"2022-09-22T13:47:28Z","timestamp":1663854448000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00521-022-07330-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,5,20]]},"references-count":92,"journal-issue":{"issue":"19","published-print":{"date-parts":[[2022,10]]}},"alternative-id":["7330"],"URL":"https:\/\/doi.org\/10.1007\/s00521-022-07330-1","relation":{},"ISSN":["0941-0643","1433-3058"],"issn-type":[{"value":"0941-0643","type":"print"},{"value":"1433-3058","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,5,20]]},"assertion":[{"value":"26 November 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"18 April 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 May 2022","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"We declare that we have no financial and personal relationships with other people or organizations that can inappropriately influence our work, there is no professional or other personal interest of any nature or kind in any product, service and\/or company that could be construed as influencing the position presented in, or the review of, the manuscript entitled.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}