{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,9]],"date-time":"2025-11-09T03:49:20Z","timestamp":1762660160162,"version":"3.37.3"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2022,3,11]],"date-time":"2022-03-11T00:00:00Z","timestamp":1646956800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,3,11]],"date-time":"2022-03-11T00:00:00Z","timestamp":1646956800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62073140","62073141"],"award-info":[{"award-number":["62073140","62073141"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100007219","name":"Natural Science Foundation of Shanghai","doi-asserted-by":"publisher","award":["19ZR1473200"],"award-info":[{"award-number":["19ZR1473200"]}],"id":[{"id":"10.13039\/100007219","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2023,2]]},"DOI":"10.1007\/s00371-021-02362-5","type":"journal-article","created":{"date-parts":[[2022,3,11]],"date-time":"2022-03-11T16:15:59Z","timestamp":1647015359000},"page":"625-637","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["A flow-guided self-calibration Siamese network for visual tracking"],"prefix":"10.1007","volume":"39","author":[{"given":"Zhenyang","family":"Qu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9400-1415","authenticated-orcid":false,"given":"Hongbo","family":"Shi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shuai","family":"Tan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bing","family":"Song","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yang","family":"Tao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,3,11]]},"reference":[{"key":"2362_CR1","doi-asserted-by":"publisher","first-page":"993","DOI":"10.1007\/s00371-020-01848-y","volume":"37","author":"MY Abbass","year":"2021","unstructured":"Abbass, M.Y., Kwon, K.C., Kim, N., et al.: A survey on online learning for visual tracking. Vis. Comput. 37, 993\u20131014 (2021)","journal-title":"Vis. Comput."},{"key":"2362_CR2","doi-asserted-by":"crossref","unstructured":"Bertinetto, L., Valmadre, J., Golodetz, S., et al.: Staple: complementary learners for real-time tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1401\u20131409 (2016)","DOI":"10.1109\/CVPR.2016.156"},{"key":"2362_CR3","doi-asserted-by":"crossref","unstructured":"Bertinetto, L., Valmadre, J., Henriques, J. F., et al.: Fully-convolutional siamese networks for object tracking. In: European Conference on Computer Vision, pp. 850\u2013865. Springer (2016)","DOI":"10.1007\/978-3-319-48881-3_56"},{"key":"2362_CR4","doi-asserted-by":"publisher","first-page":"80","DOI":"10.1016\/j.patcog.2018.10.005","volume":"87","author":"B Chen","year":"2019","unstructured":"Chen, B., Li, P., Sun, C., et al.: Multi attention module for visual tracking. Pattern Recognit. 87, 80\u201393 (2019)","journal-title":"Pattern Recognit."},{"key":"2362_CR5","doi-asserted-by":"crossref","unstructured":"Chen, Z., Zhong, B., Li, G., et al.: Siamese box adaptive network for visual tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 6668\u20136677(2020)","DOI":"10.1109\/CVPR42600.2020.00670"},{"key":"2362_CR6","doi-asserted-by":"publisher","first-page":"74","DOI":"10.1016\/j.patrec.2018.03.009","volume":"124","author":"M Danelljan","year":"2019","unstructured":"Danelljan, M., Bhat, G., Gladh, S., et al.: Deep motion and appearance cues for visual tracking. Pattern Recognit. Lett. 124, 74\u201381 (2019)","journal-title":"Pattern Recognit. Lett."},{"key":"2362_CR7","doi-asserted-by":"crossref","unstructured":"Danelljan, M., Bhat, G., Khan, F. S., et al. Atom: accurate tracking by overlap maximization. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4660\u2013\u20134669 (2019)","DOI":"10.1109\/CVPR.2019.00479"},{"key":"2362_CR8","doi-asserted-by":"crossref","unstructured":"Danelljan, M., Bhat, G., Shahbaz Khan, F., et al.: Eco: efficient convolution operators for tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 6638\u20136646 (2017)","DOI":"10.1109\/CVPR.2017.733"},{"key":"2362_CR9","doi-asserted-by":"crossref","unstructured":"Danelljan, M., Hager, G., Shahbaz Khan, F., et al.: Learning spatially regularized correlation filters for visual tracking. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 4310\u20134318 (2015)","DOI":"10.1109\/ICCV.2015.490"},{"key":"2362_CR10","doi-asserted-by":"crossref","unstructured":"Danelljan, M., H\u00e4ger, G., Khan, F., Felsberg, M.: Accurate scale estimation for robust visual tracking. In: British Machine Vision Conference, Nottingham, September 1\u20135, 2014. BMVA Press (2014)","DOI":"10.5244\/C.28.65"},{"key":"2362_CR11","doi-asserted-by":"crossref","unstructured":"Dong, X., Shen, J.: Triplet loss in siamese network for object tracking. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 459\u2013474 (2018)","DOI":"10.1007\/978-3-030-01261-8_28"},{"key":"2362_CR12","doi-asserted-by":"crossref","unstructured":"Guo, Q., Feng, W., Zhou, C., et al.: Learning dynamic siamese network for visual object tracking. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1763\u20131771 (2017)","DOI":"10.1109\/ICCV.2017.196"},{"key":"2362_CR13","doi-asserted-by":"crossref","unstructured":"He, A., Luo, C., Tian, X., et al.: A twofold siamese network for real-time object tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4834\u20134843 (2018)","DOI":"10.1109\/CVPR.2018.00508"},{"issue":"3","key":"2362_CR14","doi-asserted-by":"publisher","first-page":"583","DOI":"10.1109\/TPAMI.2014.2345390","volume":"37","author":"JF Henriques","year":"2014","unstructured":"Henriques, J.F., Caseiro, R., Martins, P., Batista, J.: High-speed tracking with kernelized correlation filters. IEEE Trans. Pattern Anal. Mach. Intell. 37(3), 583\u2013596 (2014)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2362_CR15","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., Sun, G.: Squeeze-and-excitation networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7132\u20137141(2018)","DOI":"10.1109\/CVPR.2018.00745"},{"key":"2362_CR16","unstructured":"Huang, L., Zhao, X., Huang, K.: Got-10k: A large high-diversity benchmark for generic object tracking in the wild. IEEE Trans. Pattern Anal. Mach. Intell. (2019)."},{"key":"2362_CR17","doi-asserted-by":"crossref","unstructured":"Hui, T. W., Tangm X., Loy, C. C.: Liteflownet: A lightweight convolutional neural network for optical flow estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8981\u20138989 (2018)","DOI":"10.1109\/CVPR.2018.00936"},{"key":"2362_CR18","doi-asserted-by":"crossref","unstructured":"Kiani Galoogahi, H., Fagg, A., Lucey, S.: Learning background-aware correlation filters for visual tracking. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1135\u20131143 (2017)","DOI":"10.1109\/ICCV.2017.129"},{"key":"2362_CR19","doi-asserted-by":"publisher","first-page":"587","DOI":"10.1007\/s00371-020-01825-5","volume":"37","author":"C Li","year":"2021","unstructured":"Li, C., Lin, S., Qiao, J., et al.: Partial tracking method based on siamese network. Vis Comput 37, 587\u2013601 (2021)","journal-title":"Vis. Comput."},{"key":"2362_CR20","doi-asserted-by":"crossref","unstructured":"Li, P., Chen, B., Ouyang, W., et al.: Gradnet: gradient-guided network for visual object tracking. In: Proceedings of the IEEE International Conference on Computer Vision. pp. 6162\u20136171 (2019)","DOI":"10.1109\/ICCV.2019.00626"},{"key":"2362_CR21","doi-asserted-by":"crossref","unstructured":"Li, B., Yan, J., Wu, W., et al.: High performance visual tracking with siamese region proposal network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. pp. 8971-8980 (2018)","DOI":"10.1109\/CVPR.2018.00935"},{"key":"2362_CR22","doi-asserted-by":"crossref","unstructured":"Li, G., Xie, Y., Wei, T., et al.: Flow guided recurrent neural encoder for video salient object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3243\u20133252 (2018)","DOI":"10.1109\/CVPR.2018.00342"},{"key":"2362_CR23","doi-asserted-by":"crossref","unstructured":"Li, Y., Zhu, J.: A scale adaptive kernel correlation filter tracker with feature integration. In: European Conference on Computer Vision, pp. 254\u2013265. Springer (2014)","DOI":"10.1007\/978-3-319-16181-5_18"},{"key":"2362_CR24","doi-asserted-by":"crossref","unstructured":"Lin, T. Y., Goyal, P., Girshick, R., et al.: Focal loss for dense object detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2980\u20132988 (2017)","DOI":"10.1109\/ICCV.2017.324"},{"key":"2362_CR25","doi-asserted-by":"crossref","unstructured":"Liu, P., Yan, X., Jiang, Y., et al.: Deep flow collaborative network for online visual tracking. In: 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 2598\u20132602 (2020)","DOI":"10.1109\/ICASSP40776.2020.9054590"},{"key":"2362_CR26","doi-asserted-by":"crossref","unstructured":"Liu, J. J., Hou, Q., Cheng, M. M., et al.: Improving convolutional networks with self-calibrated convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 10096\u201310105(2020)","DOI":"10.1109\/CVPR42600.2020.01011"},{"key":"2362_CR27","doi-asserted-by":"crossref","unstructured":"Ma, S., Zhang, L., Pu, L., et al.: An adaptive model update object tracking algorithm based on densenet features. In:2020 International Conference on Networking and Network Applications (NaNA), pp. 321\u2013325 (2020)","DOI":"10.1109\/NaNA51271.2020.00062"},{"key":"2362_CR28","unstructured":"Marvasti-Zadeh, S. M., Cheng, L., Ghanei-Yakhdan, H., et al.: Deep learning for visual tracking: a comprehensive survey. IEEE Trans. Intell. Transp. Sys., 1\u201326 (2021)"},{"key":"2362_CR29","doi-asserted-by":"crossref","unstructured":"Nam, H., Han, B.: Learning multi-domain convolutional neural networks for visual tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4293\u20134302 (2016)","DOI":"10.1109\/CVPR.2016.465"},{"issue":"7","key":"2362_CR30","doi-asserted-by":"publisher","first-page":"3068","DOI":"10.1109\/TCYB.2019.2936503","volume":"50","author":"J Shen","year":"2019","unstructured":"Shen, J., Tang, X., Dong, X., et al.: Visual object tracking by hierarchical attention siamese network. IEEE Trans. Cybern. 50(7), 3068\u20133080 (2019)","journal-title":"IEEE Trans. Cybern."},{"key":"2362_CR31","doi-asserted-by":"crossref","unstructured":"Shuang, K., Huang, Y., Sun, Y., et al.: Fine-grained motion representation for template-free visual tracking. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 671\u2013680 (2020)","DOI":"10.1109\/WACV45572.2020.9093517"},{"key":"2362_CR32","doi-asserted-by":"crossref","unstructured":"Sun, S., Kuang, Z., Sheng, L., et al.: Optical flow guided feature: a fast and robust motion representation for video action recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1390\u20131399 (2018)","DOI":"10.1109\/CVPR.2018.00151"},{"key":"2362_CR33","doi-asserted-by":"crossref","unstructured":"Valmadre, J., Bertinetto, L., Henriques, J., et al.: End-to-end representation learning for correlation filter based tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. pp. 2805\u20132813 (2017)","DOI":"10.1109\/CVPR.2017.531"},{"key":"2362_CR34","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., et al.: Attention is all you need. arXiv preprint. https:\/\/arxiv.org\/abs\/1706.03762, 2017."},{"key":"2362_CR35","doi-asserted-by":"publisher","first-page":"683","DOI":"10.1007\/s00371-019-01646-1","volume":"36","author":"Y Wang","year":"2020","unstructured":"Wang, Y., Wei, X., Ding, L., et al.: A robust visual tracking method via local feature extraction and saliency detection. Vis Comput 36, 683\u2013700 (2020)","journal-title":"Vis Comput"},{"key":"2362_CR36","doi-asserted-by":"crossref","unstructured":"Wang, M., Liu, Y., Huang, Z.: Large margin object tracking with circulant feature maps. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4021\u2013\u20134029 (2017)","DOI":"10.1109\/CVPR.2017.510"},{"key":"2362_CR37","doi-asserted-by":"crossref","unstructured":"Wang, X., Girshick, R., Gupta, A., et al.: Non-local neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7794-7803(2018)","DOI":"10.1109\/CVPR.2018.00813"},{"issue":"9","key":"2362_CR38","doi-asserted-by":"publisher","first-page":"1834","DOI":"10.1109\/TPAMI.2014.2388226","volume":"37","author":"Y Wu","year":"2015","unstructured":"Wu, Y., Lim, J., Yang, M.: Object tracking benchmark. IEEE Trans. Pattern Anal. Mach. Intell. 37(9), 1834\u20131848 (2015)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2362_CR39","doi-asserted-by":"crossref","unstructured":"Wu, Y., Lim, J., Yang, M. H.: Online object tracking: a benchmark. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2411\u20132418 (2013)","DOI":"10.1109\/CVPR.2013.312"},{"key":"2362_CR40","doi-asserted-by":"crossref","unstructured":"Xu, R., Li, X., Zhou, B., et al.: Deep flow-guided video inpainting. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3723\u20133732 (2019)","DOI":"10.1109\/CVPR.2019.00384"},{"key":"2362_CR41","doi-asserted-by":"crossref","unstructured":"Yang, T., Xu, P., Hu, R., et al.: ROAM: Recurrently optimizing tracking model. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 6718\u20136727 (2020)","DOI":"10.1109\/CVPR42600.2020.00675"},{"key":"2362_CR42","doi-asserted-by":"crossref","unstructured":"Yang, S., Chen, H., Xu, F. et al. High-performance UAVs visual tracking based on siamese network. Vis. Comput. (2021).","DOI":"10.1007\/s00371-021-02271-7"},{"key":"2362_CR43","doi-asserted-by":"crossref","unstructured":"Yu, Y., Xiong, Y., Huang, W., et al.: Deformable Siamese attention networks for visual object tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 6728\u20136737 (2020)","DOI":"10.1109\/CVPR42600.2020.00676"},{"key":"2362_CR44","doi-asserted-by":"publisher","first-page":"260","DOI":"10.1016\/j.neucom.2020.11.046","volume":"436","author":"D Zhang","year":"2021","unstructured":"Zhang, D., Zheng, Z., Li, M., et al.: CSART: Channel and spatial attention-guided residual learning for real-time object tracking. Neurocomputing. 436, 260\u2013272 (2021)","journal-title":"Neurocomputing."},{"key":"2362_CR45","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Peng, H.: Deeper and wider siamese networks for real-time visual tracking. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4591\u20134600 (2019)","DOI":"10.1109\/CVPR.2019.00472"},{"key":"2362_CR46","doi-asserted-by":"crossref","unstructured":"Zhu, Z., Wu, W., Zou, W., et al.: End-to-end flow correlation tracking with spatial-temporal attention. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 548\u2013557 (2018)","DOI":"10.1109\/CVPR.2018.00064"},{"key":"2362_CR47","doi-asserted-by":"crossref","unstructured":"Zhu, X., Wang, Y., Dai, J., et al.: Flow-guided feature aggregation for video object detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 408\u2013417 (2017)","DOI":"10.1109\/ICCV.2017.52"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-021-02362-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-021-02362-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-021-02362-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,2,7]],"date-time":"2023-02-07T19:27:26Z","timestamp":1675798046000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-021-02362-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,3,11]]},"references-count":47,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2023,2]]}},"alternative-id":["2362"],"URL":"https:\/\/doi.org\/10.1007\/s00371-021-02362-5","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"type":"print","value":"0178-2789"},{"type":"electronic","value":"1432-2315"}],"subject":[],"published":{"date-parts":[[2022,3,11]]},"assertion":[{"value":"10 November 2021","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 March 2022","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflicts of interest."}}]}}