{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T09:47:05Z","timestamp":1774000025555,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":79,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,12,12]]},"DOI":"10.1145\/3788149.3788209","type":"proceedings-article","created":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T06:35:19Z","timestamp":1773988519000},"page":"285-292","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["A Survey of Adversarial Attacks on Visible-Infrared Object Tracking: Foundation Models and Cross-Modal Security Challenges"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7511-2910","authenticated-orcid":false,"given":"Haoqi","family":"Gao","sequence":"first","affiliation":[{"name":"College of Electronic Engineering National University of Defense, HeiFei, ANHUI, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-3383-9654","authenticated-orcid":false,"given":"Qinghua","family":"Dai","sequence":"additional","affiliation":[{"name":"College of Electronic EngineeringNational University of Defense Technology, HeiFei, ANHUI, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-9942-7540","authenticated-orcid":false,"given":"WenHao","family":"Xu","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering National University of Defense, HeiFei, ANHUI, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-7581-9897","authenticated-orcid":false,"given":"Yangyang","family":"Wang","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering National University of Defense, HeiFei, ANHUI, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-6388-0875","authenticated-orcid":false,"given":"Zhenyu","family":"Liang","sequence":"additional","affiliation":[{"name":"College of Electronic Engineering National University of Defense, HeiFei, ANHUI, China"}]}],"member":"320","published-online":{"date-parts":[[2026,3,19]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"crossref","unstructured":"Y. Wu J. Lim and M.-H. Yang \u201cObject tracking benchmark \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence vol. 37 no. 9 pp. 1834\u20131848 2015.","DOI":"10.1109\/TPAMI.2014.2388226"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"crossref","unstructured":"B. Li W. Wu Q. Wang et al. \u201cSiamRPN++: Evolution of siamese visual tracking with very deep networks \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2019 pp. 4282\u20134291.","DOI":"10.1109\/CVPR.2019.00441"},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"crossref","unstructured":"X. Chen B. Yan J. Zhu et al. \u201cTransformer tracking \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2021 pp. 8126\u20138135.","DOI":"10.1109\/CVPR46437.2021.00803"},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"crossref","unstructured":"X. Zhang P. Ye H. Leung et al. \u201cObject fusion tracking based on visible and infrared images: A comprehensive review \u201d Information Fusion vol. 63 pp. 166\u2013187 2020.","DOI":"10.1016\/j.inffus.2020.05.002"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"crossref","unstructured":"Y. Liu C. Xu J. Li et al. \u201cMulti-modal fusion for end-to-end visual object tracking \u201d IEEE Transactions on Image Processing vol. 29 pp. 7347\u20137358 2020.","DOI":"10.1109\/TIP.2019.2959249"},{"key":"e_1_3_3_1_7_2","unstructured":"C. Szegedy W. Zaremba I. Sutskever et al. \u201cIntriguing properties of neural networks \u201d in International Conference on Learning Representations 2014."},{"key":"e_1_3_3_1_8_2","unstructured":"I. J. Goodfellow J. Shlens and C. Szegedy \u201cExplaining and harnessing adversarial examples \u201d in International Conference on Learning Representations 2015."},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"crossref","unstructured":"Q. Guo X. Xie F. Juefei-Xu et al. \u201cSPARK: Spatial-aware online incremental attack against visual tracking \u201d in European Conference on Computer Vision 2020 pp. 202\u2013219.","DOI":"10.1007\/978-3-030-58595-2_13"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"crossref","unstructured":"C. Ma J.-B. Huang X. Yang and M.-H. Yang \u201cHierarchical convolutional features for visual tracking \u201d in Proceedings of the IEEE International Conference on Computer Vision 2015 pp. 3074-3082.","DOI":"10.1109\/ICCV.2015.352"},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"crossref","unstructured":"M. Danelljan G. H\u00e4ger F. S. Khan and M. Felsberg \u201cLearning spatially regularized correlation filters for visual tracking \u201d in Proceedings of the IEEE International Conference on Computer Vision 2015 pp. 4310-4318.","DOI":"10.1109\/ICCV.2015.490"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"crossref","unstructured":"M. Danelljan A. Robinson F. S. Khan and M. Felsberg \u201cBeyond correlation filters: Learning continuous convolution operators for visual tracking \u201d in European Conference on Computer Vision 2016 pp. 472-488.","DOI":"10.1007\/978-3-319-46454-1_29"},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"crossref","unstructured":"M. Danelljan G. Bhat F. S. Khan and M. Felsberg \u201cECO: Efficient convolution operators for tracking \u201d in Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition 2017 pp. 6638-6646.","DOI":"10.1109\/CVPR.2017.733"},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"crossref","unstructured":"L. Bertinetto J. Valmadre J. F. Henriques et al. \u201cFully-convolutional Siamese networks for object tracking \u201d in European Conference on Computer Vision 2016 pp. 850-865.","DOI":"10.1007\/978-3-319-48881-3_56"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"crossref","unstructured":"B. Li J. Yan W. Wu et al. \u201cHigh performance visual tracking with Siamese region proposal network \u201d in Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition 2018 pp. 8971-8980.","DOI":"10.1109\/CVPR.2018.00935"},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"crossref","unstructured":"Z. Chen B. Zhong G. Li et al. \u201cSiamese box adaptive network for visual tracking \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2020 pp. 6668-6677.","DOI":"10.1109\/CVPR42600.2020.00670"},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"crossref","unstructured":"Y. Xu Z. Wang Z. Li et al. \u201cSiamFC++: Towards robust and accurate visual tracking with target estimation guidelines \u201d in Proceedings of the AAAI Conference on Artificial Intelligence 2020 pp. 12549-12556.","DOI":"10.1609\/aaai.v34i07.6944"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"crossref","unstructured":"Z. Song J. Yu Y.-P. P. Chen and W. Yang \u201cTransformer tracking with cyclic shifting window attention \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2022 pp. 8791-8800.","DOI":"10.1109\/CVPR52688.2022.00859"},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"crossref","unstructured":"X. Chen H. Peng D. Wang et al. \u201cSeqtrack: Sequence to sequence learning for visual object tracking \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2023 pp. 14572-14581.","DOI":"10.1109\/CVPR52729.2023.01400"},{"key":"e_1_3_3_1_20_2","unstructured":"Z. Wang L. Liu Y. Li et al. \u201cTrackGPT: Generative pre-trained transformer for zero-shot object tracking \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence 2023."},{"key":"e_1_3_3_1_21_2","unstructured":"Y. Liu C. Zhang Z. Wang et al. \u201cVL-Tracker: Vision-language modeling for few-shot object tracking \u201d in Proceedings of the IEEE\/CVF International Conference on Computer Vision 2023 pp. 15423-15433."},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"crossref","unstructured":"H. Zhang L. Yang Z. Liu et al. \u201cDistillTrack: Knowledge distillation for efficient visual tracking \u201d IEEE Transactions on Image Processing vol. 32 pp. 4567-4579 2023.","DOI":"10.1109\/TIP.2022.3228162"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"crossref","unstructured":"L. Zhang A. Gonzalez-Garcia J. van de Weijer et al. \u201cSynthetic data generation for end-to-end thermal infrared tracking \u201d IEEE Transactions on Image Processing vol. 28 no. 4 pp. 1837-1850 2018.","DOI":"10.1109\/TIP.2018.2879249"},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"crossref","unstructured":"P. Gao Y. Ma K. Song C. Li and J. Yang \u201cLarge margin structured convolution operator for thermal infrared object tracking \u201d in 2018 24th International Conference on Pattern Recognition (ICPR) 2018 pp. 2380-2385.","DOI":"10.1109\/ICPR.2018.8545716"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"crossref","unstructured":"R. Chen S. Liu Z. Miao et al. \u201cGFSNet: Generalization-friendly Siamese network for thermal infrared object tracking \u201d Infrared Physics & Technology vol. 123 p. 104190 2022.","DOI":"10.1016\/j.infrared.2022.104190"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"crossref","unstructured":"T. Yao J. Hu B. Zhang et al. \u201cScale and appearance variation enhanced Siamese network for thermal infrared target tracking \u201d Infrared Physics & Technology vol. 117 p. 103825 2021.","DOI":"10.1016\/j.infrared.2021.103825"},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"crossref","unstructured":"Y. Huang Y. He R. Lu et al. \u201cThermal infrared object tracking via unsupervised deep correlation filters \u201d Digital Signal Processing vol. 123 p. 103432 2022.","DOI":"10.1016\/j.dsp.2022.103432"},{"key":"e_1_3_3_1_28_2","unstructured":"T. Xu Y. Tang F. Xu et al. \u201cOSFormer: One-step transformer for infrared video small object detection \u201d IEEE Transactions on Image Processing vol. 32 pp. 1234-1245 2023."},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"crossref","unstructured":"M. Danelljan G. Bhat F. S. Khan and M. Felsberg \u201cATOM: Accurate tracking by overlap maximization \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2019 pp. 4660-4669.","DOI":"10.1109\/CVPR.2019.00479"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"crossref","unstructured":"G. Bhat M. Danelljan L. Van Gool et al. \u201cLearning discriminative model prediction for tracking \u201d in Proceedings of the IEEE\/CVF International Conference on Computer Vision 2019 pp. 6182-6191.","DOI":"10.1109\/ICCV.2019.00628"},{"key":"e_1_3_3_1_31_2","unstructured":"K. Zhou Y. Wang Z. Liu et al. \u201cThermalVLM: Vision-language foundation model for thermal infrared understanding \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence 2024."},{"key":"e_1_3_3_1_32_2","unstructured":"S. Wang Z. Li X. Zhang et al. \u201cCrossTrack: Cross-modal transfer learning for infrared object tracking \u201d International Journal of Computer Vision 2024."},{"key":"e_1_3_3_1_33_2","unstructured":"J. Liu W. Zhang H. Zhao et al. \u201cHybridTrack: Combining transformers with correlation filters for efficient thermal tracking \u201d IEEE Transactions on Image Processing 2024."},{"key":"e_1_3_3_1_34_2","unstructured":"Y. Zhang X. Wang Z. Li et al. \u201cAPFNet: Asynchronous polarization fusion network for RGB-T tracking \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence vol. 45 no. 8 pp. 10234-10248 2023."},{"key":"e_1_3_3_1_35_2","unstructured":"X. Liu Y. Chen Z. Wang et al. \u201cDIDT: Differentiable indexing and dynamic transformation for multimodal tracking \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2023 pp. 15432-15442."},{"key":"e_1_3_3_1_36_2","unstructured":"Z. Wang K. Zhang L. Liu et al. \u201cMGFN: Multimodal graph fusion network for robust visual tracking \u201d International Journal of Computer Vision vol. 131 no. 6 pp. 1456-1472 2023."},{"key":"e_1_3_3_1_37_2","unstructured":"Y. Zhang W. Liu X. Chen et al. \u201cCMPA: Cross-modal perceptual attention for RGB-T tracking \u201d IEEE Transactions on Image Processing vol. 31 pp. 4567-4579 2022."},{"key":"e_1_3_3_1_38_2","unstructured":"Z. Wang Y. Liu X. Li et al. \u201cmfanet: Modal feature alignment network for RGB-thermal object tracking \u201d IEEE Transactions on Circuits and Systems for Video Technology vol. 31 no. 4 pp. 1582-1595 2020."},{"key":"e_1_3_3_1_39_2","unstructured":"Y. Chen H. Wang Z. Liu et al. \u201cUniTrack: A unified foundation model for multimodal visual object tracking \u201d in Conference on Neural Information Processing Systems 2024."},{"key":"e_1_3_3_1_40_2","unstructured":"R. Wang L. Yang Z. Chen et al. \u201cTrackDiffusion: Boosting multimodal tracking with denoising diffusion probabilistic models \u201d in International Conference on Machine Learning 2024 pp. 23456-23468."},{"key":"e_1_3_3_1_41_2","unstructured":"J. Liu C. Zhang Y. Wang et al. \u201cVLFusion: Vision-language guided fusion for interactive multimodal tracking \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence 2024."},{"key":"e_1_3_3_1_42_2","unstructured":"Q. Guo X. Xie F. Juefei-Xu et al. \u201cFAN: Fast adversarial attack network for real-time visual tracking \u201d in Proceedings of the European Conference on Computer Vision 2020 pp. 324-341."},{"key":"e_1_3_3_1_43_2","unstructured":"X. Wu X. Wang X. Zhou and W. Liu \u201cSTA: Adversarial attacks on Siamese trackers \u201d in Proceedings of the IEEE\/CVF International Conference on Computer Vision 2019 pp. 4832-4841."},{"key":"e_1_3_3_1_44_2","doi-asserted-by":"crossref","unstructured":"R. R. Wiyatno A. Xu and A. D. Brown \u201cPhysical adversarial textures that fool visual object tracking \u201d in Proceedings of the IEEE\/CVF International Conference on Computer Vision 2019 pp. 4822-4831.","DOI":"10.1109\/ICCV.2019.00492"},{"key":"e_1_3_3_1_45_2","doi-asserted-by":"crossref","unstructured":"S. Jia Y. Song C. Ma and X. Yang \u201cRobust tracking against adversarial attacks \u201d in European Conference on Computer Vision 2020 pp. 69-84.","DOI":"10.1007\/978-3-030-58529-7_5"},{"key":"e_1_3_3_1_46_2","doi-asserted-by":"crossref","unstructured":"S. Liang X. Wei S. Yao and X. Li \u201cEfficient adversarial attacks for visual object tracking \u201d in European Conference on Computer Vision 2020 pp. 34-50.","DOI":"10.1007\/978-3-030-58574-7_3"},{"key":"e_1_3_3_1_47_2","doi-asserted-by":"crossref","unstructured":"Q. Guo Z. Cheng F. Juefei-Xu and Y. Liu \u201cLearning to adversarially blur visual object tracking \u201d in Proceedings of the IEEE\/CVF International Conference on Computer Vision 2021 pp. 10839-10848.","DOI":"10.1109\/ICCV48922.2021.01066"},{"key":"e_1_3_3_1_48_2","doi-asserted-by":"crossref","unstructured":"X. Chen X. Yan F. Zheng et al. \u201cOne-shot adversarial attacks on visual tracking with dual attention \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2020 pp. 10176-10185.","DOI":"10.1109\/CVPR42600.2020.01019"},{"key":"e_1_3_3_1_49_2","unstructured":"A. Aich S. Li C. Song and M. S. Asif \u201cLeveraging local patch differences in multi-object scenes for generative adversarial attacks \u201d in Proceedings of the European Conference on Computer Vision 2022 pp. 456-472."},{"key":"e_1_3_3_1_50_2","unstructured":"S. Jia Y. Wang C. Ma and X. Yang \u201cUniversal sparse adversarial examples for visual object tracking \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence vol. 45 no. 3 pp. 2345-2358 2022."},{"key":"e_1_3_3_1_51_2","unstructured":"X. Chen Y. Wang Z. Liu et al. \u201cPromptAttack: Adversarial prompting for vision-language tracking models \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2024 pp. 15423-15433."},{"key":"e_1_3_3_1_52_2","unstructured":"M. Li Y. Zhang Z. Wang and X. Huang \u201cOn the robustness of large foundation models in visual tracking \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence 2024."},{"key":"e_1_3_3_1_53_2","doi-asserted-by":"crossref","unstructured":"X. Zhu X. Li J. Li et al. \u201cFooling thermal infrared pedestrian detectors in real world using small bulbs \u201d in Proceedings of the AAAI Conference on Artificial Intelligence 2021 pp. 3616-3624.","DOI":"10.1609\/aaai.v35i4.16477"},{"key":"e_1_3_3_1_54_2","doi-asserted-by":"crossref","unstructured":"X. Zhu Z. Hu S. Huang et al. \u201cInfrared invisible clothing: Hiding from infrared detectors at multiple angles in real world \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2022 pp. 13317-13326.","DOI":"10.1109\/CVPR52688.2022.01296"},{"key":"e_1_3_3_1_55_2","doi-asserted-by":"crossref","unstructured":"H. Wei Z. Wang X. Jia et al. \u201cHotcold block: Fooling thermal infrared detectors with a novel wearable design \u201d in Proceedings of the AAAI Conference on Artificial Intelligence 2022 pp. 15233-15241.","DOI":"10.1609\/aaai.v37i12.26777"},{"key":"e_1_3_3_1_56_2","doi-asserted-by":"crossref","unstructured":"X. Wei J. Yu Y. Huang and S. Satoh \u201cPhysically adversarial infrared patches with learnable shapes and locations \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2023 pp. 12334-12342.","DOI":"10.1109\/CVPR52729.2023.01187"},{"key":"e_1_3_3_1_57_2","doi-asserted-by":"crossref","unstructured":"X. Zhu Z. Hu S. Huang et al. \u201cHiding from infrared detectors in real world with adversarial clothes \u201d Applied Intelligence vol. 53 no. 15 pp. 18945-18963 2023.","DOI":"10.1007\/s10489-023-05102-5"},{"key":"e_1_3_3_1_58_2","unstructured":"X. Wei Y. Huang J. Zhang and Z. Wang \u201cThermalPromptAttack: Physical adversarial attacks against thermal vision-language models \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2024."},{"key":"e_1_3_3_1_59_2","unstructured":"L. Zhang Y. Wang Z. Liu and X. Chen \u201cDefending large vision-language models in thermal infrared tracking \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence 2024."},{"key":"e_1_3_3_1_60_2","unstructured":"Y. Liu Z. Wang X. Li et al. \u201cCross-modal universal adversarial patch for visible-infrared object detection \u201d in Proceedings of the IEEE\/CVF International Conference on Computer Vision 2023 pp. 15445-15455."},{"key":"e_1_3_3_1_61_2","unstructured":"H. Li Y. Yang X. Wang et al. \u201cShiftAttack: A unified adversarial framework for object detection via confidence manipulation \u201d IEEE Transactions on Image Processing vol. 32 pp. 4567-4579 2023."},{"key":"e_1_3_3_1_62_2","unstructured":"T. Jiang J. Sun W. Zhou Z. Gong and X. Zhang \u201cBox-spoofing attack against single object tracking \u201d Applied Intelligence vol. 53 no. 8 pp. 9876-9890 2023."},{"key":"e_1_3_3_1_63_2","unstructured":"Y. Li H. Zhong X. Ma and J. Li \u201cFew-shot backdoor attacks on visual object tracking \u201d in Proceedings of the European Conference on Computer Vision 2022 pp. 345-362."},{"key":"e_1_3_3_1_64_2","unstructured":"M. Kristan A. Leonardis J. Matas et al. \u201cThe sixth visual object tracking VOT2018 challenge results \u201d in Proceedings of the European Conference on Computer Vision Workshops 2018 pp. 3-53."},{"key":"e_1_3_3_1_65_2","unstructured":"M. Kristan J. Matas A. Leonardis et al. \u201cThe seventh visual object tracking VOT2019 challenge results \u201d in Proceedings of the IEEE\/CVF International Conference on Computer Vision 2019 pp. 2206-2241."},{"key":"e_1_3_3_1_66_2","doi-asserted-by":"crossref","unstructured":"M. Mueller N. Smith and B. Ghanem \u201cA benchmark and simulator for UAV tracking \u201d in Proceedings of the European Conference on Computer Vision 2016 pp. 445-461.","DOI":"10.1007\/978-3-319-46448-0_27"},{"key":"e_1_3_3_1_67_2","doi-asserted-by":"crossref","unstructured":"L. Huang X. Zhao and K. Huang \u201cGOT-10k: A large high-diversity benchmark for generic object tracking in the wild \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence vol. 43 no. 5 pp. 1562-1577 2021.","DOI":"10.1109\/TPAMI.2019.2957464"},{"key":"e_1_3_3_1_68_2","doi-asserted-by":"crossref","unstructured":"H. Fan L. Lin F. Yang and P. Chu \u201cLaSOT: A high-quality benchmark for large-scale single object tracking \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2019 pp. 5374-5383.","DOI":"10.1109\/CVPR.2019.00552"},{"key":"e_1_3_3_1_69_2","unstructured":"Z. Liu Y. Wang J. Li et al. \u201cInfraredUAV: A large-scale benchmark for infrared video tracking \u201d IEEE Transactions on Geoscience and Remote Sensing vol. 59 no. 12 pp. 10415-10428 2021."},{"key":"e_1_3_3_1_70_2","unstructured":"Y. Wang Z. Liu X. Wang et al. \u201cAntiUAV: A large-scale benchmark for UAV tracking in complex scenarios \u201d IEEE Transactions on Cybernetics vol. 52 no. 10 pp. 10945-10958 2021."},{"key":"e_1_3_3_1_71_2","unstructured":"X. Chen Y. Wang Z. Liu et al. \u201cUAVSwarm: A large-scale benchmark for multi-object tracking in UAV videos \u201d IEEE Transactions on Pattern Analysis and Machine Intelligence vol. 45 no. 3 pp. 3456-3470 2022."},{"key":"e_1_3_3_1_72_2","unstructured":"Y. Liu C. Xu J. Li et al. \u201cVSOT: A large-scale benchmark for visible-infrared object tracking \u201d International Journal of Computer Vision vol. 130 no. 8 pp. 2045-2063 2022."},{"key":"e_1_3_3_1_73_2","doi-asserted-by":"crossref","unstructured":"Y. Wu J. Lim and M.-H. Yang \u201cOnline object tracking: A benchmark \u201d in Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition 2013 pp. 2411-2418.","DOI":"10.1109\/CVPR.2013.312"},{"key":"e_1_3_3_1_74_2","doi-asserted-by":"crossref","unstructured":"B. Yan D. Wang H. Lu and R. Yang \u201cCooling-shrinking attack: Blinding the tracker with imperceptible noises \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2020 pp. 990-999.","DOI":"10.1109\/CVPR42600.2020.00107"},{"key":"e_1_3_3_1_75_2","doi-asserted-by":"crossref","unstructured":"X. Chen B. Yan J. Zhu et al. \u201cTransformer tracking \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2021 pp. 8126-8135.","DOI":"10.1109\/CVPR46437.2021.00803"},{"key":"e_1_3_3_1_76_2","unstructured":"Y. Zhang P. Ye H. Leung et al. \u201cRGBT234: A large-scale benchmark for RGB-T tracking \u201d IEEE Transactions on Image Processing vol. 29 pp. 5678-5691 2020."},{"key":"e_1_3_3_1_77_2","unstructured":"Y. Liu C. Xu J. Li et al. \u201cVSOT: A large-scale visible-infrared single object tracking benchmark \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2022 pp. 15432-15441."},{"key":"e_1_3_3_1_78_2","doi-asserted-by":"crossref","unstructured":"S. Jia Y. Song C. Ma and X. Yang \u201cIoU attack: Towards temporally coherent black-box adversarial attack for visual object tracking \u201d in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition 2021 pp. 6709-6718.","DOI":"10.1109\/CVPR46437.2021.00664"},{"key":"e_1_3_3_1_79_2","doi-asserted-by":"crossref","unstructured":"X. Xiang Q. Yan H. Zhang and J. Ma \u201cACAttack: Adaptive Cross Attacking RGB-T Tracker via Multi-Modal Response Decoupling \u201d in IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) 2025 pp. 22099-22108.","DOI":"10.1109\/CVPR52734.2025.02058"},{"key":"e_1_3_3_1_80_2","doi-asserted-by":"crossref","unstructured":"Z. Li W. Zhimin and Y. Wang \u201cMulti-view Feature Discrepancy Attack for Single Object Tracking \u201d in IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP) 2025 pp. 1-5.","DOI":"10.1109\/ICASSP49660.2025.10889698"}],"event":{"name":"CSAI 2025: 2025 The 9th International Conference on Computer Science and Artificial Intelligence","location":"Beijing China","acronym":"CSAI 2025"},"container-title":["Proceedings of the 2025 9th International Conference on Computer Science and Artificial Intelligence"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3788149.3788209","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T06:36:13Z","timestamp":1773988573000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3788149.3788209"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,12]]},"references-count":79,"alternative-id":["10.1145\/3788149.3788209","10.1145\/3788149"],"URL":"https:\/\/doi.org\/10.1145\/3788149.3788209","relation":{},"subject":[],"published":{"date-parts":[[2025,12,12]]},"assertion":[{"value":"2026-03-19","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}