{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T09:29:12Z","timestamp":1780392552367,"version":"3.54.1"},"publisher-location":"Singapore","reference-count":75,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819609000","type":"print"},{"value":"9789819609017","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,12,8]],"date-time":"2024-12-08T00:00:00Z","timestamp":1733616000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,12,8]],"date-time":"2024-12-08T00:00:00Z","timestamp":1733616000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-96-0901-7_28","type":"book-chapter","created":{"date-parts":[[2024,12,7]],"date-time":"2024-12-07T07:53:49Z","timestamp":1733558029000},"page":"483-500","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":38,"title":["BootsTAP: Bootstrapped Training for\u00a0Tracking-Any-Point"],"prefix":"10.1007","author":[{"given":"Carl","family":"Doersch","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Pauline","family":"Luc","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yi","family":"Yang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Dilara","family":"Gokay","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Skanda","family":"Koppula","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ankush","family":"Gupta","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Joseph","family":"Heyward","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ignacio","family":"Rocco","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Ross","family":"Goroshin","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jo\u00e3o","family":"Carreira","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Andrew","family":"Zisserman","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2024,12,8]]},"reference":[{"key":"28_CR1","doi-asserted-by":"crossref","unstructured":"Balasingam, A., Chandler, J., Li, C., Zhang, Z., Balakrishnan, H.: Drivetrack: A benchmark for long-range point tracking in real-world videos. arXiv preprint arXiv:2312.09523 (2023)","DOI":"10.1109\/CVPR52733.2024.02122"},{"key":"28_CR2","doi-asserted-by":"crossref","unstructured":"Bharadhwaj, H., Mottaghi, R., Gupta, A., Tulsiani, S.: Track2Act: Predicting point tracks from internet videos enables diverse zero-shot robot manipulation. arXiv preprint arXiv:2405.01527 (2024)","DOI":"10.1007\/978-3-031-73116-7_18"},{"key":"28_CR3","unstructured":"Bian, W., Huang, Z., Shi, X., Dong, Y., Li, Y., Li, H.: Context-pips: Persistent independent particles demands context features. NeurIPS (2024)"},{"key":"28_CR4","doi-asserted-by":"crossref","unstructured":"Bian, Z., Jabri, A., Efros, A.A., Owens, A.: Learning pixel trajectories with multiscale contrastive random walks. In: Proc. CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00640"},{"key":"28_CR5","doi-asserted-by":"crossref","unstructured":"Boreczky, J.S., Rowe, L.A.: Comparison of video shot boundary detection techniques. Journal of Electronic Imaging 5(2), 122\u2013128 (1996)","DOI":"10.1117\/12.238675"},{"key":"28_CR6","unstructured":"Bousmalis, K., Vezzani, G., Rao, D., Devin, C., Lee, A.X., Bauza, M., Davchev, T., Zhou, Y., Gupta, A., Raju, A., et\u00a0al.: Robocat: A self-improving foundation agent for robotic manipulation. arXiv preprint arXiv:2306.11706 (2023)"},{"key":"28_CR7","doi-asserted-by":"crossref","unstructured":"Carreira, J., Zisserman, A.: Quo vadis, action recognition? a new model and the kinetics dataset. In: Proc. CVPR. pp. 6299\u20136308 (2017)","DOI":"10.1109\/CVPR.2017.502"},{"key":"28_CR8","doi-asserted-by":"crossref","unstructured":"Chen, W., Chen, L., Wang, R., Pollefeys, M.: Leap-vo: Long-term effective any point tracking for visual odometry. arXiv preprint arXiv:2401.01887 (2024)","DOI":"10.1109\/CVPR52733.2024.01876"},{"key":"28_CR9","doi-asserted-by":"crossref","unstructured":"Dekel, T., Rubinstein, M., Liu, C., Freeman, W.T.: On the effectiveness of visible watermarks. In: Proc. CVPR (2017)","DOI":"10.1109\/CVPR.2017.726"},{"key":"28_CR10","doi-asserted-by":"crossref","unstructured":"Denil, M., Bazzani, L., Larochelle, H., de Freitas, N.: Learning where to attend with deep architectures for image tracking. Neural computation 24(8), 2151\u20132184 (2012)","DOI":"10.1162\/NECO_a_00312"},{"key":"28_CR11","doi-asserted-by":"crossref","unstructured":"Doersch, C., Gupta, A., Efros, A.A.: Unsupervised visual representation learning by context prediction. In: Proc. ICCV (2015)","DOI":"10.1109\/ICCV.2015.167"},{"key":"28_CR12","unstructured":"Doersch, C., Gupta, A., Markeeva, L., Recasens, A., Smaira, L., Aytar, Y., Carreira, J., Zisserman, A., Yang, Y.: TAP-Vid: A benchmark for tracking any point in a video. NeurIPS (2022)"},{"key":"28_CR13","doi-asserted-by":"crossref","unstructured":"Doersch, C., Yang, Y., Vecerik, M., Gokay, D., Gupta, A., Aytar, Y., Carreira, J., Zisserman, A.: TAPIR: Tracking any point with per-frame initialization and temporal refinement. arXiv preprint arXiv:2306.08637 (2023)","DOI":"10.1109\/ICCV51070.2023.00923"},{"key":"28_CR14","doi-asserted-by":"crossref","unstructured":"Doersch, C., Zisserman, A.: Multi-task self-supervised visual learning. In: Proc. ICCV (2017)","DOI":"10.1109\/ICCV.2017.226"},{"key":"28_CR15","doi-asserted-by":"crossref","unstructured":"F\u00f6ldi\u00e1k, P.: Learning invariance from transformation sequences. Neural computation 3(2), 194\u2013200 (1991)","DOI":"10.1162\/neco.1991.3.2.194"},{"key":"28_CR16","doi-asserted-by":"crossref","unstructured":"Goroshin, R., Bruna, J., Tompson, J., Eigen, D., LeCun, Y.: Unsupervised learning of spatiotemporally coherent metrics. In: Proc. ICCV (2015)","DOI":"10.1109\/ICCV.2015.465"},{"key":"28_CR17","unstructured":"Goroshin, R., Mathieu, M.F., LeCun, Y.: Learning to linearize under uncertainty. NeurIPS (2015)"},{"key":"28_CR18","unstructured":"Goyal, P., Doll\u00e1r, P., Girshick, R., Noordhuis, P., Wesolowski, L., Kyrola, A., Tulloch, A., Jia, Y., He, K.: Accurate, large minibatch SGD: Training imagenet in 1 hour. arXiv preprint arXiv:1706.02677 (2017)"},{"key":"28_CR19","doi-asserted-by":"crossref","unstructured":"Greff, K., Belletti, F., Beyer, L., Doersch, C., Du, Y., Duckworth, D., Fleet, D.J., Gnanapragasam, D., Golemo, F., Herrmann, C., et\u00a0al.: Kubric: A scalable dataset generator. In: Proc. CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00373"},{"key":"28_CR20","unstructured":"Grill, J.B., Strub, F., Altch\u00e9, F., Tallec, C., Richemond, P., Buchatskaya, E., Doersch, C., Avila\u00a0Pires, B., Guo, Z., Gheshlaghi\u00a0Azar, M., et\u00a0al.: Bootstrap your own latent - a new approach to self-supervised learning. In: NeurIPS (2020)"},{"key":"28_CR21","unstructured":"Hadsell, R., Chopra, S., LeCun, Y.: Dimensionality reduction by learning an invariant mapping. In: Proc. CVPR (2006)"},{"key":"28_CR22","doi-asserted-by":"crossref","unstructured":"Harley, A.W., Fang, Z., Fragkiadaki, K.: Particle video revisited: Tracking through occlusions using point trajectories. In: Proc. ECCV (2022)","DOI":"10.1007\/978-3-031-20047-2_4"},{"key":"28_CR23","doi-asserted-by":"crossref","unstructured":"Huang, H.P., Herrmann, C., Hur, J., Lu, E., Sargent, K., Stone, A., Yang, M.H., Sun, D.: Self-supervised autoflow. In: Proc. CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.01098"},{"key":"28_CR24","doi-asserted-by":"crossref","unstructured":"Im, W., Lee, S., Yoon, S.E.: Semi-supervised learning of optical flow by flow supervisor. In: Proc. ECCV (2022)","DOI":"10.1007\/978-3-031-19833-5_18"},{"key":"28_CR25","unstructured":"Jabri, A., Owens, A., Efros, A.: Space-time correspondence as a contrastive random walk. NeurIPS 33, 19545\u201319560 (2020)"},{"key":"28_CR26","doi-asserted-by":"crossref","unstructured":"Janai, J., Guney, F., Ranjan, A., Black, M., Geiger, A.: Unsupervised learning of multi-frame optical flow with occlusions. In: Proc. ECCV (2018)","DOI":"10.1007\/978-3-030-01270-0_42"},{"key":"28_CR27","doi-asserted-by":"crossref","unstructured":"Janai, J., Guney, F., Wulff, J., Black, M.J., Geiger, A.: Slow flow: Exploiting high-speed cameras for accurate and diverse optical flow reference data. In: Proc. CVPR (2017)","DOI":"10.1109\/CVPR.2017.154"},{"key":"28_CR28","doi-asserted-by":"crossref","unstructured":"Jiang, W., Trulls, E., Hosang, J., Tagliasacchi, A., Yi, K.M.: COTR: Correspondence transformer for matching across images. In: Proc. ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00615"},{"key":"28_CR29","doi-asserted-by":"crossref","unstructured":"Karaev, N., Rocco, I., Graham, B., Neverova, N., Vedaldi, A., Rupprecht, C.: CoTracker: It is better to track together. arXiv preprint arXiv:2307.07635 (2023)","DOI":"10.1007\/978-3-031-73033-7_2"},{"key":"28_CR30","unstructured":"Lai, W.S., Huang, J.B., Yang, M.H.: Semi-supervised learning for optical flow with generative adversarial networks (2017)"},{"key":"28_CR31","doi-asserted-by":"crossref","unstructured":"Lai, Z., Lu, E., Xie, W.: MAST: A memory-augmented self-supervised tracker. In: Proc. CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00651"},{"key":"28_CR32","unstructured":"Lai, Z., Xie, W.: Self-supervised learning for video correspondence flow. arXiv preprint arXiv:1905.00875 (2019)"},{"key":"28_CR33","doi-asserted-by":"crossref","unstructured":"Li, R., Zhou, S., Liu, D.: Learning fine-grained features for pixel-wise video correspondences. In: Proc. ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.00883"},{"key":"28_CR34","unstructured":"Liu, B., Zhu, Y., Gao, C., Feng, Y., Liu, Q., Zhu, Y., Stone, P.: Libero: Benchmarking knowledge transfer for lifelong robot learning. NeurIPS 36 (2024)"},{"key":"28_CR35","doi-asserted-by":"crossref","unstructured":"Liu, L., Zhang, J., He, R., Liu, Y., Wang, Y., Tai, Y., Luo, D., Wang, C., Li, J., Huang, F.: Learning by analogy: Reliable supervision from transformations for unsupervised optical flow estimation. In: Proc. CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00652"},{"key":"28_CR36","doi-asserted-by":"crossref","unstructured":"Liu, P., King, I., Lyu, M.R., Xu, J.: Ddflow: Learning optical flow with unlabeled data distillation. In: Proceedings of the AAAI conference on artificial intelligence. vol.\u00a033, pp. 8770\u20138777 (2019)","DOI":"10.1609\/aaai.v33i01.33018770"},{"key":"28_CR37","doi-asserted-by":"crossref","unstructured":"Liu, P., Lyu, M., King, I., Xu, J.: Selflow: Self-supervised learning of optical flow. In: Proc. CVPR (2019)","DOI":"10.1109\/CVPR.2019.00470"},{"key":"28_CR38","doi-asserted-by":"crossref","unstructured":"Liu, P., Lyu, M.R., King, I., Xu, J.: Learning by distillation: a self-supervised learning framework for optical flow estimation. IEEE PAMI 44(9), 5026\u20135041 (2021)","DOI":"10.1109\/TPAMI.2021.3085525"},{"key":"28_CR39","doi-asserted-by":"crossref","unstructured":"Marsal, R., Chabot, F., Loesch, A., Sahbi, H.: Brightflow: Brightness-change-aware unsupervised learning of optical flow. In: Proc. WACV (2023)","DOI":"10.1109\/WACV56688.2023.00210"},{"key":"28_CR40","unstructured":"Mas, J., Fernandez, G.: Video shot boundary detection based on color histogram. In: TRECVID (2003)"},{"key":"28_CR41","doi-asserted-by":"crossref","unstructured":"Meister, S., Hur, J., Roth, S.: Unflow: Unsupervised learning of optical flow with a bidirectional census loss. In: Proceedings of the AAAI conference on artificial intelligence. vol.\u00a032 (2018)","DOI":"10.1609\/aaai.v32i1.12276"},{"key":"28_CR42","doi-asserted-by":"crossref","unstructured":"Moing, G.L., Ponce, J., Schmid, C.: Dense optical tracking: Connecting the dots. In: Proc. CVPR (2024)","DOI":"10.1109\/CVPR52733.2024.01815"},{"key":"28_CR43","doi-asserted-by":"crossref","unstructured":"Neoral, M., \u0160er\u1ef3ch, J., Matas, J.: MFT: Long-term tracking of every pixel. In: Proc. WACV (2024)","DOI":"10.1109\/WACV57701.2024.00669"},{"key":"28_CR44","unstructured":"Nov\u00e1k, T., \u0160ochman, J., Matas, J.: A new semi-supervised method improving optical flow on distant domains. In: Computer Vision Winter Workshop. vol.\u00a03 (2020)"},{"key":"28_CR45","doi-asserted-by":"crossref","unstructured":"Ochs, P., Malik, J., Brox, T.: Segmentation of moving objects by long term video analysis. IEEE transactions on pattern analysis and machine intelligence 36(6), 1187\u20131200 (2013)","DOI":"10.1109\/TPAMI.2013.242"},{"key":"28_CR46","unstructured":"OpenAI: GPT-4V(ision) system card (September 25, 2023)"},{"key":"28_CR47","doi-asserted-by":"crossref","unstructured":"Perazzi, F., Pont-Tuset, J., McWilliams, B., Van\u00a0Gool, L., Gross, M., Sorkine-Hornung, A.: A benchmark dataset and evaluation methodology for video object segmentation. In: Proc. CVPR (2016)","DOI":"10.1109\/CVPR.2016.85"},{"key":"28_CR48","doi-asserted-by":"crossref","unstructured":"Polajnar, J., Kvinikadze, E., Harley, A.W., Malenovsk\u1ef3, I.: Wing buzzing as a mechanism for generating vibrational signals in psyllids. Insect Science (2024)","DOI":"10.1111\/1744-7917.13322"},{"key":"28_CR49","unstructured":"Raji\u010d, F., Ke, L., Tai, Y.W., Tang, C.K., Danelljan, M., Yu, F.: Segment anything meets point tracking. arXiv preprint arXiv:2307.01197 (2023)"},{"key":"28_CR50","doi-asserted-by":"crossref","unstructured":"Ren, Z., Yan, J., Ni, B., Liu, B., Yang, X., Zha, H.: Unsupervised deep learning for optical flow estimation. In: Proceedings of the AAAI conference on artificial intelligence. vol.\u00a031 (2017)","DOI":"10.1609\/aaai.v31i1.10723"},{"key":"28_CR51","doi-asserted-by":"crossref","unstructured":"Rubinstein, M., Liu, C., Freeman, W.T.: Towards longer long-range motion trajectories. In: Proc. BMVC (2012)","DOI":"10.5244\/C.26.53"},{"key":"28_CR52","doi-asserted-by":"crossref","unstructured":"Sand, P., Teller, S.: Particle video: Long-range motion estimation using point trajectories. Proc. ICCV (2008)","DOI":"10.1007\/s11263-008-0136-6"},{"key":"28_CR53","doi-asserted-by":"crossref","unstructured":"Schmidt, A., Mohareri, O., DiMaio, S., Salcudean, S.E.: Surgical tattoos in infrared: A dataset for quantifying tissue tracking and mapping. IEEE Transactions on Medical Imaging (2024)","DOI":"10.1109\/TMI.2024.3372828"},{"key":"28_CR54","doi-asserted-by":"crossref","unstructured":"Shen, Y., Hui, L., Xie, J., Yang, J.: Self-supervised 3d scene flow estimation guided by superpoints. In: Proc. CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.00510"},{"key":"28_CR55","unstructured":"Sohn, K., Berthelot, D., Carlini, N., Zhang, Z., Zhang, H., Raffel, C.A., Cubuk, E.D., Kurakin, A., Li, C.L.: Fixmatch: Simplifying semi-supervised learning with consistency and confidence (2020)"},{"key":"28_CR56","doi-asserted-by":"crossref","unstructured":"Stone, A., Maurer, D., Ayvaci, A., Angelova, A., Jonschkowski, R.: Smurf: Self-teaching multi-frame unsupervised raft with full-image warping. In: Proc. CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00388"},{"key":"28_CR57","doi-asserted-by":"crossref","unstructured":"Sun, X., Harley, A.W., Guibas, L.J.: Refining pre-trained motion models. Proc. Intl. Conf. on Robotics and Automation (2024)","DOI":"10.1109\/ICRA57147.2024.10610900"},{"key":"28_CR58","unstructured":"Tarvainen, A., Valpola, H.: Mean teachers are better role models: Weight-averaged consistency targets improve semi-supervised deep learning results. In: NeurIPS (2017)"},{"key":"28_CR59","unstructured":"Team, G., Anil, R., Borgeaud, S., Wu, Y., Alayrac, J.B., Yu, J., Soricut, R., Schalkwyk, J., Dai, A.M., Hauth, A., et\u00a0al.: Gemini: a family of highly capable multimodal models. arXiv preprint arXiv:2312.11805 (2023)"},{"key":"28_CR60","doi-asserted-by":"crossref","unstructured":"Teed, Z., Deng, J.: RAFT: Recurrent all-pairs field transforms for optical flow. In: Proc. ECCV (2020)","DOI":"10.1007\/978-3-030-58536-5_24"},{"key":"28_CR61","doi-asserted-by":"crossref","unstructured":"Truong, B.T., Dorai, C., Venkatesh, S.: New enhancements to cut, fade, and dissolve detection processes in video segmentation. In: Proceedings of the eighth ACM international conference on Multimedia. pp. 219\u2013227 (2000)","DOI":"10.1145\/354384.354481"},{"key":"28_CR62","doi-asserted-by":"crossref","unstructured":"Vecerik, M., Doersch, C., Yang, Y., Davchev, T., Aytar, Y., Zhou, G., Hadsell, R., Agapito, L., Scholz, J.: RoboTAP: Tracking arbitrary points for few-shot visual imitation. In: Proc. Intl. Conf. on Robotics and Automation (2024)","DOI":"10.1109\/ICRA57147.2024.10611409"},{"key":"28_CR63","doi-asserted-by":"crossref","unstructured":"Vondrick, C., Shrivastava, A., Fathi, A., Guadarrama, S., Murphy, K.: Tracking emerges by colorizing videos. In: Proc. ECCV (2018)","DOI":"10.1007\/978-3-030-01261-8_24"},{"key":"28_CR64","doi-asserted-by":"crossref","unstructured":"Wang, J., Karaev, N., Rupprecht, C., Novotny, D.: Visual geometry grounded deep structure from motion. Proc. CVPR (2024)","DOI":"10.1109\/CVPR52733.2024.02049"},{"key":"28_CR65","doi-asserted-by":"crossref","unstructured":"Wang, Q., Chang, Y.Y., Cai, R., Li, Z., Hariharan, B., Holynski, A., Snavely, N.: Tracking everything everywhere all at once. In: Proc. ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.01813"},{"key":"28_CR66","doi-asserted-by":"crossref","unstructured":"Wang, X., Gupta, A.: Unsupervised learning of visual representations using videos. In: Proc. ICCV (2015)","DOI":"10.1109\/ICCV.2015.320"},{"key":"28_CR67","doi-asserted-by":"crossref","unstructured":"Wang, X., Jabri, A., Efros, A.A.: Learning correspondence from the cycle-consistency of time. In: Proc. CVPR (2019)","DOI":"10.1109\/CVPR.2019.00267"},{"key":"28_CR68","doi-asserted-by":"crossref","unstructured":"Wang, Y., Yang, Y., Yang, Z., Zhao, L., Wang, P., Xu, W.: Occlusion aware unsupervised learning of optical flow. In: Proc. CVPR (2018)","DOI":"10.1109\/CVPR.2018.00513"},{"key":"28_CR69","doi-asserted-by":"crossref","unstructured":"Wen, C., Lin, X., So, J., Chen, K., Dou, Q., Gao, Y., Abbeel, P.: Any-point trajectory modeling for policy learning. arXiv preprint arXiv:2401.00025 (2023)","DOI":"10.15607\/RSS.2024.XX.092"},{"key":"28_CR70","doi-asserted-by":"crossref","unstructured":"Wiskott, L., Sejnowski, T.J.: Slow feature analysis: Unsupervised learning of invariances. Neural computation 14(4), 715\u2013770 (2002)","DOI":"10.1162\/089976602317318938"},{"key":"28_CR71","doi-asserted-by":"crossref","unstructured":"Yu, E., Blackburn-Matzen, K., Nguyen, C., Wang, O., Habib Kazi, R., Bousseau, A.: VideoDoodles: Hand-drawn animations on videos with scene-aware canvases. ACM Transactions on Graphics 42(4), 1\u201312 (2023)","DOI":"10.1145\/3592413"},{"key":"28_CR72","doi-asserted-by":"crossref","unstructured":"Yu, J.J., Harley, A.W., Derpanis, K.G.: Back to basics: Unsupervised learning of optical flow via brightness constancy and motion smoothness. In: ECCV 2016 Workshops (2016)","DOI":"10.1007\/978-3-319-49409-8_1"},{"key":"28_CR73","unstructured":"Yuan, C., Wen, C., Zhang, T., Gao, Y.: General flow as foundation affordance for scalable robot learning. arXiv preprint arXiv:2401.11439 (2024)"},{"key":"28_CR74","doi-asserted-by":"crossref","unstructured":"Yusoff, Y., Christmas, W.J., Kittler, J.: Video shot cut detection using adaptive thresholding. In: Proc. BMVC (2000)","DOI":"10.5244\/C.14.37"},{"key":"28_CR75","doi-asserted-by":"crossref","unstructured":"Zheng, Y., Harley, A.W., Shen, B., Wetzstein, G., Guibas, L.J.: PointOdyssey: A large-scale synthetic dataset for long-term point tracking. In: Proc. CVPR (2023)","DOI":"10.1109\/ICCV51070.2023.01818"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ACCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-0901-7_28","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,7]],"date-time":"2024-12-07T08:16:21Z","timestamp":1733559381000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-0901-7_28"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,8]]},"ISBN":["9789819609000","9789819609017"],"references-count":75,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-0901-7_28","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12,8]]},"assertion":[{"value":"8 December 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ACCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Asian Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Hanoi","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Vietnam","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 December 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 December 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"accv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}