{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,26]],"date-time":"2026-06-26T04:57:48Z","timestamp":1782449868056,"version":"3.54.5"},"publisher-location":"Cham","reference-count":61,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031729454","type":"print"},{"value":"9783031729461","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,10,2]],"date-time":"2024-10-02T00:00:00Z","timestamp":1727827200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,10,2]],"date-time":"2024-10-02T00:00:00Z","timestamp":1727827200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72946-1_20","type":"book-chapter","created":{"date-parts":[[2024,10,1]],"date-time":"2024-10-01T19:02:08Z","timestamp":1727809328000},"page":"349-367","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["Visual Alignment Pre-training for\u00a0Sign Language Translation"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0976-0834","authenticated-orcid":false,"given":"Peiqi","family":"Jiao","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0696-2468","authenticated-orcid":false,"given":"Yuecong","family":"Min","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3024-4404","authenticated-orcid":false,"given":"Xilin","family":"Chen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2024,10,2]]},"reference":[{"key":"20_CR1","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1007\/978-3-030-58621-8_3","volume-title":"Computer Vision \u2013 ECCV 2020","author":"S Albanie","year":"2020","unstructured":"Albanie, S., et al.: BSL-1K: scaling up co-articulated sign language recognition using mouthing cues. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12356, pp. 35\u201353. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58621-8_3"},{"key":"20_CR2","unstructured":"Bahdanau, D., Cho, K.H., Bengio, Y.: Neural machine translation by jointly learning to align and translate. In: 3rd International Conference on Learning Representations, ICLR 2015 (2015)"},{"key":"20_CR3","doi-asserted-by":"crossref","unstructured":"Ba\u00f1\u00f3n, M., et\u00a0al.: ParaCrawl: web-scale acquisition of parallel corpora. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 4555\u20134567 (2020)","DOI":"10.18653\/v1\/2020.acl-main.417"},{"key":"20_CR4","doi-asserted-by":"crossref","unstructured":"Basri, R., Roth, D., Jacobs, D.: Clustering appearances of 3d objects. In: Proceedings. 1998 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, pp. 414\u2013420. IEEE (1998)","DOI":"10.1109\/CVPR.1998.698639"},{"key":"20_CR5","unstructured":"Brown, P.F., Della\u00a0Pietra, S.A., Della\u00a0Pietra, V.J., Mercer, R.L.: The mathematics of statistical machine translation: parameter estimation. Comput. Linguist. 19(2), 263\u2013311 (1993). https:\/\/aclanthology.org\/J93-2003"},{"key":"20_CR6","doi-asserted-by":"crossref","unstructured":"Camgoz, N.C., Hadfield, S., Koller, O., Ney, H., Bowden, R.: Neural sign language translation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7784\u20137793 (2018)","DOI":"10.1109\/CVPR.2018.00812"},{"key":"20_CR7","unstructured":"Camgoz, N.C., Koller, O., Hadfield, S., Bowden, R.: Sign language transformers: joint end-to-end sign language recognition and translation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10023\u201310033 (2020)"},{"key":"20_CR8","doi-asserted-by":"crossref","unstructured":"Chen, Y., Wei, F., Sun, X., Wu, Z., Lin, S.: A simple multi-modality transfer learning baseline for sign language translation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5120\u20135130 (2022)","DOI":"10.1109\/CVPR52688.2022.00506"},{"key":"20_CR9","first-page":"17043","volume":"35","author":"Y Chen","year":"2022","unstructured":"Chen, Y., Zuo, R., Wei, F., Wu, Y., Liu, S., Mak, B.: Two-stream network for sign language recognition and translation. Adv. Neural. Inf. Process. Syst. 35, 17043\u201317056 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"20_CR10","doi-asserted-by":"crossref","unstructured":"Cheng, Y., Wei, F., Bao, J., Chen, D., Zhang, W.: Cico: domain-aware sign language retrieval via cross-lingual contrastive learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 19016\u201319026 (2023)","DOI":"10.1109\/CVPR52729.2023.01823"},{"key":"20_CR11","unstructured":"Dosovitskiy, A., et al.: An image is worth 16x16 words: transformers for image recognition at scale. In: International Conference on Learning Representations (2021). https:\/\/openreview.net\/forum?id=YicbFdNTTy"},{"key":"20_CR12","first-page":"80","volume":"60","author":"P Dreuw","year":"2007","unstructured":"Dreuw, P., Rybach, D., Deselaers, T., Zahedi, M., Ney, H.: Speech recognition techniques for a sign language recognition system. Hand 60, 80 (2007)","journal-title":"Hand"},{"key":"20_CR13","doi-asserted-by":"crossref","unstructured":"Duarte, A., et al.: How2sign: a large-scale multimodal dataset for continuous american sign language. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2735\u20132744 (2021)","DOI":"10.1109\/CVPR46437.2021.00276"},{"key":"20_CR14","doi-asserted-by":"crossref","unstructured":"Garg, S., Peitz, S., Nallasamy, U., Paulik, M.: Jointly learning to align and translate with transformer models. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing, pp. 4453\u20134462 (2019)","DOI":"10.18653\/v1\/D19-1453"},{"key":"20_CR15","doi-asserted-by":"crossref","unstructured":"Graves, A., Fern\u00e1ndez, S., Gomez, F., Schmidhuber, J.: Connectionist temporal classification: labelling unsegmented sequence data with recurrent neural networks. In: International Conference on Machine Learning, pp. 369\u2013376 (2006)","DOI":"10.1145\/1143844.1143891"},{"key":"20_CR16","doi-asserted-by":"crossref","unstructured":"Guo, L., et al.: Distilling cross-temporal contexts for continuous sign language recognition. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10771\u201310780 (2023)","DOI":"10.1109\/CVPR52729.2023.01037"},{"key":"20_CR17","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., Girshick, R.: Masked autoencoders are scalable vision learners. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16000\u201316009 (2022)","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"20_CR18","doi-asserted-by":"crossref","unstructured":"Hu, H., Zhao, W., Zhou, W., Li, H.: Signbert+: hand-model-aware self-supervised pre-training for sign language understanding. IEEE Trans. Pattern Anal. Mach. Intell. (2023)","DOI":"10.1109\/TPAMI.2023.3269220"},{"key":"20_CR19","doi-asserted-by":"crossref","unstructured":"Hu, L., Gao, L., Liu, Z., Feng, W.: Continuous sign language recognition with correlation network. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2529\u20132539 (2023)","DOI":"10.1109\/CVPR52729.2023.00249"},{"key":"20_CR20","unstructured":"Jia, C., et al.: Scaling up visual and vision-language representation learning with noisy text supervision. In: International Conference on Machine Learning, pp. 4904\u20134916. PMLR (2021)"},{"key":"20_CR21","doi-asserted-by":"crossref","unstructured":"Jiao, P., Min, Y., Li, Y., Wang, X., Lei, L., Chen, X.: Cosign: exploring co-occurrence signals in skeleton-based continuous sign language recognition. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 20676\u201320686 (2023)","DOI":"10.1109\/ICCV51070.2023.01890"},{"key":"20_CR22","doi-asserted-by":"crossref","unstructured":"Jin, T., Zhao, Z.: Contrastive disentangled meta-learning for signer-independent sign language translation. In: Proceedings of the 29th ACM International Conference on Multimedia, pp. 5065\u20135073 (2021)","DOI":"10.1145\/3474085.3475456"},{"key":"20_CR23","unstructured":"Kenton, J.D.M.W.C., Toutanova, L.K.: Bert: pre-training of deep bidirectional transformers for language understanding. In: Proceedings of NAACL-HLT, pp. 4171\u20134186 (2019)"},{"issue":"9","key":"20_CR24","doi-asserted-by":"publisher","first-page":"2306","DOI":"10.1109\/TPAMI.2019.2911077","volume":"42","author":"O Koller","year":"2019","unstructured":"Koller, O., Camgoz, N.C., Ney, H., Bowden, R.: Weakly supervised learning with multi-stream CNN-LSTM-HMMs to discover sequential parallelism in sign language videos. IEEE Trans. Pattern Anal. Mach. Intell. 42(9), 2306\u20132320 (2019)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"20_CR25","first-page":"12034","volume":"33","author":"D Li","year":"2020","unstructured":"Li, D., et al.: TSPNet: hierarchical feature learning via temporal semantic pyramid for sign language translation. Adv. Neural. Inf. Process. Syst. 33, 12034\u201312045 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"20_CR26","unstructured":"Lin, C.Y.: Rouge: a package for automatic evaluation of summaries. In: Text summarization branches out, pp. 74\u201381 (2004)"},{"key":"20_CR27","doi-asserted-by":"crossref","unstructured":"Lin, K., Wang, X., Zhu, L., Sun, K., Zhang, B., Yang, Y.: Gloss-free end-to-end sign language translation. In: Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 12904\u201312916 (2023)","DOI":"10.18653\/v1\/2023.acl-long.722"},{"key":"20_CR28","doi-asserted-by":"publisher","first-page":"726","DOI":"10.1162\/tacl_a_00343","volume":"8","author":"Y Liu","year":"2020","unstructured":"Liu, Y., et al.: Multilingual denoising pre-training for neural machine translation. Trans. Assoc. Comput. Linguist. 8, 726\u2013742 (2020)","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"20_CR29","doi-asserted-by":"crossref","unstructured":"Luong, M.T., Pham, H., Manning, C.D.: Effective approaches to attention-based neural machine translation. In: Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing, pp. 1412\u20131421 (2015)","DOI":"10.18653\/v1\/D15-1166"},{"key":"20_CR30","unstructured":"Mikolov, T., Sutskever, I., Chen, K., Corrado, G.S., Dean, J.: Distributed representations of words and phrases and their compositionality. In: Advances in Neural Information Processing Systems, vol. 26 (2013)"},{"key":"20_CR31","unstructured":"Min, Y., Chen, X.: Towards faithful sign language translation (2023). https:\/\/openreview.net\/forum?id=mWMJN0vbDF"},{"key":"20_CR32","doi-asserted-by":"crossref","unstructured":"Misra, I., Maaten, L.V.D.: Self-supervised learning of pretext-invariant representations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6707\u20136717 (2020)","DOI":"10.1109\/CVPR42600.2020.00674"},{"key":"20_CR33","doi-asserted-by":"crossref","unstructured":"M\u00fcller, M., Jiang, Z., Moryossef, A., Rios, A., Ebling, S.: Considerations for meaningful sign language machine translation based on glosses. In: Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), pp. 682\u2013693 (2023)","DOI":"10.18653\/v1\/2023.acl-short.60"},{"key":"20_CR34","doi-asserted-by":"crossref","unstructured":"Orbay, A., Akarun, L.: Neural sign language translation by learning tokenization. In: 2020 15th IEEE International Conference on Automatic Face and Gesture Recognition, pp. 222\u2013228. IEEE (2020)","DOI":"10.1109\/FG47880.2020.00002"},{"key":"20_CR35","doi-asserted-by":"crossref","unstructured":"Papineni, K., Roukos, S., Ward, T., Zhu, W.J.: BLEU: a method for automatic evaluation of machine translation. In: Proceedings of the 40th annual meeting of the Association for Computational Linguistics, pp. 311\u2013318 (2002)","DOI":"10.3115\/1073083.1073135"},{"key":"20_CR36","unstructured":"Patricia, Cabot, \u00c1., Xavier, Gir\u00f3, N., Laia, Tarr\u00e9s, B.: Sign language translation based on transformers for the How2Sign dataset (2022). https:\/\/imatge.upc.edu\/web\/publications\/sign-language-translation-based-transformers-how2sign-dataset"},{"key":"20_CR37","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C.D.: Glove: global vectors for word representation. In: Proceedings of the 2014 conference on Empirical Methods in Natural Language Processing, pp. 1532\u20131543 (2014)","DOI":"10.3115\/v1\/D14-1162"},{"key":"20_CR38","unstructured":"Radford, A., et\u00a0al.: Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763. PMLR (2021)"},{"issue":"140","key":"20_CR39","first-page":"1","volume":"21","author":"C Raffel","year":"2020","unstructured":"Raffel, C., et al.: Exploring the limits of transfer learning with a unified text-to-text transformer. J. Mach. Learn. Res. 21(140), 1\u201367 (2020)","journal-title":"J. Mach. Learn. Res."},{"key":"20_CR40","doi-asserted-by":"crossref","unstructured":"Shi, B., Brentari, D., Shakhnarovich, G., Livescu, K.: Open-domain sign language translation learned from online video. In: Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, pp. 6365\u20136379 (2022)","DOI":"10.18653\/v1\/2022.emnlp-main.427"},{"key":"20_CR41","doi-asserted-by":"crossref","unstructured":"Sun, C., Myers, A., Vondrick, C., Murphy, K., Schmid, C.: Videobert: a joint model for video and language representation learning. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7464\u20137473 (2019)","DOI":"10.1109\/ICCV.2019.00756"},{"key":"20_CR42","doi-asserted-by":"crossref","unstructured":"Tarr\u00e9s, L., G\u00e1llego, G.I., Duarte, A., Torres, J., Gir\u00f3-i Nieto, X.: Sign language translation from instructional videos. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops, pp. 5625\u20135635 (2023)","DOI":"10.1109\/CVPRW59228.2023.00596"},{"issue":"5500","key":"20_CR43","doi-asserted-by":"publisher","first-page":"2319","DOI":"10.1126\/science.290.5500.2319","volume":"290","author":"JB Tenenbaum","year":"2000","unstructured":"Tenenbaum, J.B., Silva, V.D., Langford, J.C.: A global geometric framework for nonlinear dimensionality reduction. Science 290(5500), 2319\u20132323 (2000)","journal-title":"Science"},{"key":"20_CR44","unstructured":"Uthus, D., Tanzer, G., Georg, M.: Youtube-asl: a large-scale, open-domain American sign language-English parallel corpus. In: Thirty-seventh Conference on Neural Information Processing Systems Datasets and Benchmarks Track (2023)"},{"key":"20_CR45","doi-asserted-by":"crossref","unstructured":"Wang, W., et\u00a0al.: Image as a foreign language: Beit pretraining for vision and vision-language tasks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 19175\u201319186 (2023)","DOI":"10.1109\/CVPR52729.2023.01838"},{"key":"20_CR46","doi-asserted-by":"crossref","unstructured":"Wei, F., Chen, Y.: Improving continuous sign language recognition with cross-lingual signs. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 23612\u201323621 (2023)","DOI":"10.1109\/ICCV51070.2023.02158"},{"key":"20_CR47","unstructured":"Wenzek, G., et al.: CCNet: extracting high quality monolingual datasets from web crawl data. In: Proceedings of the Twelfth Language Resources and Evaluation Conference, pp. 4003\u20134012 (2020)"},{"key":"20_CR48","doi-asserted-by":"crossref","unstructured":"Wong, R., Camgoz, N.C., Bowden, R.: Learnt contrastive concept embeddings for sign recognition. In: 2023 IEEE\/CVF International Conference on Computer Vision Workshops (ICCVW), pp. 1937\u20131946. IEEE Computer Society (2023)","DOI":"10.1109\/ICCVW60793.2023.00209"},{"key":"20_CR49","unstructured":"Wong, R., Camgoz, N.C., Bowden, R.: Sign2GPT: leveraging large language models for gloss-free sign language translation. In: The Twelfth International Conference on Learning Representations (2024). https:\/\/openreview.net\/forum?id=LqaEEs3UxU"},{"key":"20_CR50","doi-asserted-by":"crossref","unstructured":"Yao, H., Zhou, W., Feng, H., Hu, H., Zhou, H., Li, H.: Sign language translation with iterative prototype. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 15592\u201315601 (2023)","DOI":"10.1109\/ICCV51070.2023.01429"},{"key":"20_CR51","unstructured":"Yao, L., et al.: Filip: fine-grained interactive language-image pre-training. In: International Conference on Learning Representations (2021)"},{"key":"20_CR52","doi-asserted-by":"crossref","unstructured":"Yin, A., Zhong, T., Tang, L., Jin, W., Jin, T., Zhao, Z.: Gloss attention for gloss-free sign language translation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2551\u20132562 (2023)","DOI":"10.1109\/CVPR52729.2023.00251"},{"key":"20_CR53","doi-asserted-by":"crossref","unstructured":"Yin, K., Read, J.: Better sign language translation with STMC-transformer. In: Proceedings of the 28th International Conference on Computational Linguistics, pp. 5975\u20135989 (2020)","DOI":"10.18653\/v1\/2020.coling-main.525"},{"key":"20_CR54","unstructured":"Zhang, B., M\u00fcller, M., Sennrich, R.: SLTUNET: a simple unified model for sign language translation. In: International Conference on Learning Representations (2023)"},{"key":"20_CR55","doi-asserted-by":"crossref","unstructured":"Zhang, H., Guo, Z., Yang, Y., Liu, X., Hu, D.: C2st: cross-modal contextualized sequence transduction for continuous sign language recognition. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 21053\u201321062 (2023)","DOI":"10.1109\/ICCV51070.2023.01925"},{"key":"20_CR56","doi-asserted-by":"publisher","first-page":"2662","DOI":"10.1109\/TMM.2021.3087006","volume":"24","author":"J Zhao","year":"2021","unstructured":"Zhao, J., Qi, W., Zhou, W., Duan, N., Zhou, M., Li, H.: Conditional sentence generation and cross-modal reranking for sign language translation. IEEE Trans. Multimedia 24, 2662\u20132672 (2021)","journal-title":"IEEE Trans. Multimedia"},{"key":"20_CR57","doi-asserted-by":"crossref","unstructured":"Zheng, J., et al.: Cvt-slr: contrastive visual-textual transformation for sign language recognition with variational alignment. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 23141\u201323150 (2023)","DOI":"10.1109\/CVPR52729.2023.02216"},{"key":"20_CR58","doi-asserted-by":"crossref","unstructured":"Zhong, Y., et\u00a0al.: Regionclip: region-based language-image pretraining. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16793\u201316803 (2022)","DOI":"10.1109\/CVPR52688.2022.01629"},{"key":"20_CR59","doi-asserted-by":"crossref","unstructured":"Zhou, B., et al.: Gloss-free sign language translation: Improving from visual-language pretraining. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 20871\u201320881 (2023)","DOI":"10.1109\/ICCV51070.2023.01908"},{"key":"20_CR60","doi-asserted-by":"crossref","unstructured":"Zhou, H., Zhou, W., Qi, W., Pu, J., Li, H.: Improving sign language translation with monolingual data by sign back-translation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1316\u20131325 (2021)","DOI":"10.1109\/CVPR46437.2021.00137"},{"key":"20_CR61","doi-asserted-by":"publisher","first-page":"768","DOI":"10.1109\/TMM.2021.3059098","volume":"24","author":"H Zhou","year":"2021","unstructured":"Zhou, H., Zhou, W., Zhou, Y., Li, H.: Spatial-temporal multi-cue network for sign language recognition and translation. IEEE Trans. Multimedia 24, 768\u2013779 (2021)","journal-title":"IEEE Trans. Multimedia"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72946-1_20","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,1]],"date-time":"2024-10-01T19:06:13Z","timestamp":1727809573000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72946-1_20"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,2]]},"ISBN":["9783031729454","9783031729461"],"references-count":61,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72946-1_20","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,10,2]]},"assertion":[{"value":"2 October 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}