{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T17:37:52Z","timestamp":1777657072912,"version":"3.51.4"},"publisher-location":"Cham","reference-count":69,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031729973","type":"print"},{"value":"9783031729980","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,9,30]],"date-time":"2024-09-30T00:00:00Z","timestamp":1727654400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,9,30]],"date-time":"2024-09-30T00:00:00Z","timestamp":1727654400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72998-0_3","type":"book-chapter","created":{"date-parts":[[2024,9,29]],"date-time":"2024-09-29T18:01:58Z","timestamp":1727632918000},"page":"37-54","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["Textual Query-Driven Mask Transformer for\u00a0Domain Generalized Segmentation"],"prefix":"10.1007","author":[{"given":"Byeonghyun","family":"Pak","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Byeongju","family":"Woo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sunghwan","family":"Kim","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dae-hwan","family":"Kim","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hoseong","family":"Kim","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,9,30]]},"reference":[{"key":"3_CR1","doi-asserted-by":"publisher","unstructured":"Cai, Z., et al.: X-DETR: a versatile architecture for instance-wise vision-language tasks. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) Computer Vision \u2013 ECCV 2022. ECCV 2022. LNCS, vol. 13696, pp. 290\u2013308. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-20059-5_17","DOI":"10.1007\/978-3-031-20059-5_17"},{"key":"3_CR2","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"213","DOI":"10.1007\/978-3-030-58452-8_13","volume-title":"Computer Vision \u2013 ECCV 2020","author":"N Carion","year":"2020","unstructured":"Carion, N., Massa, F., Synnaeve, G., Usunier, N., Kirillov, A., Zagoruyko, S.: End-to-end object detection with transformers. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12346, pp. 213\u2013229. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_13"},{"key":"3_CR3","doi-asserted-by":"crossref","unstructured":"Caron, M., et al.: Emerging properties in self-supervised vision transformers. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"3_CR4","doi-asserted-by":"crossref","unstructured":"Cheng, B., Misra, I., Schwing, A.G., Kirillov, A., Girdhar, R.: Masked-attention mask transformer for universal image segmentation. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00135"},{"key":"3_CR5","unstructured":"Cheng, B., Schwing, A., Kirillov, A.: Per-pixel classification is not all you need for semantic segmentation. NeurIPS (2021)"},{"key":"3_CR6","doi-asserted-by":"crossref","unstructured":"Cho, J., Nam, G., Kim, S., Yang, H., Kwak, S.: PromptStyler: prompt-driven style generation for source-free domain generalization. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.01439"},{"key":"3_CR7","doi-asserted-by":"crossref","unstructured":"Choi, S., Jung, S., Yun, H., Kim, J.T., Kim, S., Choo, J.: RobustNet: improving domain generalization in urban-scene segmentation via instance selective whitening. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.01141"},{"key":"3_CR8","doi-asserted-by":"crossref","unstructured":"Cordts, M., et al.: The cityscapes dataset for semantic urban scene understanding. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.350"},{"key":"3_CR9","doi-asserted-by":"crossref","unstructured":"Desai, K., Johnson, J.: VirTex: learning visual representations from textual annotations. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.01101"},{"key":"3_CR10","doi-asserted-by":"crossref","unstructured":"Ding, J., Xue, N., Xia, G.S., Schiele, B., Dai, D.: HGFormer: hierarchical grouping transformer for domain heneralized semantic segmentation. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.01479"},{"key":"3_CR11","unstructured":"Dosovitskiy, A., et\u00a0al.: An image is worth 16 $$\\times $$ 16 words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"3_CR12","doi-asserted-by":"crossref","unstructured":"Fahes, M., Vu, T.H., Bursuc, A., P\u00e9rez, P., de\u00a0Charette, R.: A simple recipe for language-guided domain generalized segmentation. arXiv preprint arXiv:2311.17922 (2023)","DOI":"10.1109\/CVPR52733.2024.02211"},{"key":"3_CR13","doi-asserted-by":"crossref","unstructured":"Fang, Y., Sun, Q., Wang, X., Huang, T., Wang, X., Cao, Y.: EVA-02: a visual representation for neon genesis. arXiv preprint arXiv:2303.11331 (2023)","DOI":"10.2139\/ssrn.4813567"},{"key":"3_CR14","doi-asserted-by":"crossref","unstructured":"Fang, Y., et al.: EVA: exploring the limits of masked visual representation learning at scale. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.01855"},{"key":"3_CR15","unstructured":"Goyal, P., et al.: Accurate, large minibatch SGD: training imagenet in 1 hour. arXiv preprint arXiv:1706.02677 (2017)"},{"key":"3_CR16","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., Girshick, R.: Masked autoencoders are scalable vision learners. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"3_CR17","doi-asserted-by":"crossref","unstructured":"He, K., Fan, H., Wu, Y., Xie, S., Girshick, R.: Momentum contrast for unsupervised visual representation learning. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00975"},{"key":"3_CR18","doi-asserted-by":"crossref","unstructured":"Hoyer, L., Dai, D., Van\u00a0Gool, L.: DAFormer: improving network architectures and training strategies for domain-adaptive semantic segmentation. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00969"},{"key":"3_CR19","doi-asserted-by":"crossref","unstructured":"Huang, Z., Zhou, A., Ling, Z., Cai, M., Wang, H., Lee, Y.J.: A sentence speaks a thousand images: Domain generalization through distilling CLIP with language guidance. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.01073"},{"key":"3_CR20","doi-asserted-by":"crossref","unstructured":"H\u00fcmmer, C., Schwonberg, M., Zhong, L., Cao, H., Knoll, A., Gottschalk, H.: VLTSeg: simple transfer of CLIP-based vision-language representations for domain generalized semantic segmentation. arXiv preprint arXiv:2312.02021 (2023)","DOI":"10.1109\/IV55152.2023.10186752"},{"key":"3_CR21","unstructured":"Jia, C., et al.: Scaling up visual and vision-language representation learning with noisy text supervision. In: ICML (2021)"},{"key":"3_CR22","doi-asserted-by":"crossref","unstructured":"Kamath, A., Singh, M., LeCun, Y., Synnaeve, G., Misra, I., Carion, N.: MDETR \u2013 modulated detection for end-to-end multi-modal understanding. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00180"},{"key":"3_CR23","doi-asserted-by":"crossref","unstructured":"Kim, S., Kim, D.H., Kim, H.: Texture learning domain randomization for domain generalized segmentation. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.00069"},{"key":"3_CR24","doi-asserted-by":"crossref","unstructured":"Lee, S., Seong, H., Lee, S., Kim, E.: WildNet: learning domain generalized semantic segmentation from the wild. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00970"},{"key":"3_CR25","unstructured":"Li, B., Weinberger, K.Q., Belongie, S., Koltun, V., Ranftl, R.: Language-driven semantic segmentation. In: ICLR (2022)"},{"key":"3_CR26","doi-asserted-by":"crossref","unstructured":"Li, F., Zhang, H., Liu, S., Guo, J., Ni, L.M., Zhang, L.: DN-DETR: accelerate detr training by introducing query denoising. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.01325"},{"key":"3_CR27","unstructured":"Li, X., et al.: Transformer-based visual segmentation: a survey. arXiv preprint arXiv:2304.09854 (2023)"},{"issue":"3","key":"3_CR28","doi-asserted-by":"publisher","first-page":"1065","DOI":"10.1109\/TMI.2020.3046692","volume":"40","author":"Z Li","year":"2020","unstructured":"Li, Z., Kamnitsas, K., Glocker, B.: Analyzing overfitting under class imbalance in neural networks for image segmentation. IEEE Trans. Med. Imaging 40(3), 1065\u20131077 (2020)","journal-title":"IEEE Trans. Med. Imaging"},{"key":"3_CR29","doi-asserted-by":"crossref","unstructured":"Li, Z., et al.: Panoptic SegFormer: delving deeper into panoptic segmentation with transformers. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00134"},{"key":"3_CR30","doi-asserted-by":"crossref","unstructured":"Liang, F., et al.: Open-vocabulary semantic segmentation with mask-adapted CLIP. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.00682"},{"key":"3_CR31","doi-asserted-by":"crossref","unstructured":"Lin, Y., et al.: CLIP is also an efficient segmenter: a text-driven approach for weakly supervised semantic segmentation. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.01469"},{"key":"3_CR32","unstructured":"Liu, S., et al.: DAB-DETR: dynamic anchor boxes are better queries for DETR. ICLR (2022)"},{"key":"3_CR33","doi-asserted-by":"crossref","unstructured":"Liu, Y., Liu, C., Han, K., Tang, Q., Qin, Z.: Boosting semantic segmentation from the perspective of explicit class embeddings. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.00082"},{"key":"3_CR34","unstructured":"Loshchilov, I., Hutter, F.: Decoupled weight decay regularization. ICLR (2019)"},{"key":"3_CR35","unstructured":"Lu, J., Batra, D., Parikh, D., Lee, S.: ViLBERT: pretraining task-agnostic visiolinguistic representations for vision-and-language tasks. NeurIPS (2019)"},{"key":"3_CR36","unstructured":"Mangla, P., Chandhok, S., Aggarwal, M., Balasubramanian, V.N., Krishnamurthy, B.: INDIGO: intrinsic multimodality for domain generalization. arXiv preprint arXiv:2206.05912 (2022)"},{"key":"3_CR37","doi-asserted-by":"crossref","unstructured":"Milletari, F., Navab, N., Ahmadi, S.A.: V-Net: fully convolutional neural networks for volumetric medical image segmentation. In: 3DV (2016)","DOI":"10.1109\/3DV.2016.79"},{"key":"3_CR38","doi-asserted-by":"crossref","unstructured":"Mukhoti, J., et al.: Open vocabulary semantic segmentation with patch aligned contrastive learning. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.01860"},{"key":"3_CR39","doi-asserted-by":"crossref","unstructured":"Neuhold, G., Ollmann, T., Rota\u00a0Bulo, S., Kontschieder, P.: The mapillary vistas dataset for semantic understanding of street scenes. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.534"},{"key":"3_CR40","unstructured":"Nguyen, T., Ilharco, G., Wortsman, M., Oh, S., Schmidt, L.: Quality not quantity: on the interaction between dataset design and robustness of CLIP. NeurIPS (2022)"},{"key":"3_CR41","unstructured":"Oquab, M., et\u00a0al.: DINOv2: learning robust visual features without supervision. arXiv preprint arXiv:2304.07193 (2023)"},{"key":"3_CR42","doi-asserted-by":"crossref","unstructured":"Pan, X., Luo, P., Shi, J., Tang, X.: Two at once: enhancing learning and generalization capacities via ibn-net. In: ECCV (2018)","DOI":"10.1007\/978-3-030-01225-0_29"},{"key":"3_CR43","doi-asserted-by":"crossref","unstructured":"Pan, X., Zhan, X., Shi, J., Tang, X., Luo, P.: Switchable whitening for deep representation learning. In: ICCV (2019)","DOI":"10.1109\/ICCV.2019.00195"},{"key":"3_CR44","doi-asserted-by":"crossref","unstructured":"Peng, D., Lei, Y., Hayat, M., Guo, Y., Li, W.: Semantic-aware domain generalized segmentation. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00262"},{"key":"3_CR45","doi-asserted-by":"crossref","unstructured":"Pham, H., et\u00a0al.: Combined scaling for zero-shot transfer learning. Neurocomputing (2023)","DOI":"10.1016\/j.neucom.2023.126658"},{"key":"3_CR46","unstructured":"Radford, A., et\u00a0al.: Learning transferable visual models from natural language supervision. In: ICML (2021)"},{"key":"3_CR47","doi-asserted-by":"crossref","unstructured":"Rao, Y., et al.: DenseCLIP: language-guided dense prediction with context-aware prompting. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.01755"},{"key":"3_CR48","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"102","DOI":"10.1007\/978-3-319-46475-6_7","volume-title":"Computer Vision \u2013 ECCV 2016","author":"SR Richter","year":"2016","unstructured":"Richter, S.R., Vineet, V., Roth, S., Koltun, V.: Playing for data: ground truth from computer games. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9906, pp. 102\u2013118. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46475-6_7"},{"key":"3_CR49","doi-asserted-by":"crossref","unstructured":"Ros, G., Sellart, L., Materzynska, J., Vazquez, D., Lopez, A.M.: The SYNTHIA dataset: a large collection of synthetic images for semantic segmentation of urban scenes. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.352"},{"key":"3_CR50","unstructured":"Sun, Q., Chen, H., Zheng, M., Wu, Z., Felsberg, M., Tang, Y.: IBAFormer: intra-batch attention transformer for domain generalized semantic segmentation. arXiv preprint arXiv:2309.06282 (2023)"},{"key":"3_CR51","unstructured":"Sun, Q., Fang, Y., Wu, L., Wang, X., Cao, Y.: EVA-CLIP: improved training techniques for clip at scale. arXiv preprint arXiv:2303.15389 (2023)"},{"key":"3_CR52","doi-asserted-by":"crossref","unstructured":"Tan, H., Bansal, M.: LXMERT: learning cross-modality encoder representations from transformers. arXiv preprint arXiv:1908.07490 (2019)","DOI":"10.18653\/v1\/D19-1514"},{"key":"3_CR53","unstructured":"Vaswani, A., et al.: Attention is all you need. NeurIPS (2017)"},{"key":"3_CR54","doi-asserted-by":"crossref","unstructured":"Wei, Z., et al.: Stronger, fewer, & superior: harnessing vision foundation models for domain generalized semantic segmentation. arXiv preprint arXiv:2312.04265 (2023)","DOI":"10.1109\/CVPR52733.2024.02704"},{"key":"3_CR55","doi-asserted-by":"crossref","unstructured":"Wortsman, M., et\u00a0al.: Robust fine-tuning of zero-shot models. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00780"},{"key":"3_CR56","doi-asserted-by":"publisher","unstructured":"Xu, M., et al.: A simple baseline for open-vocabulary semantic segmentation with pre-trained vision-language model. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) Computer Vision \u2013 ECCV 2022. ECCV 2022. LNCS, vol. 13689, pp. 736\u2013753. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19818-2_42","DOI":"10.1007\/978-3-031-19818-2_42"},{"key":"3_CR57","doi-asserted-by":"crossref","unstructured":"Yu, F., et al.: BDD100k: a diverse driving dataset for heterogeneous multitask learning. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00271"},{"key":"3_CR58","doi-asserted-by":"crossref","unstructured":"Yu, Q., et al.: kMaX-DeepLab: k-means mask transformer. In: ECCV (2022)","DOI":"10.1007\/978-3-031-19818-2_17"},{"key":"3_CR59","doi-asserted-by":"crossref","unstructured":"Yue, X., Zhang, Y., Zhao, S., Sangiovanni-Vincentelli, A., Keutzer, K., Gong, B.: Domain randomization and pyramid consistency: simulation-to-real generalization without accessing target domain data. In: ICCV (2019)","DOI":"10.1109\/ICCV.2019.00219"},{"key":"3_CR60","unstructured":"Zhang, B., Tian, Z., Tang, Q., Chu, X., Wei, X., Shen, C., et\u00a0al.: Segvit: semantic segmentation with plain vision transformers. NeurIPS (2022)"},{"key":"3_CR61","unstructured":"Zhang, H., et al.: DINO: DETR with improved denoising anchor boxes for end-to-end object detection. arXiv preprint arXiv:2203.03605 (2022)"},{"key":"3_CR62","doi-asserted-by":"crossref","unstructured":"Zhang, H., et al.: MP-Former: mask-piloted transformer for image segmentation. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.01733"},{"key":"3_CR63","doi-asserted-by":"publisher","unstructured":"Zhao, Y., Zhong, Z., Zhao, N., Sebe, N., Lee, G.H.: Style-hallucinated dual consistency learning for domain generalized semantic segmentation. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) Computer Vision \u2013 ECCV 2022. ECCV 2022. LNCS, vol. 13688, pp. 535\u2013552. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19815-1_31","DOI":"10.1007\/978-3-031-19815-1_31"},{"key":"3_CR64","doi-asserted-by":"crossref","unstructured":"Zhao, Y., Zhong, Z., Zhao, N., Sebe, N., Lee, G.H.: Style-hallucinated dual consistency learning: a unified framework for visual domain generalization. IJCV (2023)","DOI":"10.1007\/s11263-023-01911-w"},{"key":"3_CR65","doi-asserted-by":"publisher","unstructured":"Zhou, C., Loy, C.C., Dai, B.: Extract free dense labels from CLIP. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) Computer Vision \u2013 ECCV 2022. ECCV 2022. LNCS, vol. 13688, pp. 696\u2013712. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19815-1_40","DOI":"10.1007\/978-3-031-19815-1_40"},{"key":"3_CR66","doi-asserted-by":"crossref","unstructured":"Zhou, K., Yang, J., Loy, C.C., Liu, Z.: Learning to prompt for vision-language models. IJCV (2022)","DOI":"10.1007\/s11263-022-01653-1"},{"key":"3_CR67","doi-asserted-by":"crossref","unstructured":"Zhou, Z., Lei, Y., Zhang, B., Liu, L., Liu, Y.: ZegCLIP: towards adapting clip for zero-shot semantic segmentation. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.01075"},{"key":"3_CR68","unstructured":"Zhu, C., Chen, L.: A survey on open-vocabulary detection and segmentation: past, present, and future. arXiv preprint arXiv:2307.09220 (2023)"},{"key":"3_CR69","unstructured":"Zhu, X., Su, W., Lu, L., Li, B., Wang, X., Dai, J.: Deformable DETR: deformable transformers for end-to-end object detection. In: ICLR (2020)"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72998-0_3","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,29]],"date-time":"2024-09-29T18:02:35Z","timestamp":1727632955000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72998-0_3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9,30]]},"ISBN":["9783031729973","9783031729980"],"references-count":69,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72998-0_3","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,9,30]]},"assertion":[{"value":"30 September 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}