{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,11]],"date-time":"2026-02-11T18:15:05Z","timestamp":1770833705381,"version":"3.50.1"},"publisher-location":"Cham","reference-count":69,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031733963","type":"print"},{"value":"9783031733970","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,11,3]],"date-time":"2024-11-03T00:00:00Z","timestamp":1730592000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,3]],"date-time":"2024-11-03T00:00:00Z","timestamp":1730592000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-73397-0_12","type":"book-chapter","created":{"date-parts":[[2024,11,2]],"date-time":"2024-11-02T19:07:08Z","timestamp":1730574428000},"page":"197-214","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":16,"title":["MegaScenes: Scene-Level View Synthesis at\u00a0Scale"],"prefix":"10.1007","author":[{"given":"Joseph","family":"Tung","sequence":"first","affiliation":[]},{"given":"Gene","family":"Chou","sequence":"additional","affiliation":[]},{"given":"Ruojin","family":"Cai","sequence":"additional","affiliation":[]},{"given":"Guandao","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Kai","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Gordon","family":"Wetzstein","sequence":"additional","affiliation":[]},{"given":"Bharath","family":"Hariharan","sequence":"additional","affiliation":[]},{"given":"Noah","family":"Snavely","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,3]]},"reference":[{"key":"12_CR1","doi-asserted-by":"crossref","unstructured":"Barron, J.T., Mildenhall, B., Verbin, D., Srinivasan, P.P., Hedman, P.: Mip-nerf 360: Unbounded anti-aliased neural radiance fields. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.00539"},{"key":"12_CR2","doi-asserted-by":"publisher","unstructured":"Bhat, S.F., Birkl, R., Wofk, D., Wonka, P., M\u00fcller, M.: Zoedepth: zero-shot transfer by combining relative and metric depth (2023). https:\/\/doi.org\/10.48550\/ARXIV.2302.12288. https:\/\/arxiv.org\/abs\/2302.12288","DOI":"10.48550\/ARXIV.2302.12288"},{"key":"12_CR3","unstructured":"Bi\u0144kowski, M., Sutherland, D.J., Arbel, M., Gretton, A.: Demystifying mmd gans. arXiv preprint arXiv:1801.01401 (2018)"},{"key":"12_CR4","doi-asserted-by":"crossref","unstructured":"Cai, R., Tung, J., Wang, Q., Averbuch-Elor, H., Hariharan, B., Snavely, N.: Doppelgangers: Learning to disambiguate images of similar structures. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.00010"},{"key":"12_CR5","doi-asserted-by":"crossref","unstructured":"Cai, S., et al.: Diffdreamer: towards consistent unsupervised single-view scene extrapolation with conditional diffusion models. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.00204"},{"key":"12_CR6","doi-asserted-by":"crossref","unstructured":"Chan, E.R., et al.: Generative novel view synthesis with 3d-aware diffusion models. arXiv preprint arXiv:2304.02602 (2023)","DOI":"10.1109\/ICCV51070.2023.00389"},{"key":"12_CR7","doi-asserted-by":"crossref","unstructured":"Chang, A., et al.: Matterport3d: learning from rgb-d data in indoor environments. arXiv preprint arXiv:1709.06158 (2017)","DOI":"10.1109\/3DV.2017.00081"},{"key":"12_CR8","unstructured":"Chang, A.X., et\u00a0al.: Shapenet: an information-rich 3d model repository. arXiv preprint arXiv:1512.03012 (2015)"},{"key":"12_CR9","unstructured":"Chung, J., Lee, S., Nam, H., Lee, J., Lee, K.M.: Luciddreamer: domain-free generation of 3d gaussian splatting scenes. arXiv preprint arXiv:2311.13384 (2023)"},{"key":"12_CR10","doi-asserted-by":"crossref","unstructured":"Dai, A., Chang, A.X., Savva, M., Halber, M., Funkhouser, T., Nie\u00dfner, M.: Scannet: Richly-annotated 3d reconstructions of indoor scenes. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5828\u20135839 (2017)","DOI":"10.1109\/CVPR.2017.261"},{"key":"12_CR11","doi-asserted-by":"crossref","unstructured":"Deitke, M., et al.: Objaverse-xl: a universe of 10m+ 3d objects. arXiv preprint arXiv:2307.05663 (2023)","DOI":"10.1109\/CVPR52729.2023.01263"},{"key":"12_CR12","doi-asserted-by":"crossref","unstructured":"Du, Y., Zhang, Y., Yu, H.X., Tenenbaum, J.B., Wu, J.: Neural radiance flow for 4d view synthesis and video processing. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (2021)","DOI":"10.1109\/ICCV48922.2021.01406"},{"key":"12_CR13","doi-asserted-by":"crossref","unstructured":"Edstedt, J., B\u00f6kman, G., Wadenb\u00e4ck, M., Felsberg, M.: DeDoDe: detect, Don\u2019t Describe \u2014 Describe, Don\u2019t Detect for Local Feature Matching. In: 2024 International Conference on 3D Vision (3DV). IEEE (2024)","DOI":"10.1109\/3DV62453.2024.00035"},{"key":"12_CR14","doi-asserted-by":"crossref","unstructured":"Heinly, J., Dunn, E., Frahm, J.M.: Recovering correct reconstructions from indistinguishable geometry. In: International Conference on 3D Vision (3DV) (2014)","DOI":"10.1109\/3DV.2014.84"},{"key":"12_CR15","unstructured":"Heusel, M., Ramsauer, H., Unterthiner, T., Nessler, B., Hochreiter, S.: Gans trained by a two time-scale update rule converge to a local nash equilibrium. Advances in neural information processing systems 30 (2017)"},{"key":"12_CR16","unstructured":"Hong, Y., et al.: Lrm: large reconstruction model for single image to 3d. arXiv preprint arXiv:2311.04400 (2023)"},{"key":"12_CR17","doi-asserted-by":"crossref","unstructured":"Kant, Y., Siarohin, A., Vasilkovsky, M., Guler, R.A., Ren, J., Tulyakov, S., Gilitschenski, I.: invs: repurposing diffusion inpainters for novel view synthesis. In: SIGGRAPH Asia 2023 Conference Papers (2023)","DOI":"10.1145\/3610548.3618149"},{"key":"12_CR18","doi-asserted-by":"crossref","unstructured":"Kerbl, B., Kopanas, G., Leimk\u00fchler, T., Drettakis, G.: 3d gaussian splatting for real-time radiance field rendering. ACM Trans. Graph. 42(4) (2023)","DOI":"10.1145\/3592433"},{"key":"12_CR19","doi-asserted-by":"crossref","unstructured":"Li, Y., et al.: Matrixcity: a large-scale city dataset for city-scale neural rendering and beyond. arXiv e-prints pp. arXiv\u20132308 (2023)","DOI":"10.1109\/ICCV51070.2023.00297"},{"key":"12_CR20","doi-asserted-by":"crossref","unstructured":"Li, Z., Snavely, N.: Megadepth: Learning single-view depth prediction from internet photos. In: Computer Vision and Pattern Recognition (CVPR) (2018)","DOI":"10.1109\/CVPR.2018.00218"},{"key":"12_CR21","doi-asserted-by":"crossref","unstructured":"Li, Z., Xian, W., Davis, A., Snavely, N.: Crowdsampling the plenoptic function. In: European Conference on Computer Vision, pp. 178\u2013196. Springer (2020)","DOI":"10.1007\/978-3-030-58452-8_11"},{"key":"12_CR22","doi-asserted-by":"crossref","unstructured":"Li, Z., et\u00a0al.: Openrooms: an open framework for photorealistic indoor scene datasets. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7190\u20137199 (2021)","DOI":"10.1109\/CVPR46437.2021.00711"},{"key":"12_CR23","doi-asserted-by":"crossref","unstructured":"Lindenberger, P., Sarlin, P.E., Pollefeys, M.: LightGlue: local feature matching at light speed. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.01616"},{"key":"12_CR24","doi-asserted-by":"crossref","unstructured":"Ling, L., et\u00a0al.: Dl3dv-10k: a large-scale scene dataset for deep learning-based 3d vision. arXiv preprint arXiv:2312.16256 (2023)","DOI":"10.1109\/CVPR52733.2024.02092"},{"key":"12_CR25","doi-asserted-by":"crossref","unstructured":"Liu, A., Tucker, R., Jampani, V., Makadia, A., Snavely, N., Kanazawa, A.: Infinite nature: Perpetual view generation of natural scenes from a single image. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), October 2021","DOI":"10.1109\/ICCV48922.2021.01419"},{"key":"12_CR26","unstructured":"Liu, M., et al.: One-2-3-45: any single image to 3d mesh in 45 seconds without per-shape optimization. Advances in Neural Information Processing Systems 36 (2024)"},{"key":"12_CR27","doi-asserted-by":"crossref","unstructured":"Liu, R., Wu, R., Van\u00a0Hoorick, B., Tokmakov, P., Zakharov, S., Vondrick, C.: Zero-1-to-3: Zero-shot one image to 3d object. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9298\u20139309 (2023)","DOI":"10.1109\/ICCV51070.2023.00853"},{"key":"12_CR28","unstructured":"Liu, Y., et al.: Syncdreamer: Generating multiview-consistent images from a single-view image. arXiv preprint arXiv:2309.03453 (2023)"},{"issue":"2","key":"12_CR29","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"DG Lowe","year":"2004","unstructured":"Lowe, D.G.: Distinctive image features from scale-invariant keypoints. IJCV 60(2), 91\u2013110 (2004)","journal-title":"IJCV"},{"key":"12_CR30","doi-asserted-by":"crossref","unstructured":"Martin-Brualla, R., Radwan, N., Sajjadi, M.S.M., Barron, J.T., Dosovitskiy, A., Duckworth, D.: NeRF in the Wild: Neural Radiance Fields for Unconstrained Photo Collections. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.00713"},{"issue":"1","key":"12_CR31","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1145\/3503250","volume":"65","author":"B Mildenhall","year":"2021","unstructured":"Mildenhall, B., Srinivasan, P.P., Tancik, M., Barron, J.T., Ramamoorthi, R., Ng, R.: Nerf: representing scenes as neural radiance fields for view synthesis. Commun. ACM 65(1), 99\u2013106 (2021)","journal-title":"Commun. ACM"},{"key":"12_CR32","doi-asserted-by":"crossref","unstructured":"Niemeyer, M., Barron, J.T., Mildenhall, B., Sajjadi, M.S., Geiger, A., Radwan, N.: Regnerf: regularizing neural radiance fields for view synthesis from sparse inputs. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5480\u20135490 (2022)","DOI":"10.1109\/CVPR52688.2022.00540"},{"key":"12_CR33","unstructured":"Poole, B., Jain, A., Barron, J.T., Mildenhall, B.: Dreamfusion: text-to-3d using 2d diffusion. arXiv preprint arXiv:2209.14988 (2022)"},{"key":"12_CR34","unstructured":"Qian, G., et\u00a0al.: Magic123: one image to high-quality 3d object generation using both 2d and 3d diffusion priors. arXiv preprint arXiv:2306.17843 (2023)"},{"key":"12_CR35","unstructured":"Radford, A., et\u00a0al.: Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763. PMLR (2021)"},{"key":"12_CR36","unstructured":"Ramzi, E., Audebert, N., Rambour, C., Araujo, A., Bitot, X., Thome, N.: Optimization of Rank Losses for Image Retrieval. In: In submission to: IEEE Transactions on Pattern Analysis and Machine Intelligence (2023)"},{"key":"12_CR37","doi-asserted-by":"crossref","unstructured":"Reizenstein, J., Shapovalov, R., Henzler, P., Sbordone, L., Labatut, P., Novotny, D.: Common objects in 3d: large-scale learning and evaluation of real-life 3d category reconstruction. In: International Conference on Computer Vision (2021)","DOI":"10.1109\/ICCV48922.2021.01072"},{"key":"12_CR38","doi-asserted-by":"crossref","unstructured":"Roberts, M., et al.: Hypersim: a photorealistic synthetic dataset for holistic indoor scene understanding. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 10912\u201310922 (2021)","DOI":"10.1109\/ICCV48922.2021.01073"},{"key":"12_CR39","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10684\u201310695 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"12_CR40","first-page":"36479","volume":"35","author":"C Saharia","year":"2022","unstructured":"Saharia, C., et al.: Photorealistic text-to-image diffusion models with deep language understanding. Adv. Neural. Inf. Process. Syst. 35, 36479\u201336494 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"12_CR41","doi-asserted-by":"crossref","unstructured":"Sargent, K., et\u00a0al.: Zeronvs: zero-shot 360-degree view synthesis from a single real image. arXiv preprint arXiv:2310.17994 (2023)","DOI":"10.1109\/CVPR52733.2024.00900"},{"key":"12_CR42","doi-asserted-by":"crossref","unstructured":"Sch\u00f6nberger, J.L., Frahm, J.M.: Structure-from-motion revisited. In: Conference on Computer Vision and Pattern Recognition (CVPR) (2016)","DOI":"10.1109\/CVPR.2016.445"},{"key":"12_CR43","doi-asserted-by":"crossref","unstructured":"Sch\u00f6nberger, J.L., Price, T., Sattler, T., Frahm, J.M., Pollefeys, M.: A vote-and-verify strategy for fast spatial verification in image retrieval. In: Asian Conference on Computer Vision (ACCV) (2016)","DOI":"10.1007\/978-3-319-54181-5_21"},{"key":"12_CR44","unstructured":"Shi, Y., Wang, P., Ye, J., Long, M., Li, K., Yang, X.: Mvdream: multi-view diffusion for 3d generation. arXiv preprint arXiv:2308.16512 (2023)"},{"key":"12_CR45","doi-asserted-by":"crossref","unstructured":"S\u00f8lund, T., Buch, A.G., Kr\u00fcger, N., Aan\u00e6s, H.: A large scale 3d object recognition dataset. In: 3DV (2016)","DOI":"10.1109\/3DV.2016.16"},{"key":"12_CR46","unstructured":"Tewari, A., et al.: Diffusion with forward models: Solving stochastic inverse problems without direct supervision. Advances in Neural Information Processing Systems 36 (2024)"},{"key":"12_CR47","unstructured":"Tyszkiewicz, M., Fua, P., Trulls, E.: Disk: learning local features with policy gradient. Advances in Neural Information Processing Systems 33 (2020)"},{"key":"12_CR48","doi-asserted-by":"crossref","unstructured":"Verbin, D., Hedman, P., Mildenhall, B., Zickler, T., Barron, J.T., Srinivasan, P.P.: Ref-nerf: Structured view-dependent appearance for neural radiance fields. In: 2022 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5481\u20135490. IEEE (2022)","DOI":"10.1109\/CVPR52688.2022.00541"},{"key":"12_CR49","doi-asserted-by":"crossref","unstructured":"Wang, H., Du, X., Li, J., Yeh, R.A., Shakhnarovich, G.: Score jacobian chaining: lifting pretrained 2d diffusion models for 3d generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12619\u201312629 (2023)","DOI":"10.1109\/CVPR52729.2023.01214"},{"key":"12_CR50","doi-asserted-by":"crossref","unstructured":"Wang, J., Rupprecht, C., Novotny, D.: PoseDiffusion: solving pose estimation via diffusion-aided bundle adjustment (2023)","DOI":"10.1109\/ICCV51070.2023.00896"},{"key":"12_CR51","unstructured":"Wang, P., et al.: Pf-lrm: pose-free large reconstruction model for joint pose and shape prediction. arXiv preprint arXiv:2311.12024 (2023)"},{"key":"12_CR52","doi-asserted-by":"crossref","unstructured":"Wang, Q., Zhou, X., Hariharan, B., Snavely, N.: Learning feature descriptors using camera pose supervision. In: Proc. European Conference on Computer Vision (ECCV) (2020)","DOI":"10.1007\/978-3-030-58452-8_44"},{"key":"12_CR53","doi-asserted-by":"crossref","unstructured":"Wang, S., Leroy, V., Cabon, Y., Chidlovskii, B., Revaud, J.: Dust3r: geometric 3d vision made easy. arXiv preprint arXiv:2312.14132 (2023)","DOI":"10.1109\/CVPR52733.2024.01956"},{"key":"12_CR54","unstructured":"Wang, Z., Lu, C., Wang, Y., Bao, F., Li, C., Su, H., Zhu, J.: Prolificdreamer: high-fidelity and diverse text-to-3d generation with variational score distillation. Advances in Neural Information Processing Systems 36 (2024)"},{"issue":"4","key":"12_CR55","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang, Z., Bovik, A.C., Sheikh, H.R., Simoncelli, E.P.: Image quality assessment: from error visibility to structural similarity. IEEE Trans. Image Process. 13(4), 600\u2013612 (2004)","journal-title":"IEEE Trans. Image Process."},{"key":"12_CR56","unstructured":"Watson, D., Chan, W., Martin-Brualla, R., Ho, J., Tagliasacchi, A., Norouzi, M.: Novel view synthesis with diffusion models. arXiv preprint arXiv:2210.04628 (2022)"},{"key":"12_CR57","doi-asserted-by":"crossref","unstructured":"Weyand, T., Araujo, A., Cao, B., Sim, J.: Google landmarks dataset v2 - a large-scale benchmark for instance-level recognition and retrieval. In: Proc. CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00265"},{"key":"12_CR58","unstructured":"Wu, R., et\u00a0al.: Reconfusion: 3d reconstruction with diffusion priors. arXiv preprint arXiv:2312.02981 (2023)"},{"key":"12_CR59","doi-asserted-by":"crossref","unstructured":"Wu, X., Averbuch-Elor, H., Sun, J., Snavely, N.: Towers of Babel: combining images, language, and 3D geometry for learning multimodal vision. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00048"},{"key":"12_CR60","doi-asserted-by":"crossref","unstructured":"Yang, L., Kang, B., Huang, Z., Xu, X., Feng, J., Zhao, H.: Depth anything: unleashing the power of large-scale unlabeled data. In: CVPR (2024)","DOI":"10.1109\/CVPR52733.2024.00987"},{"key":"12_CR61","doi-asserted-by":"crossref","unstructured":"Yao, Y., et al.: Blendedmvs: a large-scale dataset for generalized multi-view stereo networks. In: Computer Vision and Pattern Recognition (CVPR) (2020)","DOI":"10.1109\/CVPR42600.2020.00186"},{"key":"12_CR62","doi-asserted-by":"crossref","unstructured":"Yeshwanth, C., Liu, Y.C., Nie\u00dfner, M., Dai, A.: Scannet++: A high-fidelity dataset of 3d indoor scenes. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 12\u201322 (2023)","DOI":"10.1109\/ICCV51070.2023.00008"},{"key":"12_CR63","doi-asserted-by":"crossref","unstructured":"Yu, A., Ye, V., Tancik, M., Kanazawa, A.: pixelnerf: Neural radiance fields from one or few images. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4578\u20134587 (2021)","DOI":"10.1109\/CVPR46437.2021.00455"},{"key":"12_CR64","doi-asserted-by":"crossref","unstructured":"Yu, H.X., et\u00a0al.: Wonderjourney: Going from anywhere to everywhere. arXiv preprint arXiv:2312.03884 (2023)","DOI":"10.1109\/CVPR52733.2024.00636"},{"key":"12_CR65","doi-asserted-by":"crossref","unstructured":"Yu, X., et al.: Mvimgnet: a large-scale dataset of multi-view images. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.00883"},{"key":"12_CR66","doi-asserted-by":"crossref","unstructured":"Zhang, R., Isola, P., Efros, A.A., Shechtman, E., Wang, O.: The unreasonable effectiveness of deep features as a perceptual metric. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00068"},{"key":"12_CR67","doi-asserted-by":"crossref","unstructured":"Zhou, T., Tucker, R., Flynn, J., Fyffe, G., Snavely, N.: Stereo magnification: Learning view synthesis using multiplane images. ACM Trans. Graph. (Proc. SIGGRAPH) 37 (2018), https:\/\/arxiv.org\/abs\/1805.09817","DOI":"10.1145\/3197517.3201323"},{"key":"12_CR68","doi-asserted-by":"crossref","unstructured":"Zhou, T., Tulsiani, S., Sun, W., Malik, J., Efros, A.A.: View synthesis by appearance flow. In: European Conference on Computer Vision (2016)","DOI":"10.1007\/978-3-319-46493-0_18"},{"key":"12_CR69","doi-asserted-by":"crossref","unstructured":"Zhou, Z., Tulsiani, S.: Sparsefusion: distilling view-conditioned diffusion for 3d reconstruction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12588\u201312597 (2023)","DOI":"10.1109\/CVPR52729.2023.01211"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-73397-0_12","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,2]],"date-time":"2024-11-02T19:19:54Z","timestamp":1730575194000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-73397-0_12"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,3]]},"ISBN":["9783031733963","9783031733970"],"references-count":69,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-73397-0_12","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,3]]},"assertion":[{"value":"3 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}