{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T16:25:48Z","timestamp":1775579148361,"version":"3.50.1"},"publisher-location":"Cham","reference-count":74,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031726699","type":"print"},{"value":"9783031726705","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,9,30]],"date-time":"2024-09-30T00:00:00Z","timestamp":1727654400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,9,30]],"date-time":"2024-09-30T00:00:00Z","timestamp":1727654400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72670-5_1","type":"book-chapter","created":{"date-parts":[[2024,9,29]],"date-time":"2024-09-29T07:01:50Z","timestamp":1727593310000},"page":"1-19","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":73,"title":["GS-LRM: Large Reconstruction Model for\u00a03D Gaussian Splatting"],"prefix":"10.1007","author":[{"given":"Kai","family":"Zhang","sequence":"first","affiliation":[]},{"given":"Sai","family":"Bi","sequence":"additional","affiliation":[]},{"given":"Hao","family":"Tan","sequence":"additional","affiliation":[]},{"given":"Yuanbo","family":"Xiangli","sequence":"additional","affiliation":[]},{"given":"Nanxuan","family":"Zhao","sequence":"additional","affiliation":[]},{"given":"Kalyan","family":"Sunkavalli","sequence":"additional","affiliation":[]},{"given":"Zexiang","family":"Xu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,9,30]]},"reference":[{"issue":"10","key":"1_CR1","doi-asserted-by":"publisher","first-page":"105","DOI":"10.1145\/2001269.2001293","volume":"54","author":"S Agarwal","year":"2011","unstructured":"Agarwal, S., et al.: Building Rome in a day. Commun. ACM 54(10), 105\u2013112 (2011)","journal-title":"Commun. ACM"},{"key":"1_CR2","doi-asserted-by":"crossref","unstructured":"Aliev, K.A., Sevastopolsky, A., Kolos, M., Ulyanov, D., Lempitsky, V.: Neural point-based graphics. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XXII 16, pp. 696\u2013712. Springer (2020)","DOI":"10.1007\/978-3-030-58542-6_42"},{"key":"1_CR3","unstructured":"Ba, J.L., Kiros, J.R., Hinton, G.E.: Layer normalization. arXiv preprint arXiv:1607.06450 (2016)"},{"key":"1_CR4","doi-asserted-by":"crossref","unstructured":"Barron, J.T., Mildenhall, B., Tancik, M., Hedman, P., Martin-Brualla, R., Srinivasan, P.P.: Mip-NeRF: a multiscale representation for anti-aliasing neural radiance fields. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 5855\u20135864 (2021)","DOI":"10.1109\/ICCV48922.2021.00580"},{"key":"1_CR5","doi-asserted-by":"crossref","unstructured":"Barron, J.T., Mildenhall, B., Verbin, D., Srinivasan, P.P., Hedman, P.: Mip-NeRF 360: unbounded anti-aliased neural radiance fields. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5470\u20135479 (2022)","DOI":"10.1109\/CVPR52688.2022.00539"},{"key":"1_CR6","doi-asserted-by":"crossref","unstructured":"Barron, J.T., Mildenhall, B., Verbin, D., Srinivasan, P.P., Hedman, P.: Zip-NeRF: anti-aliased grid-based neural radiance fields. arXiv preprint arXiv:2304.06706 (2023)","DOI":"10.1109\/ICCV51070.2023.01804"},{"key":"1_CR7","doi-asserted-by":"crossref","unstructured":"Chan, E.R., et\u00a0al.: Efficient geometry-aware 3D generative adversarial networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16123\u201316133 (2022)","DOI":"10.1109\/CVPR52688.2022.01565"},{"key":"1_CR8","doi-asserted-by":"crossref","unstructured":"Charatan, D., Li, S., Tagliasacchi, A., Sitzmann, V.: pixelSplat: 3D gaussian splats from image pairs for scalable generalizable 3D reconstruction. arXiv preprint arXiv:2312.12337 (2023)","DOI":"10.1109\/CVPR52733.2024.01840"},{"key":"1_CR9","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1007\/978-3-031-19824-3_20","volume-title":"Computer Vision \u2013 ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proceedings, Part XXXII","author":"A Chen","year":"2022","unstructured":"Chen, A., Xu, Z., Geiger, A., Yu, J., Su, H.: TensoRF: tensorial radiance fields. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) Computer Vision \u2013 ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proceedings, Part XXXII, pp. 333\u2013350. Springer Nature Switzerland, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19824-3_20"},{"issue":"4","key":"1_CR10","first-page":"1","volume":"42","author":"A Chen","year":"2023","unstructured":"Chen, A., Xu, Z., Wei, X., Tang, S., Su, H., Geiger, A.: Dictionary Fields: learning a neural basis decomposition. ACM Trans. Graph. (TOG) 42(4), 1\u201312 (2023)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"1_CR11","unstructured":"Chen, A., Xu, Z., Wei, X., Tang, S., Su, H., Geiger, A.: Factor Fields: a unified framework for neural fields and beyond. arXiv preprint arXiv:2302.01226 (2023)"},{"key":"1_CR12","doi-asserted-by":"crossref","unstructured":"Chen, A., et al.: MVSNeRF: fast generalizable radiance field reconstruction from multi-view stereo. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 14124\u201314133 (2021)","DOI":"10.1109\/ICCV48922.2021.01386"},{"key":"1_CR13","doi-asserted-by":"crossref","unstructured":"Chen, E.M., Holalkere, S., Yan, R., Zhang, K., Davis, A.: Ray conditioning: trading photo-consistency for photo-realism in multi-view image generation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 23242\u201323251 (2023)","DOI":"10.1109\/ICCV51070.2023.02124"},{"key":"1_CR14","doi-asserted-by":"crossref","unstructured":"Chen, Q., Koltun, V.: Photographic image synthesis with cascaded refinement networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1511\u20131520 (2017)","DOI":"10.1109\/ICCV.2017.168"},{"key":"1_CR15","unstructured":"Chen, T., Xu, B., Zhang, C., Guestrin, C.: Training deep nets with sublinear memory cost. arXiv preprint arXiv:1604.06174 (2016)"},{"key":"1_CR16","doi-asserted-by":"crossref","unstructured":"Cheng, S., et al.: Deep stereo using adaptive thin volume representation with uncertainty awareness. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2524\u20132534 (2020)","DOI":"10.1109\/CVPR42600.2020.00260"},{"key":"1_CR17","doi-asserted-by":"crossref","unstructured":"Collins, J., et\u00a0al.: ABO: dataset and benchmarks for real-world 3D object understanding. In: CVPR, pp. 21126\u201321136 (2022)","DOI":"10.1109\/CVPR52688.2022.02045"},{"key":"1_CR18","unstructured":"Dao, T.: FlashAttention-2: faster attention with better parallelism and work partitioning. arXiv preprint arXiv:2307.08691 (2023)"},{"key":"1_CR19","doi-asserted-by":"crossref","unstructured":"Deitke, M., et al.: Objaverse: a universe of annotated 3D objects. In: CVPR, pp. 13142\u201313153 (2023)","DOI":"10.1109\/CVPR52729.2023.01263"},{"key":"1_CR20","unstructured":"Dosovitskiy, A., et\u00a0al.: An image is worth 16$$\\,\\times \\,$$16 words: transformers for image recognition at scale. In: International Conference on Learning Representations (2020)"},{"key":"1_CR21","doi-asserted-by":"crossref","unstructured":"Downs, L., et al.: Google scanned objects: a high-quality dataset of 3D scanned household items. In: 2022 International Conference on Robotics and Automation (ICRA), pp. 2553\u20132560. IEEE (2022)","DOI":"10.1109\/ICRA46639.2022.9811809"},{"key":"1_CR22","doi-asserted-by":"crossref","unstructured":"Du, Y., Smith, C., Tewari, A., Sitzmann, V.: Learning to render novel views from wide-baseline stereo pairs. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4970\u20134980 (2023)","DOI":"10.1109\/CVPR52729.2023.00481"},{"issue":"8","key":"1_CR23","doi-asserted-by":"publisher","first-page":"1362","DOI":"10.1109\/TPAMI.2009.161","volume":"32","author":"Y Furukawa","year":"2009","unstructured":"Furukawa, Y., Ponce, J.: Accurate, Dense, and Robust multiview stereopsis. IEEE Trans. Pattern Anal. Mach. Intell. 32(8), 1362\u20131376 (2009)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1_CR24","doi-asserted-by":"crossref","unstructured":"Gao, Q., Xu, Q., Su, H., Neumann, U., Xu, Z.: Strivec: sparse tri-vector radiance fields. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 17569\u201317579 (2023)","DOI":"10.1109\/ICCV51070.2023.01611"},{"key":"1_CR25","doi-asserted-by":"crossref","unstructured":"Gu, X., Fan, Z., Zhu, S., Dai, Z., Tan, F., Tan, P.: Cascade cost volume for high-resolution multi-view stereo and stereo matching. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2495\u20132504 (2020)","DOI":"10.1109\/CVPR42600.2020.00257"},{"key":"1_CR26","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"1_CR27","unstructured":"Hong, Y., et al.: LRM: large reconstruction model for single image to 3D (2023)"},{"key":"1_CR28","unstructured":"Jiang, H., Jiang, Z., Zhao, Y., Huang, Q.: Leap: liberate sparse-view 3D modeling from camera poses. ArXiv 2310.01410 (2023)"},{"key":"1_CR29","doi-asserted-by":"crossref","unstructured":"Johari, M.M., Lepoittevin, Y., Fleuret, F.: GeoNeRF: generalizing nerf with geometry priors. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18365\u201318375 (2022)","DOI":"10.1109\/CVPR52688.2022.01782"},{"key":"1_CR30","doi-asserted-by":"crossref","unstructured":"Kerbl, B., Kopanas, G., Leimk\u00fchler, T., Drettakis, G.: 3D gaussian splatting for real-time radiance field rendering. ACM Trans. Graph. 42(4) (2023)","DOI":"10.1145\/3592433"},{"key":"1_CR31","unstructured":"Lefaudeux, B., et al.: xFormers: a modular and hackable transformer modelling library. https:\/\/github.com\/facebookresearch\/xformers (2022)"},{"key":"1_CR32","unstructured":"Li, J., et al.: Instant3D: fast text-to-3D with sparse-view generation and large reconstruction model (2023)"},{"key":"1_CR33","doi-asserted-by":"publisher","first-page":"328","DOI":"10.1007\/978-3-030-58601-0_20","volume-title":"Computer Vision \u2013 ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XIII","author":"K-E Lin","year":"2020","unstructured":"Lin, K.-E., et al.: Deep multi depth panoramas for view synthesis. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) Computer Vision \u2013 ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part XIII, pp. 328\u2013344. Springer International Publishing, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58601-0_20"},{"key":"1_CR34","first-page":"15651","volume":"33","author":"L Liu","year":"2020","unstructured":"Liu, L., Gu, J., Zaw Lin, K., Chua, T.S., Theobalt, C.: Neural sparse voxel fields. Adv. Neural. Inf. Process. Syst. 33, 15651\u201315663 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"issue":"4","key":"1_CR35","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3450626.3459863","volume":"40","author":"S Lombardi","year":"2021","unstructured":"Lombardi, S., Simon, T., Schwartz, G., Zollhoefer, M., Sheikh, Y., Saragih, J.: Mixture of volumetric primitives for efficient neural rendering. ACM Trans. Graph. (ToG) 40(4), 1\u201313 (2021)","journal-title":"ACM Trans. Graph. (ToG)"},{"key":"1_CR36","doi-asserted-by":"publisher","unstructured":"Long, X., Lin, C., Wang, P., Komura, T., Wang, W.: SparseNeuS: fast generalizable neural surface reconstruction from sparse views. In: European Conference on Computer Vision, pp. 210\u2013227. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-19824-3_13","DOI":"10.1007\/978-3-031-19824-3_13"},{"key":"1_CR37","unstructured":"Micikevicius, P., et\u00a0al.: Mixed precision training. In: International Conference on Learning Representations (2018)"},{"issue":"4","key":"1_CR38","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3306346.3322980","volume":"38","author":"B Mildenhall","year":"2019","unstructured":"Mildenhall, B., et al.: Local light field fusion: practical view synthesis with prescriptive sampling guidelines. ACM Trans. Graph. (TOG) 38(4), 1\u201314 (2019)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"1_CR39","doi-asserted-by":"crossref","unstructured":"Mildenhall, B., et al.: Local light field fusion: practical view synthesis with prescriptive sampling guidelines. ACM Trans. Graph. (TOG) (2019)","DOI":"10.1145\/3306346.3322980"},{"key":"1_CR40","doi-asserted-by":"crossref","unstructured":"Mildenhall, B., Srinivasan, P.P., Tancik, M., Barron, J.T., Ramamoorthi, R., Ng, R.: NeRF: representing scenes as neural radiance fields for view synthesis. In: ECCV (2020)","DOI":"10.1007\/978-3-030-58452-8_24"},{"issue":"4","key":"1_CR41","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3528223.3530127","volume":"41","author":"T M\u00fcller","year":"2022","unstructured":"M\u00fcller, T., Evans, A., Schied, C., Keller, A.: Instant neural graphics primitives with a multiresolution hash encoding. ACM Trans. Graph. (ToG) 41(4), 1\u201315 (2022)","journal-title":"ACM Trans. Graph. (ToG)"},{"key":"1_CR42","unstructured":"OpenAI: creating video from text (2024). https:\/\/openai.com\/sora"},{"key":"1_CR43","doi-asserted-by":"publisher","first-page":"523","DOI":"10.1007\/978-3-030-58580-8_31","volume-title":"Computer Vision \u2013 ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part III","author":"S Peng","year":"2020","unstructured":"Peng, S., Niemeyer, M., Mescheder, L., Pollefeys, M., Geiger, A.: Convolutional Occupancy Networks. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) Computer Vision \u2013 ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part III, pp. 523\u2013540. Springer International Publishing, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58580-8_31"},{"key":"1_CR44","doi-asserted-by":"publisher","unstructured":"XVII. On a new geometry of space. Philos. Trans. Royal Soc. London 155, 725\u2013791 (1865). https:\/\/doi.org\/10.1098\/rstl.1865.0017","DOI":"10.1098\/rstl.1865.0017"},{"key":"1_CR45","unstructured":"Podell, D., et al.: SDXL: improving latent diffusion models for high-resolution image synthesis. In: The Twelfth International Conference on Learning Representations (2023)"},{"key":"1_CR46","doi-asserted-by":"publisher","first-page":"143","DOI":"10.1007\/s11263-007-0086-4","volume":"78","author":"M Pollefeys","year":"2008","unstructured":"Pollefeys, M., et al.: Detailed real-time urban 3D reconstruction from video. Int. J. Comput. Vis. 78, 143\u2013167 (2008)","journal-title":"Int. J. Comput. Vis."},{"key":"1_CR47","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1023\/B:VISI.0000025798.50602.3a","volume":"59","author":"M Pollefeys","year":"2004","unstructured":"Pollefeys, M., et al.: Visual modeling with a hand-held camera. Int. J. Comput. Vis. 59, 207\u2013232 (2004)","journal-title":"Int. J. Comput. Vis."},{"key":"1_CR48","doi-asserted-by":"crossref","unstructured":"Schonberger, J.L., Frahm, J.M.: Structure-from-motion revisited. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4104\u20134113 (2016)","DOI":"10.1109\/CVPR.2016.445"},{"key":"1_CR49","doi-asserted-by":"crossref","unstructured":"Sch\u00f6nberger, J.L., Frahm, J.M.: Structure-from-motion revisited. In: Conference on Computer Vision and Pattern Recognition (CVPR) (2016)","DOI":"10.1109\/CVPR.2016.445"},{"key":"1_CR50","doi-asserted-by":"crossref","unstructured":"Sch\u00f6nberger, J.L., Zheng, E., Pollefeys, M., Frahm, J.M.: Pixelwise view selection for unstructured multi-view stereo. In: European Conference on Computer Vision (ECCV) (2016)","DOI":"10.1007\/978-3-319-46487-9_31"},{"key":"1_CR51","doi-asserted-by":"crossref","unstructured":"Shen, Z., Dai, Y., Rao, Z.: CFNet: cascade and fused cost volume for robust stereo matching. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13906\u201313915 (2021)","DOI":"10.1109\/CVPR46437.2021.01369"},{"key":"1_CR52","unstructured":"Shi, R., et al.: Zero123++: a single image to consistent multi-view diffusion base model (2023)"},{"key":"1_CR53","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"1_CR54","doi-asserted-by":"crossref","unstructured":"Snavely, N., Seitz, S.M., Szeliski, R.: Photo tourism: exploring photo collections in 3D. In: ACM Siggraph 2006 Papers, pp. 835\u2013846 (2006)","DOI":"10.1145\/1141911.1141964"},{"key":"1_CR55","doi-asserted-by":"publisher","unstructured":"Suhail, M., Esteves, C., Sigal, L., Makadia, A.: Generalizable patch-based neural rendering. In: European Conference on Computer Vision. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-19824-3_10","DOI":"10.1007\/978-3-031-19824-3_10"},{"key":"1_CR56","doi-asserted-by":"crossref","unstructured":"Suhail, M., Esteves, C., Sigal, L., Makadia, A.: Light field neural rendering. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8269\u20138279 (2022)","DOI":"10.1109\/CVPR52688.2022.00809"},{"key":"1_CR57","doi-asserted-by":"crossref","unstructured":"Sun, C., Sun, M., Chen, H.T.: Direct voxel grid optimization: super-fast convergence for radiance fields reconstruction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5459\u20135469 (2022)","DOI":"10.1109\/CVPR52688.2022.00538"},{"key":"1_CR58","doi-asserted-by":"crossref","unstructured":"Szymanowicz, S., Rupprecht, C., Vedaldi, A.: Splatter image: ultra-fast single-view 3D reconstruction. arXiv: (2023)","DOI":"10.1109\/CVPR52733.2024.00972"},{"key":"1_CR59","doi-asserted-by":"crossref","unstructured":"Tang, J., Chen, Z., Chen, X., Wang, T., Zeng, G., Liu, Z.: LGM: large multi-view gaussian model for high-resolution 3D content creation. arXiv preprint arXiv:2402.05054 (2024)","DOI":"10.1007\/978-3-031-73235-5_1"},{"key":"1_CR60","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"key":"1_CR61","unstructured":"Wang, P., et al.: PF-LRM: pose-free large reconstruction model for joint pose and shape prediction. arXiv preprint arXiv:2311.12024 (2023)"},{"key":"1_CR62","doi-asserted-by":"crossref","unstructured":"Wang, Q., et al.: IBRNet: learning multi-view image-based rendering. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4690\u20134699 (2021)","DOI":"10.1109\/CVPR46437.2021.00466"},{"key":"1_CR63","doi-asserted-by":"crossref","unstructured":"Wang, S., Leroy, V., Cabon, Y., Chidlovskii, B., Revaud, J.: DUSt3R: geometric 3D vision made easy. arXiv preprint arXiv:2312.14132 (2023)","DOI":"10.1109\/CVPR52733.2024.01956"},{"key":"1_CR64","doi-asserted-by":"crossref","unstructured":"Wiles, O., Gkioxari, G., Szeliski, R., Johnson, J.: SynSin: end-to-end view synthesis from a single image. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7467\u20137477 (2020)","DOI":"10.1109\/CVPR42600.2020.00749"},{"key":"1_CR65","doi-asserted-by":"crossref","unstructured":"Xu, Q., et al.: Point-NeRF: point-based neural radiance fields. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5438\u20135448 (2022)","DOI":"10.1109\/CVPR52688.2022.00536"},{"key":"1_CR66","unstructured":"Xu, Y., et al.: DMV3D: denoising multi-view diffusion using 3D large reconstruction model (2023)"},{"key":"1_CR67","doi-asserted-by":"crossref","unstructured":"Yao, Y., Luo, Z., Li, S., Fang, T., Quan, L.: MVSNet: depth inference for unstructured multi-view stereo. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 767\u2013783 (2018)","DOI":"10.1007\/978-3-030-01237-3_47"},{"key":"1_CR68","doi-asserted-by":"crossref","unstructured":"Yao, Y., Luo, Z., Li, S., Shen, T., Fang, T., Quan, L.: Recurrent MVSNet for high-resolution multi-view stereo depth inference. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5525\u20135534 (2019)","DOI":"10.1109\/CVPR.2019.00567"},{"key":"1_CR69","doi-asserted-by":"crossref","unstructured":"Yifan, W., Serena, F., Wu, S., \u00d6ztireli, C., Sorkine-Hornung, O.: Differentiable surface splatting for point-based geometry processing. ACM Trans. Graph. (Proc. ACM SIGGRAPH ASIA) 38(6) (2019)","DOI":"10.1145\/3355089.3356513"},{"key":"1_CR70","doi-asserted-by":"crossref","unstructured":"Yu, A., Ye, V., Tancik, M., Kanazawa, A.: pixelNeRF: neural radiance fields from one or few images. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4578\u20134587 (2021)","DOI":"10.1109\/CVPR46437.2021.00455"},{"key":"1_CR71","doi-asserted-by":"crossref","unstructured":"Zhang, K., et al.: ARF: artistic radiance fields (2022)","DOI":"10.1007\/978-3-031-19821-2_41"},{"key":"1_CR72","unstructured":"Zhang, K., Riegler, G., Snavely, N., Koltun, V.: Nerf++: analyzing and improving neural radiance fields. arXiv preprint arXiv:2010.07492 (2020)"},{"key":"1_CR73","doi-asserted-by":"crossref","unstructured":"Zhang, R., Isola, P., Efros, A.A., Shechtman, E., Wang, O.: The unreasonable effectiveness of deep features as a perceptual metric. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00068"},{"key":"1_CR74","doi-asserted-by":"crossref","unstructured":"Zhou, T., Tucker, R., Flynn, J., Fyffe, G., Snavely, N.: Stereo magnification: learning view synthesis using multiplane images. arXiv preprint arXiv:1805.09817 (2018)","DOI":"10.1145\/3197517.3201323"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72670-5_1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,29]],"date-time":"2024-09-29T07:15:47Z","timestamp":1727594147000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72670-5_1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9,30]]},"ISBN":["9783031726699","9783031726705"],"references-count":74,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72670-5_1","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,9,30]]},"assertion":[{"value":"30 September 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}