{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T09:24:38Z","timestamp":1780392278731,"version":"3.54.1"},"publisher-location":"Cham","reference-count":76,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031726576","type":"print"},{"value":"9783031726583","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,10,2]],"date-time":"2024-10-02T00:00:00Z","timestamp":1727827200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,10,2]],"date-time":"2024-10-02T00:00:00Z","timestamp":1727827200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72658-3_19","type":"book-chapter","created":{"date-parts":[[2024,10,2]],"date-time":"2024-10-02T03:32:37Z","timestamp":1727839957000},"page":"324-342","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":52,"title":["DreamScene360: Unconstrained Text-to-3D Scene Generation with\u00a0Panoramic Gaussian Splatting"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9018-7539","authenticated-orcid":false,"given":"Shijie","family":"Zhou","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8302-7465","authenticated-orcid":false,"given":"Zhiwen","family":"Fan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8474-3095","authenticated-orcid":false,"given":"Dejia","family":"Xu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-6333-239X","authenticated-orcid":false,"given":"Haoran","family":"Chang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9610-0350","authenticated-orcid":false,"given":"Pradyumna","family":"Chari","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-2370-8510","authenticated-orcid":false,"given":"Tejas","family":"Bharadwaj","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6387-7024","authenticated-orcid":false,"given":"Suya","family":"You","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2050-5693","authenticated-orcid":false,"given":"Zhangyang","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2444-2503","authenticated-orcid":false,"given":"Achuta","family":"Kadambi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2024,10,2]]},"reference":[{"key":"19_CR1","unstructured":"Armandpour, M., Zheng, H., Sadeghian, A., Sadeghian, A., Zhou, M.: Re-imagine the negative prompt algorithm: transform 2d diffusion into 3d, alleviate janus problem and beyond. arXiv preprint arXiv:2304.04968 (2023)"},{"key":"19_CR2","unstructured":"Bai, J., Huang, L., Guo, J., Gong, W., Li, Y., Guo, Y.: 360-gs: layout-guided panoramic gaussian splatting for indoor roaming. arXiv preprint arXiv:2402.00763 (2024)"},{"key":"19_CR3","unstructured":"Bar-Tal, O., Yariv, L., Lipman, Y., Dekel, T.: Multidiffusion: fusing diffusion paths for controlled image generation (2023)"},{"key":"19_CR4","unstructured":"Berger, M., et al.: State of the art in surface reconstruction from point clouds. In: 35th Annual Conference of the European Association for Computer Graphics, Eurographics 2014-State of the Art Reports. No.\u00a0CONF, The Eurographics Association (2014)"},{"key":"19_CR5","doi-asserted-by":"crossref","unstructured":"Bhat, S.F., Mitra, N.J., Wonka, P.: Loosecontrol: lifting controlnet for generalized depth conditioning. arXiv preprint arXiv:2312.03079 (2023)","DOI":"10.1145\/3641519.3657525"},{"key":"19_CR6","doi-asserted-by":"crossref","unstructured":"Bian, W., Wang, Z., Li, K., Bian, J.W., Prisacariu, V.A.: Nope-nerf: optimising neural radiance field with no pose prior. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4160\u20134169 (2023)","DOI":"10.1109\/CVPR52729.2023.00405"},{"key":"19_CR7","unstructured":"Chung, J., Lee, S., Nam, H., Lee, J., Lee, K.M.: Luciddreamer: domain-free generation of 3d gaussian splatting scenes. arXiv preprint arXiv:2311.13384 (2023)"},{"key":"19_CR8","doi-asserted-by":"crossref","unstructured":"Deng, C., et\u00a0al.: Nerdi: single-view nerf synthesis with language-guided diffusion as general image priors. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 20637\u201320647 (2023)","DOI":"10.1109\/CVPR52729.2023.01977"},{"key":"19_CR9","first-page":"8780","volume":"34","author":"P Dhariwal","year":"2021","unstructured":"Dhariwal, P., Nichol, A.: Diffusion models beat gans on image synthesis. Adv. Neural. Inf. Process. Syst. 34, 8780\u20138794 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"19_CR10","unstructured":"Fan, Z., Wang, K., Wen, K., Zhu, Z., Xu, D., Wang, Z.: Lightgaussian: unbounded 3d gaussian compression with 15x reduction and 200+ fps. arXiv preprint arXiv:2311.17245 (2023)"},{"key":"19_CR11","unstructured":"Fang, C., Hu, X., Luo, K., Tan, P.: Ctrl-room: controllable text-to-3d room meshes generation with layout constraints. arXiv preprint arXiv:2310.03602 (2023)"},{"key":"19_CR12","doi-asserted-by":"crossref","unstructured":"Fridovich-Keil, S., Yu, A., Tancik, M., Chen, Q., Recht, B., Kanazawa, A.: Plenoxels: radiance fields without neural networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5501\u20135510 (2022)","DOI":"10.1109\/CVPR52688.2022.00542"},{"key":"19_CR13","doi-asserted-by":"crossref","unstructured":"Gao, G., Liu, W., Chen, A., Geiger, A., Sch\u00f6lkopf, B.: Graphdreamer: compositional 3d scene synthesis from scene graphs. arXiv preprint arXiv:2312.00093 (2023)","DOI":"10.1109\/CVPR52733.2024.02012"},{"key":"19_CR14","unstructured":"Geng, Z., Pokle, A., Kolter, J.Z.: One-step diffusion distillation via deep equilibrium models. Adv. Neural Inf. Process. Syst. 36 (2024)"},{"issue":"11","key":"19_CR15","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1145\/3422622","volume":"63","author":"I Goodfellow","year":"2020","unstructured":"Goodfellow, I., et al.: Generative adversarial networks. Commun. ACM 63(11), 139\u2013144 (2020)","journal-title":"Commun. ACM"},{"issue":"4","key":"19_CR16","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3197517.3201384","volume":"37","author":"P Hedman","year":"2018","unstructured":"Hedman, P., Kopf, J.: Instant 3d photography. ACM Trans. Graph. (TOG) 37(4), 1\u201312 (2018)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"19_CR17","unstructured":"H\u00e9naff, O.J., et al.: Object discovery and representation networks. arXiv preprint arXiv:2203.08777 (2022)"},{"key":"19_CR18","first-page":"6840","volume":"33","author":"J Ho","year":"2020","unstructured":"Ho, J., Jain, A., Abbeel, P.: Denoising diffusion probabilistic models. Adv. Neural. Inf. Process. Syst. 33, 6840\u20136851 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"19_CR19","unstructured":"Ho, J., Salimans, T.: Classifier-free diffusion guidance. arXiv preprint arXiv:2207.12598 (2022)"},{"key":"19_CR20","doi-asserted-by":"crossref","unstructured":"H\u00f6llein, L., Cao, A., Owens, A., Johnson, J., Nie\u00dfner, M.: Text2room: extracting textured 3d meshes from 2d text-to-image models. arXiv preprint arXiv:2303.11989 (2023)","DOI":"10.1109\/ICCV51070.2023.00727"},{"key":"19_CR21","unstructured":"Hu, E.J., et al.: Lora: low-rank adaptation of large language models. arXiv preprint arXiv:2106.09685 (2021)"},{"key":"19_CR22","unstructured":"Jun, H., Nichol, A.: Shap-e: generating conditional 3d implicit functions. arXiv preprint arXiv:2305.02463 (2023)"},{"key":"19_CR23","doi-asserted-by":"crossref","unstructured":"Karnewar, A., Vedaldi, A., Novotny, D., Mitra, N.J.: Holodiffusion: training a 3d diffusion model using 2d images. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18423\u201318433 (2023)","DOI":"10.1109\/CVPR52729.2023.01767"},{"key":"19_CR24","doi-asserted-by":"crossref","unstructured":"Karras, T., Laine, S., Aila, T.: A style-based generator architecture for generative adversarial networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4401\u20134410 (2019)","DOI":"10.1109\/CVPR.2019.00453"},{"issue":"4","key":"19_CR25","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3592433","volume":"42","author":"B Kerbl","year":"2023","unstructured":"Kerbl, B., Kopanas, G., Leimk\u00fchler, T., Drettakis, G.: 3d gaussian splatting for real-time radiance field rendering. ACM Trans. Graph. (ToG) 42(4), 1\u201314 (2023)","journal-title":"ACM Trans. Graph. (ToG)"},{"key":"19_CR26","doi-asserted-by":"crossref","unstructured":"Kopanas, G., Philip, J., Leimk\u00fchler, T., Drettakis, G.: Point-based neural rendering with per-view optimization. In: Computer Graphics Forum, vol.\u00a040, pp. 29\u201343. Wiley Online Library (2021)","DOI":"10.1111\/cgf.14339"},{"key":"19_CR27","doi-asserted-by":"crossref","unstructured":"Lee, J.C., Rho, D., Sun, X., Ko, J.H., Park, E.: Compact 3d gaussian representation for radiance field. arXiv preprint arXiv:2311.13681 (2023)","DOI":"10.1109\/CVPR52733.2024.02052"},{"key":"19_CR28","unstructured":"Li, R., et al.: 4k4dgen: panoramic 4d generation at 4k resolution. arXiv preprint arXiv:2406.13527 (2024)"},{"key":"19_CR29","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"638","DOI":"10.1007\/978-3-030-20893-6_40","volume-title":"Computer Vision \u2013 ACCV 2018","author":"W Li","year":"2019","unstructured":"Li, W., Hosseini\u00a0Jafari, O., Rother, C.: Deep object co-segmentation. In: Jawahar, C.V., Li, H., Mori, G., Schindler, K. (eds.) ACCV 2018. LNCS, vol. 11363, pp. 638\u2013653. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-20893-6_40"},{"key":"19_CR30","unstructured":"Lin, Y., et al.: Componerf: text-guided multi-object compositional nerf with editable 3d scene layout. arXiv preprint arXiv:2303.13843 (2023)"},{"key":"19_CR31","doi-asserted-by":"crossref","unstructured":"Lombardi, S., Simon, T., Saragih, J., Schwartz, G., Lehrmann, A., Sheikh, Y.: Neural volumes: learning dynamic renderable volumes from images. arXiv preprint arXiv:1906.07751 (2019)","DOI":"10.1145\/3306346.3323020"},{"key":"19_CR32","unstructured":"Mao, W., Cao, Y.P., Liu, J.W., Xu, Z., Shou, M.Z.: Showroom3d: text to high-quality 3d room generation using 3d priors. arXiv preprint arXiv:2312.13324 (2023)"},{"key":"19_CR33","doi-asserted-by":"crossref","unstructured":"Meng, C., et al.: On distillation of guided diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14297\u201314306 (2023)","DOI":"10.1109\/CVPR52729.2023.01374"},{"key":"19_CR34","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1007\/978-3-030-58452-8_24","volume-title":"Computer Vision \u2013 ECCV 2020","author":"B Mildenhall","year":"2020","unstructured":"Mildenhall, B., Srinivasan, P.P., Tancik, M., Barron, J.T., Ramamoorthi, R., Ng, R.: NeRF: representing scenes as neural radiance fields for view synthesis. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12346, pp. 405\u2013421. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_24"},{"issue":"1","key":"19_CR35","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1145\/3503250","volume":"65","author":"B Mildenhall","year":"2021","unstructured":"Mildenhall, B., Srinivasan, P.P., Tancik, M., Barron, J.T., Ramamoorthi, R., Ng, R.: Nerf: representing scenes as neural radiance fields for view synthesis. Commun. ACM 65(1), 99\u2013106 (2021)","journal-title":"Commun. ACM"},{"issue":"12","key":"19_CR36","doi-asserted-by":"publisher","first-page":"4695","DOI":"10.1109\/TIP.2012.2214050","volume":"21","author":"A Mittal","year":"2012","unstructured":"Mittal, A., Moorthy, A.K., Bovik, A.C.: No-reference image quality assessment in the spatial domain. IEEE Trans. Image Process. 21(12), 4695\u20134708 (2012)","journal-title":"IEEE Trans. Image Process."},{"issue":"3","key":"19_CR37","doi-asserted-by":"publisher","first-page":"209","DOI":"10.1109\/LSP.2012.2227726","volume":"20","author":"A Mittal","year":"2012","unstructured":"Mittal, A., Soundararajan, R., Bovik, A.C.: Making a \u201ccompletely blind\" image quality analyzer. IEEE Signal Process. Lett. 20(3), 209\u2013212 (2012)","journal-title":"IEEE Signal Process. Lett."},{"key":"19_CR38","doi-asserted-by":"crossref","unstructured":"Morgenstern, W., Barthel, F., Hilsmann, A., Eisert, P.: Compact 3d scene representation via self-organizing gaussian grids. arXiv preprint arXiv:2312.13299 (2023)","DOI":"10.1007\/978-3-031-73013-9_2"},{"key":"19_CR39","doi-asserted-by":"crossref","unstructured":"M\u00fcller, T., Evans, A., Schied, C., Keller, A.: Instant neural graphics primitives with a multiresolution hash encoding. arXiv preprint arXiv:2201.05989 (2022)","DOI":"10.1145\/3528223.3530127"},{"key":"19_CR40","unstructured":"Navaneet, K., Meibodi, K.P., Koohpayegani, S.A., Pirsiavash, H.: Compact3d: compressing gaussian splat radiance field models with vector quantization. arXiv preprint arXiv:2311.18159 (2023)"},{"key":"19_CR41","doi-asserted-by":"crossref","unstructured":"Nguyen-Phuoc, T., Li, C., Theis, L., Richardt, C., Yang, Y.L.: Hologan: unsupervised learning of 3d representations from natural images. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7588\u20137597 (2019)","DOI":"10.1109\/ICCV.2019.00768"},{"key":"19_CR42","doi-asserted-by":"crossref","unstructured":"Niedermayr, S., Stumpfegger, J., Westermann, R.: Compressed 3d gaussian splatting for accelerated novel view synthesis. arXiv preprint arXiv:2401.02436 (2023)","DOI":"10.1109\/CVPR52733.2024.00985"},{"key":"19_CR43","unstructured":"Oquab, M., et\u00a0al.: Dinov2: learning robust visual features without supervision. arXiv preprint arXiv:2304.07193 (2023)"},{"key":"19_CR44","unstructured":"Ouyang, H., Heal, K., Lombardi, S., Sun, T.: Text2immersion: generative immersive scene with 3d gaussians. arXiv preprint arXiv:2312.09242 (2023)"},{"key":"19_CR45","doi-asserted-by":"crossref","unstructured":"Po, R., Wetzstein, G.: Compositional 3d scene generation using locally conditioned diffusion. arXiv preprint arXiv:2303.12218 (2023)","DOI":"10.1109\/3DV62453.2024.00026"},{"key":"19_CR46","unstructured":"Poole, B., Jain, A., Barron, J.T., Mildenhall, B.: Dreamfusion: text-to-3d using 2d diffusion. arXiv preprint arXiv:2209.14988 (2022)"},{"key":"19_CR47","unstructured":"Radford, A., et\u00a0al.: Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763. PMLR (2021)"},{"key":"19_CR48","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., Chu, C., Chen, M.: Hierarchical text-conditional image generation with clip latents, 1(2), 3. arXiv preprint arXiv:2204.06125 (2022)"},{"key":"19_CR49","doi-asserted-by":"crossref","unstructured":"Ranftl, R., Bochkovskiy, A., Koltun, V.: Vision transformers for dense prediction. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 12179\u201312188 (2021)","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"19_CR50","doi-asserted-by":"crossref","unstructured":"Rey-Area, M., Yuan, M., Richardt, C.: 360monodepth: high-resolution 360deg monocular depth estimation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3762\u20133772 (2022)","DOI":"10.1109\/CVPR52688.2022.00374"},{"key":"19_CR51","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10684\u201310695 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"19_CR52","unstructured":"Saharia, C., et al.: Photorealistic text-to-image diffusion models with deep language understanding. In: Oh, A.H., Agarwal, A., Belgrave, D., Cho, K. (eds.) Advances in Neural Information Processing Systems (2022). https:\/\/openreview.net\/forum?id=08Yk-n5l2Al"},{"key":"19_CR53","first-page":"36479","volume":"35","author":"C Saharia","year":"2022","unstructured":"Saharia, C., et al.: Photorealistic text-to-image diffusion models with deep language understanding. Adv. Neural. Inf. Process. Syst. 35, 36479\u201336494 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"19_CR54","unstructured":"Salimans, T., Ho, J.: Progressive distillation for fast sampling of diffusion models. arXiv preprint arXiv:2202.00512 (2022)"},{"key":"19_CR55","doi-asserted-by":"crossref","unstructured":"Schonberger, J.L., Frahm, J.M.: Structure-from-motion revisited. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4104\u20134113 (2016)","DOI":"10.1109\/CVPR.2016.445"},{"key":"19_CR56","unstructured":"Song, J., Meng, C., Ermon, S.: Denoising diffusion implicit models. arXiv preprint arXiv:2010.02502 (2020)"},{"key":"19_CR57","doi-asserted-by":"crossref","unstructured":"Song, L., et al.: Roomdreamer: text-driven 3d indoor scene synthesis with coherent geometry and texture. arXiv preprint arXiv:2305.11337 (2023)","DOI":"10.1145\/3581783.3611800"},{"key":"19_CR58","unstructured":"Tang, J., Ren, J., Zhou, H., Liu, Z., Zeng, G.: Dreamgaussian: generative gaussian splatting for efficient 3d content creation. arXiv preprint arXiv:2309.16653 (2023)"},{"key":"19_CR59","doi-asserted-by":"crossref","unstructured":"Tumanyan, N., Bar-Tal, O., Bagon, S., Dekel, T.: Splicing vit features for semantic appearance transfer. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10748\u201310757 (2022)","DOI":"10.1109\/CVPR52688.2022.01048"},{"key":"19_CR60","unstructured":"Vilesov, A., Chari, P., Kadambi, A.: Cg3d: compositional generation for text-to-3d via gaussian splatting. arXiv preprint arXiv:2311.17907 (2023)"},{"key":"19_CR61","doi-asserted-by":"crossref","unstructured":"Wang, G., Wang, P., Chen, Z., Wang, W., Loy, C.C., Liu, Z.: Perf: panoramic neural radiance field from a single panorama. arXiv preprint arXiv:2310.16831 (2023)","DOI":"10.1109\/TPAMI.2024.3387307"},{"key":"19_CR62","doi-asserted-by":"crossref","unstructured":"Wang, H., Xiang, X., Fan, Y., Xue, J.H.: Customizing 360-degree panoramas through text-to-image diffusion models. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 4933\u20134943 (2024)","DOI":"10.1109\/WACV57701.2024.00486"},{"key":"19_CR63","doi-asserted-by":"crossref","unstructured":"Wang, H., Du, X., Li, J., Yeh, R.A., Shakhnarovich, G.: Score jacobian chaining: Lifting pretrained 2d diffusion models for 3d generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12619\u201312629 (2023)","DOI":"10.1109\/CVPR52729.2023.01214"},{"key":"19_CR64","unstructured":"Wang, Z., et al.: Prolificdreamer: high-fidelity and diverse text-to-3d generation with variational score distillation. arXiv preprint arXiv:2305.16213 (2023)"},{"key":"19_CR65","unstructured":"Wu, H., et\u00a0al.: Q-align: teaching lmms for visual scoring via discrete text-defined levels. arXiv preprint arXiv:2312.17090 (2023)"},{"key":"19_CR66","unstructured":"Xiong, H., Muttukuru, S., Upadhyay, R., Chari, P., Kadambi, A.: Sparsegs: real-time 360$$\\{$$deg$$\\}$$ sparse view synthesis using gaussian splatting. arXiv preprint arXiv:2312.00206 (2023)"},{"key":"19_CR67","doi-asserted-by":"publisher","unstructured":"Xu, D., Jiang, Y., Wang, P., Fan, Z., Shi, H., Wang, Z.: Sinnerf: training neural radiance fields on complex scenes from a single image. In: Computer Vision\u2013ECCV 2022: 17th European Conference, Tel Aviv, Israel, 23\u201327 October 2022, Proceedings, Part XXII, pp. 736\u2013753. Springer, Heidelberg (2022). https:\/\/doi.org\/10.1007\/978-3-031-20047-2_42","DOI":"10.1007\/978-3-031-20047-2_42"},{"key":"19_CR68","doi-asserted-by":"crossref","unstructured":"Xu, D., Jiang, Y., Wang, P., Fan, Z., Wang, Y., Wang, Z.: Neurallift-360: lifting an in-the-wild 2d photo to a 3d object with 360deg views. arXiv preprint arXiv:2211.16431 (2022)","DOI":"10.1109\/CVPR52729.2023.00435"},{"key":"19_CR69","doi-asserted-by":"crossref","unstructured":"Yang, Z., et al.: Idea2img: iterative self-refinement with gpt-4v (ision) for automatic image design and generation. arXiv preprint arXiv:2310.08541 (2023)","DOI":"10.1007\/978-3-031-72920-1_10"},{"key":"19_CR70","doi-asserted-by":"crossref","unstructured":"Yu, H.X., et\u00a0al.: Wonderjourney: going from anywhere to everywhere. arXiv preprint arXiv:2312.03884 (2023)","DOI":"10.1109\/CVPR52733.2024.00636"},{"key":"19_CR71","doi-asserted-by":"crossref","unstructured":"Zhang, C., Chen, T.: Efficient feature extraction for 2d\/3d objects in mesh representation. In: Proceedings 2001 International Conference on Image Processing (Cat. No. 01CH37205), vol.\u00a03, pp. 935\u2013938. IEEE (2001)","DOI":"10.1109\/ICIP.2001.958278"},{"key":"19_CR72","doi-asserted-by":"crossref","unstructured":"Zhang, J., Li, X., Wan, Z., Wang, C., Liao, J.: Text2nerf: text-driven 3d scene generation with neural radiance fields. IEEE Trans. Visualization Comput. Graph. (2024)","DOI":"10.1109\/TVCG.2024.3361502"},{"key":"19_CR73","doi-asserted-by":"crossref","unstructured":"Zhang, L., Rao, A., Agrawala, M.: Adding conditional control to text-to-image diffusion models. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3836\u20133847 (2023)","DOI":"10.1109\/ICCV51070.2023.00355"},{"key":"19_CR74","doi-asserted-by":"crossref","unstructured":"Zheng, G., Zhou, X., Li, X., Qi, Z., Shan, Y., Li, X.: Layoutdiffusion: controllable diffusion model for layout-to-image generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 22490\u201322499 (2023)","DOI":"10.1109\/CVPR52729.2023.02154"},{"key":"19_CR75","doi-asserted-by":"crossref","unstructured":"Zhou, S., et al.: Feature 3dgs: supercharging 3d gaussian splatting to enable distilled feature fields. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 21676\u201321685 (2024)","DOI":"10.1109\/CVPR52733.2024.02048"},{"key":"19_CR76","doi-asserted-by":"crossref","unstructured":"Zhu, Z., Fan, Z., Jiang, Y., Wang, Z.: FSGS: real-time few-shot view synthesis using gaussian splatting. arXiv preprint arXiv:2312.00451 (2023)","DOI":"10.1007\/978-3-031-72933-1_9"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72658-3_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,28]],"date-time":"2024-11-28T23:54:10Z","timestamp":1732838050000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72658-3_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,2]]},"ISBN":["9783031726576","9783031726583"],"references-count":76,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72658-3_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,10,2]]},"assertion":[{"value":"2 October 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}