{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T16:00:05Z","timestamp":1774022405530,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":57,"publisher":"ACM","funder":[{"name":"EuroHPC","award":["EHPC-AI-2024A02-031"],"award-info":[{"award-number":["EHPC-AI-2024A02-031"]}]},{"name":"BAGEP Award"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,8,10]]},"DOI":"10.1145\/3721238.3730636","type":"proceedings-article","created":{"date-parts":[[2025,7,23]],"date-time":"2025-07-23T08:42:43Z","timestamp":1753260163000},"page":"1-11","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["3D Stylization via Large Reconstruction Model"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-4404-0517","authenticated-orcid":false,"given":"Ipek","family":"Oztas","sequence":"first","affiliation":[{"name":"Bilkent University, Ankara, Turkiye"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2307-9052","authenticated-orcid":false,"given":"Duygu","family":"Ceylan","sequence":"additional","affiliation":[{"name":"Adobe Research, London, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2014-6325","authenticated-orcid":false,"given":"Aysegul","family":"Dundar","sequence":"additional","affiliation":[{"name":"Bilkent University, Ankara, Turkiye"}]}],"member":"320","published-online":{"date-parts":[[2025,7,27]]},"reference":[{"key":"e_1_3_3_3_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/3641519.3657423"},{"key":"e_1_3_3_3_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00602"},{"key":"e_1_3_3_3_4_1","unstructured":"Duygu Ceylan Valentin Deschaintre Thibault Groueix Rosalie Martin Chun-Hao Huang Romain Rouffet Vladimir Kim and Ga\u00ebtan Lassagne. 2024. MatAtlas: Text-driven Consistent Geometry Texturing and Material Assignment. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2404.02899 (2024)."},{"key":"e_1_3_3_3_5_1","first-page":"9609","volume-title":"Advances in Neural Information Processing Systems","author":"Chen Wenzheng","year":"2019","unstructured":"Wenzheng Chen, Huan Ling, Jun Gao, Edward Smith, Jaakko Lehtinen, Alec Jacobson, and Sanja Fidler. 2019. Learning to predict 3d objects with an interpolation-based differentiable renderer. In Advances in Neural Information Processing Systems. 9609\u20139619."},{"key":"e_1_3_3_3_6_1","unstructured":"Zilong Chen Yikai Wang Feng Wang Zhengyi Wang and Huaping Liu. 2024. V3D: Video Diffusion Models are Effective 3D Generators. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.06738 (2024)."},{"key":"e_1_3_3_3_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00840"},{"key":"e_1_3_3_3_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9811809"},{"key":"e_1_3_3_3_9_1","doi-asserted-by":"crossref","unstructured":"Aysegul Dundar Jun Gao Andrew Tao and Bryan Catanzaro. 2023a. Fine detailed texture learning for 3d meshes with generative models. IEEE Transactions on Pattern Analysis and Machine Intelligence 45 12 (2023) 14563\u201314574.","DOI":"10.1109\/TPAMI.2023.3319429"},{"key":"e_1_3_3_3_10_1","doi-asserted-by":"crossref","unstructured":"Aysegul Dundar Jun Gao Andrew Tao and Bryan Catanzaro. 2023b. Progressive learning of 3d reconstruction network from 2d gan data. IEEE Transactions on Pattern Analysis and Machine Intelligence 46 2 (2023) 793\u2013804.","DOI":"10.1109\/TPAMI.2023.3324806"},{"key":"e_1_3_3_3_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00444"},{"key":"e_1_3_3_3_12_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72684-2_11"},{"key":"e_1_3_3_3_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3680528.3687643"},{"key":"e_1_3_3_3_14_1","unstructured":"Rinon Gal Yuval Alaluf Yuval Atzmon Or Patashnik Amit\u00a0H Bermano Gal Chechik and Daniel Cohen-Or. 2022. An image is worth one word: Personalizing text-to-image generation using textual inversion. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2208.01618 (2022)."},{"key":"e_1_3_3_3_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.265"},{"key":"e_1_3_3_3_16_1","unstructured":"Shubham Goel Angjoo Kanazawa and Jitendra Malik. 2020. Shape and Viewpoint without Keypoints. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2007.10982 (2020)."},{"key":"e_1_3_3_3_17_1","unstructured":"Qiyuan He Jinghao Wang Ziwei Liu and Angela Yao. 2024. AID: Attention Interpolation of Text-to-Image Diffusion. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.17924 (2024)."},{"key":"e_1_3_3_3_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00752"},{"key":"e_1_3_3_3_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00457"},{"key":"e_1_3_3_3_20_1","unstructured":"Yicong Hong Kai Zhang Jiuxiang Gu Sai Bi Yang Zhou Difan Liu Feng Liu Kalyan Sunkavalli Trung Bui and Hao Tan. 2023. Lrm: Large reconstruction model for single image to 3d. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2311.04400 (2023)."},{"key":"e_1_3_3_3_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.167"},{"key":"e_1_3_3_3_22_1","unstructured":"Jaeseok Jeong Junho Kim Yunjey Choi Gayoung Lee and Youngjung Uh. 2024. Visual Style Prompting with Swapping Self-Attention. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2402.12974 (2024)."},{"key":"e_1_3_3_3_23_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01267-0_23"},{"key":"e_1_3_3_3_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00622"},{"key":"e_1_3_3_3_25_1","doi-asserted-by":"publisher","DOI":"10.1111\/cgf.15016"},{"key":"e_1_3_3_3_26_1","doi-asserted-by":"crossref","unstructured":"\u00c1ron\u00a0Samuel Kov\u00e1cs Pedro Hermosilla and Renata\u00a0G. Raidou. 2024. G-Style: Stylized Gaussian Splatting. Computer Graphics Forum 43 7 (2024). https:\/\/doi.org\/10.1111\/cgf.15259","DOI":"10.1111\/cgf.15259"},{"key":"e_1_3_3_3_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.618"},{"key":"e_1_3_3_3_28_1","unstructured":"Jiahao Li Hao Tan Kai Zhang Zexiang Xu Fujun Luan Yinghao Xu Yicong Hong Kalyan Sunkavalli Greg Shakhnarovich and Sai Bi. 2023. Instant3d: Fast text-to-3d with sparse-view generation and large reconstruction model. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2311.06214 (2023)."},{"key":"e_1_3_3_3_29_1","unstructured":"Xueting Li Sifei Liu Kihwan Kim Shalini De\u00a0Mello Varun Jampani Ming-Hsuan Yang and Jan Kautz. 2020. Self-supervised Single-view 3D Reconstruction via Semantic Consistency. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2003.06473 (2020)."},{"key":"e_1_3_3_3_30_1","unstructured":"Yijun Li Chen Fang Jimei Yang Zhaowen Wang Xin Lu and Ming-Hsuan Yang. 2017. Universal style transfer via feature transforms. Advances in neural information processing systems 30 (2017)."},{"key":"e_1_3_3_3_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00806"},{"key":"e_1_3_3_3_32_1","doi-asserted-by":"crossref","unstructured":"Kunhao Liu Fangneng Zhan Muyu Xu Christian Theobalt Ling Shao and Shijian Lu. 2024b. StyleGaussian: Instant 3D Style Transfer with Gaussian Splatting. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.07807 (2024).","DOI":"10.1145\/3681758.3698002"},{"key":"e_1_3_3_3_33_1","unstructured":"Minghua Liu Chao Xu Haian Jin Linghao Chen Mukund Varma\u00a0T Zexiang Xu and Hao Su. 2024a. One-2-3-45: Any single image to 3d mesh in 45 seconds without per-shape optimization. Advances in Neural Information Processing Systems 36 (2024)."},{"key":"e_1_3_3_3_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00853"},{"key":"e_1_3_3_3_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00605"},{"key":"e_1_3_3_3_36_1","doi-asserted-by":"crossref","unstructured":"Ben Mildenhall Pratul\u00a0P Srinivasan Matthew Tancik Jonathan\u00a0T Barron Ravi Ramamoorthi and Ren Ng. 2021. Nerf: Representing scenes as neural radiance fields for view synthesis. Commun. ACM 65 1 (2021) 99\u2013106.","DOI":"10.1145\/3503250"},{"key":"e_1_3_3_3_37_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i5.28226"},{"key":"e_1_3_3_3_38_1","doi-asserted-by":"crossref","unstructured":"Sai Raj\u00a0Kishore Perla Yizhi Wang Ali Mahdavi-Amiri and Hao Zhang. 2024. EASI-Tex: Edge-Aware Mesh Texturing from Single Image. ACM Transactions on Graphics (Proceedings of SIGGRAPH) 43 4 Article 40 (2024). https:\/\/doi.org\/10.1145\/3658222","DOI":"10.1145\/3658222"},{"key":"e_1_3_3_3_39_1","first-page":"8821","volume-title":"International conference on machine learning","author":"Ramesh Aditya","year":"2021","unstructured":"Aditya Ramesh, Mikhail Pavlov, Gabriel Goh, Scott Gray, Chelsea Voss, Alec Radford, Mark Chen, and Ilya Sutskever. 2021. Zero-shot text-to-image generation. In International conference on machine learning. Pmlr, 8821\u20138831."},{"key":"e_1_3_3_3_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"e_1_3_3_3_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02155"},{"key":"e_1_3_3_3_42_1","unstructured":"Ruoxi Shi Hansheng Chen Zhuoyang Zhang Minghua Liu Chao Xu Xinyue Wei Linghao Chen Chong Zeng and Hao Su. 2023. Zero123++: a single image to consistent multi-view diffusion base model. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2310.15110 (2023)."},{"key":"e_1_3_3_3_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV57701.2024.00714"},{"key":"e_1_3_3_3_44_1","doi-asserted-by":"crossref","unstructured":"Wei\u00a0Ren Tan Chee\u00a0Seng Chan Hernan\u00a0E Aguirre and Kiyoshi Tanaka. 2018. Improved ArtGAN for conditional synthesis of natural image and artwork. IEEE Transactions on Image Processing 28 1 (2018) 394\u2013409.","DOI":"10.1109\/TIP.2018.2866698"},{"key":"e_1_3_3_3_45_1","doi-asserted-by":"crossref","unstructured":"Jiaxiang Tang Zhaoxi Chen Xiaokang Chen Tengfei Wang Gang Zeng and Ziwei Liu. 2024. LGM: Large Multi-View Gaussian Model for High-Resolution 3D Content Creation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2402.05054 (2024).","DOI":"10.1007\/978-3-031-73235-5_1"},{"key":"e_1_3_3_3_46_1","unstructured":"Haofan Wang Matteo Spinelli Qixun Wang Xu Bai Zekui Qin and Anthony Chen. 2024. Instantstyle: Free lunch towards style-preserving in text-to-image generation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2404.02733 (2024)."},{"key":"e_1_3_3_3_47_1","unstructured":"Zhouxia Wang Xintao Wang Liangbin Xie Zhongang Qi Ying Shan Wenping Wang and Ping Luo. 2023. Styleadapter: A single-pass lora-free model for stylized image generation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2309.01770 (2023)."},{"key":"e_1_3_3_3_48_1","unstructured":"Xinyue Wei Kai Zhang Sai Bi Hao Tan Fujun Luan Valentin Deschaintre Kalyan Sunkavalli Hao Su and Zexiang Xu. 2024. MeshLRM: Large Reconstruction Model for High-Quality Mesh. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2404.12385 (2024)."},{"key":"e_1_3_3_3_49_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00084"},{"key":"e_1_3_3_3_50_1","unstructured":"Jiale Xu Weihao Cheng Yiming Gao Xintao Wang Shenghua Gao and Ying Shan. 2024a. Instantmesh: Efficient 3d mesh generation from a single image with sparse-view large reconstruction models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2404.07191 (2024)."},{"key":"e_1_3_3_3_51_1","unstructured":"Yinghao Xu Zifan Shi Wang Yifan Sida Peng Ceyuan Yang Yujun Shen and Wetzstein Gordon. 2024b. GRM: Large Gaussian Reconstruction Model for Efficient 3D Reconstruction and Generation. arxiv:https:\/\/arXiv.org\/abs\/2403.14621 (2024)."},{"key":"e_1_3_3_3_52_1","unstructured":"Hu Ye Jun Zhang Sibo Liu Xiao Han and Wei Yang. 2023. Ip-adapter: Text compatible image prompt adapter for text-to-image diffusion models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2308.06721 (2023)."},{"key":"e_1_3_3_3_53_1","unstructured":"Ahmet\u00a0Burak Yildirim Mustafa\u00a0Utku Aydogdu Duygu Ceylan and Aysegul Dundar. 2025. MD-ProjTex: Texturing 3D Shapes with Multi-Diffusion Projection. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2504.02762 (2025)."},{"key":"e_1_3_3_3_54_1","unstructured":"Wangbo Yu Jinbo Xing Li Yuan Wenbo Hu Xiaoyu Li Zhipeng Huang Xiangjun Gao Tien-Tsin Wong Ying Shan and Yonghong Tian. 2024. ViewCrafter: Taming Video Diffusion Models for High-fidelity Novel View Synthesis. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2409.02048 (2024)."},{"key":"e_1_3_3_3_55_1","doi-asserted-by":"crossref","unstructured":"Kai Zhang Sai Bi Hao Tan Yuanbo Xiangli Nanxuan Zhao Kalyan Sunkavalli and Zexiang Xu. 2024. GS-LRM: Large Reconstruction Model for 3D Gaussian Splatting. European Conference on Computer Vision (2024).","DOI":"10.1007\/978-3-031-72670-5_1"},{"key":"e_1_3_3_3_56_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19821-2_41"},{"key":"e_1_3_3_3_57_1","doi-asserted-by":"publisher","DOI":"10.1145\/3528233.3530736"},{"key":"e_1_3_3_3_58_1","unstructured":"Shihao Zhao Dongdong Chen Yen-Chun Chen Jianmin Bao Shaozhe Hao Lu Yuan and Kwan-Yee\u00a0K Wong. 2024. Uni-controlnet: All-in-one control to text-to-image diffusion models. Advances in Neural Information Processing Systems 36 (2024)."}],"event":{"name":"SIGGRAPH Conference Papers '25: Special Interest Group on Computer Graphics and Interactive Techniques Conference Conference Papers","location":"Vancouver BC Canada","acronym":"SIGGRAPH Conference Papers '25","sponsor":["SIGGRAPH ACM Special Interest Group on Computer Graphics and Interactive Techniques"]},"container-title":["Proceedings of the Special Interest Group on Computer Graphics and Interactive Techniques Conference Conference Papers"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3721238.3730636","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T15:02:29Z","timestamp":1774018949000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3721238.3730636"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,27]]},"references-count":57,"alternative-id":["10.1145\/3721238.3730636","10.1145\/3721238"],"URL":"https:\/\/doi.org\/10.1145\/3721238.3730636","relation":{},"subject":[],"published":{"date-parts":[[2025,7,27]]},"assertion":[{"value":"2025-07-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}