{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T03:28:20Z","timestamp":1777865300057,"version":"3.51.4"},"reference-count":49,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/5011000018091","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["2023YFF0725001"],"award-info":[{"award-number":["2023YFF0725001"]}],"id":[{"id":"10.13039\/5011000018091","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/iccv51701.2025.02349","type":"proceedings-article","created":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T19:45:49Z","timestamp":1777491949000},"page":"25325-25334","source":"Crossref","is-referenced-by-count":0,"title":["MagicCity: Geometry-Aware 3D City Generation from Satellite Imagery with Multi-View Consistency"],"prefix":"10.1109","author":[{"given":"Xingbo","family":"Yao","sequence":"first","affiliation":[{"name":"Hong Kong University of Science and Technology (Guangzhou)"}]},{"given":"Xuanmin","family":"Wang","sequence":"additional","affiliation":[{"name":"Tianjin University"}]},{"given":"Hao","family":"Wu","sequence":"additional","affiliation":[{"name":"Hong Kong University of Science and Technology (Guangzhou)"}]},{"given":"Chengliang","family":"Ping","sequence":"additional","affiliation":[{"name":"Hong Kong University of Science and Technology (Guangzhou)"}]},{"given":"Doudou","family":"Zhang","sequence":"additional","affiliation":[{"name":"Hong Kong University of Science and Technology (Guangzhou)"}]},{"given":"Hui","family":"Xiong","sequence":"additional","affiliation":[{"name":"Hong Kong University of Science and Technology (Guangzhou)"}]}],"member":"263","reference":[{"key":"ref1","author":"Bi\u0144kowski","year":"2018","journal-title":"Demystifying mmd gans"},{"key":"ref2","author":"Blattmann","year":"2023","journal-title":"Stable video diffusion: Scaling latent video diffusion models to large datasets"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW63382.2024.00753"},{"key":"ref4","first-page":"16123","article-title":"Efficient geometry-aware 3d generative adversarial networks","volume-title":"In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","author":"Eric","year":"2022"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3641519.3657513"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/cvprw67362.2025.00187"},{"key":"ref7","author":"Deng","year":"2024","journal-title":"Citycraft: A real crafter for 3d city generation"},{"key":"ref8","article-title":"Magicdrive: Street view generation with diverse 3d geometry control","volume-title":"In The Twelfth International Conference on Learning Representations","author":"Gao","year":"2023"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.52202\/079017-2403"},{"issue":"5","key":"ref10","first-page":"1","volume":"2","author":"Geiger","year":"2015","journal-title":"The kitti vision benchmark suite"},{"key":"ref11","article-title":"Gans trained by a two time-scale update rule converge to a local nash equilibrium","volume":"30","author":"Heusel","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00482"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00926"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1117\/12.3018858"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3592433"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3292390.3292397"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72904-1_13"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01669"},{"key":"ref19","volume-title":"Crossviewdiff: A cross-view diffusion model for satellite-to-street view synthesis","author":"Li","year":"2024"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00297"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00682"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.02085"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20074-8_6"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52733.2024.00951"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2012.2214050"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2012.2227726"},{"key":"ref27","author":"Oquab","year":"2023","journal-title":"Dinov2: Learning robust visual features without supervision"},{"key":"ref28","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"In International conference on machine learning","author":"Radford","year":"2021"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3019967"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.445"},{"key":"ref32","author":"Shang","year":"2024","journal-title":"Urbanworld: An urban world model for 3d city generation"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/WACVW52041.2021.00022"},{"key":"ref34","author":"Shi","year":"2023","journal-title":"Mvdream: Multi-view diffusion for 3d generation"},{"key":"ref35","author":"Sun","year":"2024","journal-title":"Dimensionx: Create any 3d and 4d scenes from a single image with controllable video diffusion"},{"key":"ref36","author":"Wang","year":"2023","journal-title":"Imagedream: Image-prompt multi-view diffusion for 3d generation"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02036"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00923"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52734.2025.00573"},{"key":"ref40","first-page":"349","article-title":"Geospecific view generation geometry-context aware high-resolution ground view inference from satellite views","volume-title":"In European Conference on Computer Vision","author":"Xu","year":"2024"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.00676"},{"key":"ref42","article-title":"Cogvideox: Text-to-video diffusion models with an expert transformer","author":"Yang","year":"2024","journal-title":"CoRR"},{"key":"ref43","author":"Ye","year":"2023","journal-title":"Ipadapter: Text compatible image prompt adapter for text-toimage diffusion models"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2025.3613256"},{"key":"ref45","author":"Zhang","year":"2024","journal-title":"Cityx: Controllable procedural content generation for unbounded 3d cities"},{"key":"ref46","author":"Zhou","year":"2024","journal-title":"Controlcity: A multimodal diffusion model based approach for accurate geospatial data generation and urban morphology analysis"},{"key":"ref47","author":"Zhou","year":"2024","journal-title":"Motion control for enhanced complex action video generation"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72658-3_19"},{"key":"ref49","author":"Zhou","year":"2020","journal-title":"Holicity: A city-scale data platform for learning holistic 3d structures"}],"event":{"name":"2025 IEEE\/CVF International Conference on Computer Vision (ICCV)","location":"Honolulu, HI, USA","start":{"date-parts":[[2025,10,19]]},"end":{"date-parts":[[2025,10,25]]}},"container-title":["2025 IEEE\/CVF International Conference on Computer Vision (ICCV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11443115\/11443287\/11444927.pdf?arnumber=11444927","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T06:12:40Z","timestamp":1777529560000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11444927\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":49,"URL":"https:\/\/doi.org\/10.1109\/iccv51701.2025.02349","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}