{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T18:16:19Z","timestamp":1762539379086,"version":"build-2065373602"},"reference-count":75,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2025,12,1]],"date-time":"2025-12-01T00:00:00Z","timestamp":1764547200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,12,1]],"date-time":"2025-12-01T00:00:00Z","timestamp":1764547200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,12,1]],"date-time":"2025-12-01T00:00:00Z","timestamp":1764547200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Visual. Comput. Graphics"],"published-print":{"date-parts":[[2025,12]]},"DOI":"10.1109\/tvcg.2025.3613388","type":"journal-article","created":{"date-parts":[[2025,9,23]],"date-time":"2025-09-23T17:25:25Z","timestamp":1758648325000},"page":"10711-10722","source":"Crossref","is-referenced-by-count":0,"title":["SketchRefiner: Text-Guided Sketch Refinement Through Latent Diffusion Models"],"prefix":"10.1109","volume":"31","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4675-0398","authenticated-orcid":false,"given":"Yingjie","family":"Tian","sequence":"first","affiliation":[{"name":"School of Economics and Management, University of Chinese Academy of Sciences, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-1660-9379","authenticated-orcid":false,"given":"Minghao","family":"Liu","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-8883-8610","authenticated-orcid":false,"given":"Haoran","family":"Jiang","sequence":"additional","affiliation":[{"name":"School of Mathematical Sciences, University of Chinese Academy of Sciences, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9525-9060","authenticated-orcid":false,"given":"Yunbin","family":"Tu","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9607-3639","authenticated-orcid":false,"given":"Duo","family":"Su","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, University of Chinese Academy of Sciences, Beijing, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1038\/nature13422"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3148853"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2022.102461"},{"key":"ref4","first-page":"23894","article-title":"Zero-shot 3D drug design by sketching and generating","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Long"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1111\/j.1756-8765.2011.01149.x"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v24i2.18827"},{"article-title":"Sketch-to-architecture: Generative AI-aided architectural design","year":"2024","author":"Li","key":"ref7"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.4324\/9780080878775"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1145\/2897824.2925954"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"ref11","first-page":"36479","article-title":"Photorealistic text-to-image diffusion models with deep language understanding","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Saharia"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00355"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19790-1_21"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00776"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2018.2866090"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/WACV51458.2022.00102"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00662"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2016.2597830"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096348"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-26293-7_4"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2020.2968433"},{"key":"ref22","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Radford"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3528223.3530068"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00383"},{"key":"ref25","first-page":"15869","article-title":"DiffSketcher: Text guided vector sketch synthesis through latent diffusion models","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Xing"},{"article-title":"Sketchdreamer: Interactive text-augmented creative sketch ideation","year":"2023","author":"Qu","key":"ref26"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3414685.3417871"},{"article-title":"DreamFusion: Text-to-3D using 2D diffusion","year":"2022","author":"Poole","key":"ref28"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3197517.3201314"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3450626.3459777"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/s11432-018-9694-8"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/3592130"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1145\/3132703"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1145\/3414685.3417784"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1145\/2897824.2925946"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/j.cag.2016.02.003"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/2601097.2601202"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2023.3346995"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413720"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2020.3040900"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA57147.2024.10610618"},{"article-title":"A neural representation of sketch drawings","year":"2017","author":"Ha","key":"ref42"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2019.00154"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-016-0963-9"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00824"},{"key":"ref46","first-page":"6840","article-title":"Denoising diffusion probabilistic models","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Ho"},{"article-title":"Denoising diffusion implicit models","year":"2020","author":"Song","key":"ref47"},{"article-title":"Score-based generative modeling through stochastic differential equations","year":"2020","author":"Song","key":"ref48"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/3588432.3591560"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/WACV56688.2023.00404"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1145\/3654777.3676444"},{"article-title":"Difffacesketch: High-fidelity face image synthesis with sketch-guided latent diffusion model","year":"2023","author":"Peng","key":"ref52"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP49359.2023.10222365"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1111\/cgf.15247"},{"article-title":"Sketchknitter: Vectorized sketch generation with diffusion models","volume-title":"Proc. 11th Int. Conf. Learn. Representations","author":"Wang","key":"ref55"},{"article-title":"Representative feature extraction during diffusion process for sketch extraction with one example","year":"2024","author":"Yun","key":"ref56"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00820"},{"article-title":"Sketch2NeRF: Multi-view sketch-guided text-to-3D generation","year":"2024","author":"Chen","key":"ref58"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612489"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr52733.2024.00414"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72946-1_19"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2021.3084944"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00726"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01583"},{"key":"ref65","first-page":"5207","article-title":"Clipdraw: Exploring text-to-drawing synthesis through language-image encoders","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Frans"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2022\/688"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25326"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00190"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1145\/3658204"},{"key":"ref70","first-page":"2256","article-title":"Deep unsupervised learning using nonequilibrium thermodynamics","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Sohl-Dickstein"},{"article-title":"Classifier-free diffusion guidance","year":"2022","author":"Ho","key":"ref71"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.23915\/distill.00012"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00068"},{"article-title":"A neural representation of sketch drawings","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Ha","key":"ref74"},{"key":"ref75","article-title":"Benchmark for compositional text-to-image synthesis","volume-title":"Proc. 35th Conf. Neural Inf. Process. Syst. Datasets Benchmarks Track (Round 1)","volume":"1","author":"Park"}],"container-title":["IEEE Transactions on Visualization and Computer Graphics"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/2945\/11231102\/11176130.pdf?arnumber=11176130","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,7]],"date-time":"2025-11-07T18:10:27Z","timestamp":1762539027000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11176130\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12]]},"references-count":75,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/tvcg.2025.3613388","relation":{},"ISSN":["1077-2626","1941-0506","2160-9306"],"issn-type":[{"type":"print","value":"1077-2626"},{"type":"electronic","value":"1941-0506"},{"type":"electronic","value":"2160-9306"}],"subject":[],"published":{"date-parts":[[2025,12]]}}}