{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T16:02:49Z","timestamp":1774454569285,"version":"3.50.1"},"publisher-location":"Cham","reference-count":79,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031729690","type":"print"},{"value":"9783031729706","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,11,23]],"date-time":"2024-11-23T00:00:00Z","timestamp":1732320000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,23]],"date-time":"2024-11-23T00:00:00Z","timestamp":1732320000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72970-6_11","type":"book-chapter","created":{"date-parts":[[2024,11,22]],"date-time":"2024-11-22T10:49:48Z","timestamp":1732272588000},"page":"184-202","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["TexDreamer: Towards Zero-Shot High-Fidelity 3D Human Texture Generation"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0937-3340","authenticated-orcid":false,"given":"Yufei","family":"Liu","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5407-5150","authenticated-orcid":false,"given":"Junwei","family":"Zhu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6549-5257","authenticated-orcid":false,"given":"Junshu","family":"Tang","sequence":"additional","affiliation":[]},{"given":"Shijie","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Jiangning","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Weijian","family":"Cao","sequence":"additional","affiliation":[]},{"given":"Chengjie","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Yunsheng","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Dongjin","family":"Huang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,23]]},"reference":[{"key":"11_CR1","doi-asserted-by":"crossref","unstructured":"Alldieck, T., Magnor, M., Xu, W., Theobalt, C., Pons-Moll, G.: Video based reconstruction of 3D people models. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8387\u20138397 (2018)","DOI":"10.1109\/CVPR.2018.00875"},{"key":"11_CR2","unstructured":"AXYZ: 4D Scanned People Character Animation Software (2023). https:\/\/secure.axyz-design.com\/"},{"key":"11_CR3","doi-asserted-by":"crossref","unstructured":"Bhatnagar, B.L., Tiwari, G., Theobalt, C., Pons-Moll, G.: Multi-garment net: learning to dress 3D people from images. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 5420\u20135430 (2019)","DOI":"10.1109\/ICCV.2019.00552"},{"key":"11_CR4","unstructured":"Blender - a 3D modelling and rendering package (2023). https:\/\/www.blender.org\/"},{"key":"11_CR5","doi-asserted-by":"crossref","unstructured":"Cao, Y., Cao, Y.P., Han, K., Shan, Y., Wong, K.Y.K.: DreamAvatar: text-and-shape guided 3D human avatar generation via diffusion models. arXiv preprint arXiv:2304.00916 (2023)","DOI":"10.1109\/CVPR52733.2024.00097"},{"key":"11_CR6","unstructured":"Casas, D., Trinidad, M.C.: SMPLitex: a generative model and dataset for 3D human texture estimation from single image. arXiv preprint arXiv:2309.01855 (2023)"},{"key":"11_CR7","doi-asserted-by":"crossref","unstructured":"Cha, S., Seo, K., Ashtari, A., Noh, J.: Generating texture for 3D human avatar from a single image using sampling and refinement networks. In: Computer Graphics Forum, vol.\u00a042, pp. 385\u2013396. Wiley Online Library (2023)","DOI":"10.1111\/cgf.14769"},{"key":"11_CR8","doi-asserted-by":"crossref","unstructured":"Chang, S., Cho, J., Oh, S.: Texture generation using dual-domain feature flow with multi-view hallucinations. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol.\u00a036, pp. 203\u2013211 (2022)","DOI":"10.1609\/aaai.v36i1.19895"},{"key":"11_CR9","doi-asserted-by":"crossref","unstructured":"Chen, D.Z., Siddiqui, Y., Lee, H.Y., Tulyakov, S., Nie\u00dfner, M.: Text2Tex: text-driven texture synthesis via diffusion models. arXiv preprint arXiv:2303.11396 (2023)","DOI":"10.1109\/ICCV51070.2023.01701"},{"key":"11_CR10","doi-asserted-by":"crossref","unstructured":"Chen, R., Chen, Y., Jiao, N., Jia, K.: Fantasia3D: disentangling geometry and appearance for high-quality text-to-3D content creation. arXiv preprint arXiv:2303.13873 (2023)","DOI":"10.1109\/ICCV51070.2023.02033"},{"key":"11_CR11","doi-asserted-by":"crossref","unstructured":"Debevec, P.: Rendering synthetic objects into real scenes: bridging traditional and image-based graphics with global illumination and high dynamic range photography. In: ACM SIGGRAPH 2008 Classes, pp. 1\u201310 (2008)","DOI":"10.1145\/1401132.1401175"},{"key":"11_CR12","doi-asserted-by":"crossref","unstructured":"Feng, Y., Yang, J., Pollefeys, M., Black, M.J., Bolkart, T.: Capturing and animation of body and clothing from monocular video. In: SIGGRAPH Asia 2022 Conference Papers, pp.\u00a01\u20139 (2022)","DOI":"10.1145\/3550469.3555423"},{"key":"11_CR13","unstructured":"Free Stock Photos, Royalty Free Stock Images AMD Copyright Free Pictures: Pexels. https:\/\/www.pexels.com\/"},{"key":"11_CR14","unstructured":"Gal, R., et al.: An image is worth one word: personalizing text-to-image generation using textual inversion. arXiv preprint arXiv:2208.01618 (2022)"},{"key":"11_CR15","doi-asserted-by":"crossref","unstructured":"Grigorev, A., et al.: StylePeople: a generative model of fullbody human avatars. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5151\u20135160 (2021)","DOI":"10.1109\/CVPR46437.2021.00511"},{"key":"11_CR16","doi-asserted-by":"crossref","unstructured":"G\u00fcler, R.A., Neverova, N., Kokkinos, I.: DensePose: dense human pose estimation in the wild. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7297\u20137306 (2018)","DOI":"10.1109\/CVPR.2018.00762"},{"key":"11_CR17","doi-asserted-by":"crossref","unstructured":"Hang, T., et al.: Efficient diffusion training via min-snr weighting strategy. arXiv preprint arXiv:2303.09556 (2023)","DOI":"10.1109\/ICCV51070.2023.00684"},{"key":"11_CR18","doi-asserted-by":"crossref","unstructured":"Hong, F., Zhang, M., Pan, L., Cai, Z., Yang, L., Liu, Z.: AvatarCLIP: zero-shot text-driven generation and animation of 3D avatars. arXiv preprint arXiv:2205.08535 (2022)","DOI":"10.1145\/3528223.3530094"},{"key":"11_CR19","unstructured":"Hu, E.J., et al.: LoRa: low-rank adaptation of large language models. arXiv preprint arXiv:2106.09685 (2021)"},{"key":"11_CR20","doi-asserted-by":"crossref","unstructured":"Huang, Y., et al.: TeCH: text-guided reconstruction of lifelike clothed humans. In: International Conference on 3D Vision (3DV) (2024)","DOI":"10.1109\/3DV62453.2024.00152"},{"key":"11_CR21","doi-asserted-by":"crossref","unstructured":"Isola, P., Zhu, J.Y., Zhou, T., Efros, A.A.: Image-to-image translation with conditional adversarial networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1125\u20131134 (2017)","DOI":"10.1109\/CVPR.2017.632"},{"key":"11_CR22","doi-asserted-by":"crossref","unstructured":"Jain, A., Mildenhall, B., Barron, J.T., Abbeel, P., Poole, B.: Zero-shot text-guided object generation with dream fields. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 867\u2013876 (2022)","DOI":"10.1109\/CVPR52688.2022.00094"},{"key":"11_CR23","doi-asserted-by":"crossref","unstructured":"Jiang, B., Hong, Y., Bao, H., Zhang, J.: SelfRecon: self reconstruction your digital avatar from monocular video. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5605\u20135615 (2022)","DOI":"10.1109\/CVPR52688.2022.00552"},{"key":"11_CR24","doi-asserted-by":"crossref","unstructured":"Jiang, R., et al.: AvatarCraft: transforming text into neural human avatars with parameterized shape and pose control. In: 2023 IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 14325\u201314336 (2023). https:\/\/api.semanticscholar.org\/CorpusID:257834153","DOI":"10.1109\/ICCV51070.2023.01322"},{"issue":"4","key":"11_CR25","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3528223.3530104","volume":"41","author":"Y Jiang","year":"2022","unstructured":"Jiang, Y., Yang, S., Qiu, H., Wu, W., Loy, C.C., Liu, Z.: Text2Human: text-driven controllable human image generation. ACM Trans. Graph. (TOG) 41(4), 1\u201311 (2022)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"11_CR26","unstructured":"Kolotouros, N., Alldieck, T., Zanfir, A., Bazavan, E.G., Fieraru, M., Sminchisescu, C.: DreamHuman: animatable 3D avatars from text. arXiv preprint arXiv:2306.09329 (2023)"},{"key":"11_CR27","doi-asserted-by":"crossref","unstructured":"Lazova, V., Insafutdinov, E., Pons-Moll, G.: 360-degree textures of people in clothing from a single image. In: 2019 International Conference on 3D Vision (3DV), pp. 643\u2013653. IEEE (2019)","DOI":"10.1109\/3DV.2019.00076"},{"key":"11_CR28","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"590","DOI":"10.1007\/978-3-031-20065-6_34","volume-title":"Computer Vision \u2013 ECCV 2022","author":"Z Li","year":"2022","unstructured":"Li, Z., Liu, J., Zhang, Z., Xu, S., Yan, Y.: CLIFF: carrying location information in full frames into human pose and shape estimation. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022. LNCS, vol. 13665, pp. 590\u2013606. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-20065-6_34"},{"key":"11_CR29","doi-asserted-by":"crossref","unstructured":"Liao, T., et al.: TADA! Text to animatable digital avatars. In: International Conference on 3D Vision (3DV) (2024)","DOI":"10.1109\/3DV62453.2024.00150"},{"key":"11_CR30","doi-asserted-by":"crossref","unstructured":"Lin, C.H., et al.: Magic3D: high-resolution text-to-3D content creation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 300\u2013309 (2023)","DOI":"10.1109\/CVPR52729.2023.00037"},{"key":"11_CR31","doi-asserted-by":"crossref","unstructured":"Liu, W., Piao, Z., Min, J., Luo, W., Ma, L., Gao, S.: Liquid warping GAN: a unified framework for human motion imitation, appearance transfer and novel view synthesis. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 5904\u20135913 (2019)","DOI":"10.1109\/ICCV.2019.00600"},{"key":"11_CR32","doi-asserted-by":"crossref","unstructured":"Liu, Z., Luo, P., Qiu, S., Wang, X., Tang, X.: DeepFashion: powering robust clothes recognition and retrieval with rich annotations. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1096\u20131104 (2016)","DOI":"10.1109\/CVPR.2016.124"},{"key":"11_CR33","doi-asserted-by":"crossref","unstructured":"Loper, M., Mahmood, N., Romero, J., Pons-Moll, G., Black, M.J.: SMPL: a skinned multi-person linear model. In: Seminal Graphics Papers: Pushing the Boundaries, vol. 2, pp. 851\u2013866 (2023)","DOI":"10.1145\/3596711.3596800"},{"key":"11_CR34","doi-asserted-by":"crossref","unstructured":"Lorensen, W.E., Cline, H.E.: Marching cubes: a high resolution 3D surface construction algorithm. In: Seminal Graphics: Pioneering Efforts that Shaped the Field, pp. 347\u2013353 (1998)","DOI":"10.1145\/280811.281026"},{"key":"11_CR35","doi-asserted-by":"crossref","unstructured":"Ma, Q., et al.: Learning to dress 3D people in generative clothing. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6469\u20136478 (2020)","DOI":"10.1109\/CVPR42600.2020.00650"},{"key":"11_CR36","doi-asserted-by":"crossref","unstructured":"Mahmood, N., Ghorbani, N., Troje, N.F., Pons-Moll, G., Black, M.J.: AMASS: archive of motion capture as surface shapes. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 5442\u20135451 (2019)","DOI":"10.1109\/ICCV.2019.00554"},{"key":"11_CR37","doi-asserted-by":"crossref","unstructured":"McAuley, S., Hill, S., Hoffman, N., Gotanda, Y., Smits, B., Burley, B., Martinez, A.: Practical physically-based shading in film and game production. In: ACM SIGGRAPH 2012 Courses, pp.\u00a01\u20137 (2012)","DOI":"10.1145\/2343483.2343493"},{"key":"11_CR38","doi-asserted-by":"crossref","unstructured":"Metzer, G., Richardson, E., Patashnik, O., Giryes, R., Cohen-Or, D.: Latent-NeRF for shape-guided generation of 3D shapes and textures. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12663\u201312673 (2023)","DOI":"10.1109\/CVPR52729.2023.01218"},{"key":"11_CR39","doi-asserted-by":"crossref","unstructured":"Michel, O., Bar-On, R., Liu, R., Benaim, S., Hanocka, R.: Text2Mesh: text-driven neural stylization for meshes. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.01313"},{"key":"11_CR40","doi-asserted-by":"crossref","unstructured":"Mohammad\u00a0Khalid, N., Xie, T., Belilovsky, E., Popa, T.: CLIP-mesh: generating textured meshes from text using pretrained image-text models. In: SIGGRAPH Asia 2022 Conference Papers, pp.\u00a01\u20138 (2022)","DOI":"10.1145\/3550469.3555392"},{"issue":"4","key":"11_CR41","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3528223.3530127","volume":"41","author":"T M\u00fcller","year":"2022","unstructured":"M\u00fcller, T., Evans, A., Schied, C., Keller, A.: Instant neural graphics primitives with a multiresolution hash encoding. ACM Trans. Graph. (ToG) 41(4), 1\u201315 (2022)","journal-title":"ACM Trans. Graph. (ToG)"},{"key":"11_CR42","first-page":"27730","volume":"35","author":"L Ouyang","year":"2022","unstructured":"Ouyang, L., et al.: Training language models to follow instructions with human feedback. Adv. Neural. Inf. Process. Syst. 35, 27730\u201327744 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"11_CR43","unstructured":"Poole, B., Jain, A., Barron, J.T., Mildenhall, B.: DreamFusion: text-to-3D using 2D diffusion. arXiv preprint arXiv:2209.14988 (2022)"},{"key":"11_CR44","unstructured":"Radford, A., et\u00a0al.: Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763. PMLR (2021)"},{"key":"11_CR45","unstructured":"Renderpeople: Over 4,000 Scanned 3D People Models (2023). https:\/\/renderpeople.com\/"},{"key":"11_CR46","doi-asserted-by":"crossref","unstructured":"Richardson, E., Metzer, G., Alaluf, Y., Giryes, R., Cohen-Or, D.: Texture: text-guided texturing of 3D shapes. arXiv preprint arXiv:2302.01721 (2023)","DOI":"10.1145\/3588432.3591503"},{"key":"11_CR47","doi-asserted-by":"crossref","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10684\u201310695 (2022)","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"11_CR48","doi-asserted-by":"crossref","unstructured":"Ruiz, N., Li, Y., Jampani, V., Pritch, Y., Rubinstein, M., Aberman, K.: DreamBooth: fine tuning text-to-image diffusion models for subject-driven generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 22500\u201322510 (2023)","DOI":"10.1109\/CVPR52729.2023.02155"},{"key":"11_CR49","doi-asserted-by":"crossref","unstructured":"Saito, S., Simon, T., Saragih, J., Joo, H.: PIFuHD: multi-level pixel-aligned implicit function for high-resolution 3D human digitization. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 84\u201393 (2020)","DOI":"10.1109\/CVPR42600.2020.00016"},{"key":"11_CR50","doi-asserted-by":"crossref","unstructured":"Shen, K., et al.: X-avatar: expressive human avatars. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16911\u201316921 (2023)","DOI":"10.1109\/CVPR52729.2023.01622"},{"issue":"2","key":"11_CR51","doi-asserted-by":"publisher","first-page":"1581","DOI":"10.1109\/TPAMI.2022.3168569","volume":"45","author":"Z Su","year":"2022","unstructured":"Su, Z., Yu, T., Wang, Y., Liu, Y.: DeepCloth: neural garment representation for shape and style editing. IEEE Trans. Pattern Anal. Mach. Intell. 45(2), 1581\u20131593 (2022)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR52","doi-asserted-by":"crossref","unstructured":"Svitov, D., Gudkov, D., Bashirov, R., Lempitsky, V.: DINAR: diffusion inpainting of neural textures for one-shot human avatars. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7062\u20137072 (2023)","DOI":"10.1109\/ICCV51070.2023.00650"},{"key":"11_CR53","doi-asserted-by":"crossref","unstructured":"Tang, J., et al.: Make-it-3D: high-fidelity 3D creation from a single image with diffusion prior, pp. 22819\u201322829 (2023)","DOI":"10.1109\/ICCV51070.2023.02086"},{"key":"11_CR54","doi-asserted-by":"crossref","unstructured":"Tang, J., et al.: Make-it-vivid: dressing your animatable biped cartoon characters from text (2024)","DOI":"10.1109\/CVPR52733.2024.00597"},{"key":"11_CR55","unstructured":"Treedy\u2019s: 3D body scanning technology (2023). https:\/\/www.treedys.com\/"},{"key":"11_CR56","unstructured":"Twindom: Full Body 3D Scanners for 3D Printed Figurines, 3D Portraits and 3D Selfies (2023). https:\/\/web.twindom.com\/"},{"key":"11_CR57","doi-asserted-by":"crossref","unstructured":"Varol, G., et al.: Learning from synthetic humans. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 109\u2013117 (2017)","DOI":"10.1109\/CVPR.2017.492"},{"key":"11_CR58","doi-asserted-by":"crossref","unstructured":"Wang, J., Zhong, Y., Li, Y., Zhang, C., Wei, Y.: Re-identification supervised texture generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11846\u201311856 (2019)","DOI":"10.1109\/CVPR.2019.01212"},{"key":"11_CR59","unstructured":"Wang, P., Liu, L., Liu, Y., Theobalt, C., Komura, T., Wang, W.: NeUS: learning neural implicit surfaces by volume rendering for multi-view reconstruction. arXiv preprint arXiv:2106.10689 (2021)"},{"issue":"4","key":"11_CR60","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang, Z., Bovik, A.C., Sheikh, H.R., Simoncelli, E.P.: Image quality assessment: from error visibility to structural similarity. IEEE Trans. Image Process. 13(4), 600\u2013612 (2004)","journal-title":"IEEE Trans. Image Process."},{"key":"11_CR61","doi-asserted-by":"crossref","unstructured":"Xiu, Y., Yang, J., Cao, X., Tzionas, D., Black, M.J.: ECON: explicit clothed humans optimized via normal integration. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 512\u2013523 (2023)","DOI":"10.1109\/CVPR52729.2023.00057"},{"key":"11_CR62","doi-asserted-by":"crossref","unstructured":"Xu, C., et al.: High-fidelity generalized emotional talking face generation with multi-modal emotion space learning. In: CVPR (2023)","DOI":"10.1109\/CVPR52729.2023.00639"},{"issue":"9","key":"11_CR63","first-page":"4490","volume":"44","author":"X Xu","year":"2021","unstructured":"Xu, X., Chen, H., Moreno-Noguer, F., Jeni, L.A., De la Torre, F.: 3D human pose, shape and texture from low-resolution images and videos. IEEE Trans. Pattern Anal. Mach. Intell. 44(9), 4490\u20134504 (2021)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR64","doi-asserted-by":"crossref","unstructured":"Xu, X., Loy, C.C.: 3D human texture estimation from a single image with transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 13849\u201313858 (2021)","DOI":"10.1109\/ICCV48922.2021.01359"},{"key":"11_CR65","doi-asserted-by":"crossref","unstructured":"Yang, Z., Zeng, A., Yuan, C., Li, Y.: Effective whole-body pose estimation with two-stages distillation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 4210\u20134220 (2023)","DOI":"10.1109\/ICCVW60793.2023.00455"},{"key":"11_CR66","doi-asserted-by":"crossref","unstructured":"Yang, Z., et al.: SynBody: synthetic dataset with layered human models for 3D human perception and modeling (2023)","DOI":"10.1109\/ICCV51070.2023.01855"},{"key":"11_CR67","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"173","DOI":"10.1007\/978-3-031-20062-5_11","volume-title":"Computer Vision \u2013 ECCV 2022","author":"K Youwang","year":"2022","unstructured":"Youwang, K., Ji-Yeon, K., Oh, T.H.: CLIP-actor: text-driven recommendation and stylization for animating human meshes. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022. LNCS, vol. 13663, pp. 173\u2013191. Springer, Cham (2022)"},{"key":"11_CR68","unstructured":"Yu, F., Seff, A., Zhang, Y., Song, S., Funkhouser, T., Xiao, J.: LSUN: construction of a large-scale image dataset using deep learning with humans in the loop. arXiv preprint arXiv:1506.03365 (2015)"},{"key":"11_CR69","doi-asserted-by":"crossref","unstructured":"Yu, T., Zheng, Z., Guo, K., Liu, P., Dai, Q., Liu, Y.: Function4D: real-time human volumetric capture from very sparse consumer RGBD sensors. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5746\u20135756 (2021)","DOI":"10.1109\/CVPR46437.2021.00569"},{"key":"11_CR70","unstructured":"Zeng, Y., Lu, Y., Ji, X., Yao, Y., Zhu, H., Cao, X.: AvatarBooth: high-quality and customizable 3D human avatar generation. arXiv preprint arXiv:2306.09864 (2023)"},{"key":"11_CR71","doi-asserted-by":"crossref","unstructured":"Zhang, C., Pujades, S., Black, M.J., Pons-Moll, G.: Detailed, accurate, human shape estimation from clothed 3D scan sequences. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4191\u20134200 (2017)","DOI":"10.1109\/CVPR.2017.582"},{"key":"11_CR72","doi-asserted-by":"crossref","unstructured":"Zhang, J., et al.: FreeNet: multi-identity face reenactment. In: CVPR (2020)","DOI":"10.1109\/CVPR42600.2020.00537"},{"key":"11_CR73","doi-asserted-by":"crossref","unstructured":"Zhang, L., Rao, A., Agrawala, M.: Adding conditional control to text-to-image diffusion models. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3836\u20133847 (2023)","DOI":"10.1109\/ICCV51070.2023.00355"},{"key":"11_CR74","doi-asserted-by":"crossref","unstructured":"Zhang, R., Isola, P., Efros, A.A., Shechtman, E., Wang, O.: The unreasonable effectiveness of deep features as a perceptual metric. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 586\u2013595 (2018)","DOI":"10.1109\/CVPR.2018.00068"},{"key":"11_CR75","first-page":"14326","volume":"33","author":"F Zhao","year":"2020","unstructured":"Zhao, F., Liao, S., Zhang, K., Shao, L.: Human parsing based texture transfer from single image to 3D human via cross-view consistency. Adv. Neural. Inf. Process. Syst. 33, 14326\u201314337 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"11_CR76","unstructured":"Zheng, K., He, X., Wang, X.E.: MiniGPT-5: interleaved vision-and-language generation via generative vokens. arXiv preprint arXiv:2310.02239 (2023)"},{"key":"11_CR77","doi-asserted-by":"crossref","unstructured":"Zheng, L., Shen, L., Tian, L., Wang, S., Wang, J., Tian, Q.: Scalable person re-identification: a benchmark. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1116\u20131124 (2015)","DOI":"10.1109\/ICCV.2015.133"},{"issue":"6","key":"11_CR78","doi-asserted-by":"publisher","first-page":"3170","DOI":"10.1109\/TPAMI.2021.3050505","volume":"44","author":"Z Zheng","year":"2021","unstructured":"Zheng, Z., Yu, T., Liu, Y., Dai, Q.: PaMIR: parametric model-conditioned implicit representation for image-based human reconstruction. IEEE Trans. Pattern Anal. Mach. Intell. 44(6), 3170\u20133184 (2021)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR79","doi-asserted-by":"crossref","unstructured":"Zheng, Z., Yu, T., Wei, Y., Dai, Q., Liu, Y.: DeepHuman: 3D human reconstruction from a single image. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7739\u20137749 (2019)","DOI":"10.1109\/ICCV.2019.00783"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72970-6_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,22]],"date-time":"2024-11-22T11:14:16Z","timestamp":1732274056000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72970-6_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,23]]},"ISBN":["9783031729690","9783031729706"],"references-count":79,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72970-6_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,23]]},"assertion":[{"value":"23 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}