{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T10:29:57Z","timestamp":1762338597014,"version":"3.40.3"},"publisher-location":"Cham","reference-count":44,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031729393"},{"type":"electronic","value":"9783031729409"}],"license":[{"start":{"date-parts":[[2024,11,17]],"date-time":"2024-11-17T00:00:00Z","timestamp":1731801600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,17]],"date-time":"2024-11-17T00:00:00Z","timestamp":1731801600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72940-9_7","type":"book-chapter","created":{"date-parts":[[2024,11,16]],"date-time":"2024-11-16T20:43:03Z","timestamp":1731789783000},"page":"109-125","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["PAV: Personalized Head Avatar from\u00a0Unstructured Video Collection"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2918-5603","authenticated-orcid":false,"given":"Akin","family":"Caliskan","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0002-5270-6120","authenticated-orcid":false,"given":"Berkay","family":"Kicanaoglu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2509-8230","authenticated-orcid":false,"given":"Hyeongwoo","family":"Kim","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,17]]},"reference":[{"key":"7_CR1","doi-asserted-by":"crossref","unstructured":"Athar, S., Xu, Z., Sunkavalli, K., Shechtman, E., Shu, Z.: Rignerf: fully controllable neural 3d portraits. In: Proceedings of the IEEE\/CVF conference on Computer Vision and Pattern Recognition, pp. 20364\u201320373 (2022)","DOI":"10.1109\/CVPR52688.2022.01972"},{"issue":"6","key":"7_CR2","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3130800.3130818","volume":"36","author":"H Averbuch-Elor","year":"2017","unstructured":"Averbuch-Elor, H., Cohen-Or, D., Kopf, J., Cohen, M.F.: Bringing portraits to life. ACM Trans. Graph. 36(6), 1\u201313 (2017)","journal-title":"ACM Trans. Graph."},{"key":"7_CR3","doi-asserted-by":"crossref","unstructured":"Bai, Z., et\u00a0al.: Learning personalized high quality volumetric head avatars from monocular RGB videos. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16890\u201316900 (2023)","DOI":"10.1109\/CVPR52729.2023.01620"},{"key":"7_CR4","doi-asserted-by":"crossref","unstructured":"B\u00fchler, M.C., Meka, A., Li, G., Beeler, T., Hilliges, O.: Varitex: variational neural face textures. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 13890\u201313899 (2021)","DOI":"10.1109\/ICCV48922.2021.01363"},{"key":"7_CR5","doi-asserted-by":"crossref","unstructured":"Chen, C., O\u2019Toole, M., Bharaj, G., Garrido, P.: Implicit neural head synthesis via controllable local deformation fields. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 416\u2013426 (2023)","DOI":"10.1109\/CVPR52729.2023.00048"},{"issue":"10","key":"7_CR6","doi-asserted-by":"publisher","first-page":"547","DOI":"10.1145\/360349.360354","volume":"19","author":"JH Clark","year":"1976","unstructured":"Clark, J.H.: Hierarchical geometric models for visible surface algorithms. Commun. ACM 19(10), 547\u2013554 (1976)","journal-title":"Commun. ACM"},{"key":"7_CR7","doi-asserted-by":"crossref","unstructured":"Deng, J., Guo, J., Zhou, Y., Yu, J., Kotsia, I., Zafeiriou, S.: Retinaface: single-stage dense face localisation in the wild. arXiv preprint arXiv:1905.00641 (2019)","DOI":"10.1109\/CVPR42600.2020.00525"},{"key":"7_CR8","unstructured":"Ding, K., Ma, K., Wang, S., Simoncelli, E.P.: Image Quality Assessment: Unifying Structure and Texture Similarity. In: TPAMI (2022)"},{"key":"7_CR9","doi-asserted-by":"crossref","unstructured":"Egger, B., et al.: 3D morphable face models-past, present, and future. ACM Trans. Graph. 39(5), 1\u201338 (2020)","DOI":"10.1145\/3395208"},{"key":"7_CR10","doi-asserted-by":"crossref","unstructured":"Gafni, G., Thies, J., Zollh\u00f6fer, M., Nie\u00dfner, M.: Dynamic neural radiance fields for monocular 4D facial avatar reconstruction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 8649\u20138658 (2021)","DOI":"10.1109\/CVPR46437.2021.00854"},{"issue":"6","key":"7_CR11","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3550454.3555501","volume":"41","author":"X Gao","year":"2022","unstructured":"Gao, X., Zhong, C., Xiang, J., Hong, Y., Guo, Y., Zhang, J.: Reconstructing personalized semantic facial nerf models from monocular video. ACM Trans. Graph. 41(6), 1\u201312 (2022)","journal-title":"ACM Trans. Graph."},{"key":"7_CR12","doi-asserted-by":"crossref","unstructured":"Garrido, P., Valgaerts, L., Rehmsen, O., Thormahlen, T., Perez, P., Theobalt, C.: Automatic face reenactment. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4217\u20134224 (2014)","DOI":"10.1109\/CVPR.2014.537"},{"key":"7_CR13","doi-asserted-by":"crossref","unstructured":"Garrido, P., et al.: Vdub: modifying face video of actors for plausible visual alignment to a dubbed audio track. In: Computer Graphics Forum, vol.\u00a034, pp. 193\u2013204. Wiley Online Library (2015)","DOI":"10.1111\/cgf.12552"},{"key":"7_CR14","doi-asserted-by":"crossref","unstructured":"Grassal, P.W., Prinzler, M., Leistner, T., Rother, C., Nie\u00dfner, M., Thies, J.: Neural head avatars from monocular RGB videos. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18653\u201318664 (2022)","DOI":"10.1109\/CVPR52688.2022.01810"},{"key":"7_CR15","unstructured":"Heusel, M., Ramsauer, H., Unterthiner, T., Nessler, B., Hochreiter, S.: Gans trained by a two time-scale update rule converge to a local nash equilibrium. Adv. Neural Inf. Process. Syst. 30 (2017)"},{"key":"7_CR16","doi-asserted-by":"crossref","unstructured":"Kim, H., et al.: Deep video portraits. ACM Trans. Graph. 37(4), 1\u201314 (2018)","DOI":"10.1145\/3197517.3201283"},{"key":"7_CR17","unstructured":"Kingma, D.P., Ba, J.: Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"issue":"4","key":"7_CR18","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3528223.3530177","volume":"41","author":"Z Kuang","year":"2022","unstructured":"Kuang, Z., Olszewski, K., Chai, M., Huang, Z., Achlioptas, P., Tulyakov, S.: Neroic: neural rendering of objects from online image collections. ACM Trans. Graph. 41(4), 1\u201312 (2022)","journal-title":"ACM Trans. Graph."},{"key":"7_CR19","doi-asserted-by":"publisher","unstructured":"Li, T., Bolkart, T., Black, M.J., Li, H., Romero, J.: Learning a model of facial shape and expression from 4D scans. ACM Trans. Graph. (Proc. SIGGRAPH Asia) 36(6), 194:1\u2013194:17 (2017). https:\/\/doi.org\/10.1145\/3130800.3130813","DOI":"10.1145\/3130800.3130813"},{"issue":"6","key":"7_CR20","first-page":"1","volume":"40","author":"L Liu","year":"2021","unstructured":"Liu, L., Habermann, M., Rudnev, V., Sarkar, K., Gu, J., Theobalt, C.: Neural actor: neural free-view synthesis of human actors with pose control. ACM Trans. Graph. 40(6), 1\u201316 (2021)","journal-title":"ACM Trans. Graph."},{"key":"7_CR21","first-page":"22438","volume":"35","author":"A Mallya","year":"2022","unstructured":"Mallya, A., Wang, T.C., Liu, M.Y.: Implicit warping for animation with image sets. Adv. Neural. Inf. Process. Syst. 35, 22438\u201322450 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"7_CR22","doi-asserted-by":"crossref","unstructured":"Martin-Brualla, R., Radwan, N., Sajjadi, M.S., Barron, J.T., Dosovitskiy, A., Duckworth, D.: Nerf in the wild: neural radiance fields for unconstrained photo collections. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7210\u20137219 (2021)","DOI":"10.1109\/CVPR46437.2021.00713"},{"issue":"1","key":"7_CR23","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1145\/3503250","volume":"65","author":"B Mildenhall","year":"2021","unstructured":"Mildenhall, B., Srinivasan, P.P., Tancik, M., Barron, J.T., Ramamoorthi, R., Ng, R.: Nerf: representing scenes as neural radiance fields for view synthesis. Commun. ACM 65(1), 99\u2013106 (2021)","journal-title":"Commun. ACM"},{"issue":"4","key":"7_CR24","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3528223.3530127","volume":"41","author":"T M\u00fcller","year":"2022","unstructured":"M\u00fcller, T., Evans, A., Schied, C., Keller, A.: Instant neural graphics primitives with a multiresolution hash encoding. ACM Trans. Graph. 41(4), 1\u201315 (2022)","journal-title":"ACM Trans. Graph."},{"key":"7_CR25","doi-asserted-by":"crossref","unstructured":"Nirkin, Y., Keller, Y., Hassner, T.: Fsgan: subject agnostic face swapping and reenactment. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7184\u20137193 (2019)","DOI":"10.1109\/ICCV.2019.00728"},{"key":"7_CR26","doi-asserted-by":"crossref","unstructured":"Park, K., et al.: Hypernerf: a higher-dimensional representation for topologically varying neural radiance fields. arXiv preprint arXiv:2106.13228 (2021)","DOI":"10.1145\/3478513.3480487"},{"key":"7_CR27","doi-asserted-by":"crossref","unstructured":"Peng, S., et al.: Animatable neural radiance fields for modeling dynamic human bodies. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 14314\u201314323 (2021)","DOI":"10.1109\/ICCV48922.2021.01405"},{"key":"7_CR28","doi-asserted-by":"crossref","unstructured":"Pumarola, A., Corona, E., Pons-Moll, G., Moreno-Noguer, F.: D-nerf: neural radiance fields for dynamic scenes. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10318\u201310327 (2021)","DOI":"10.1109\/CVPR46437.2021.01018"},{"key":"7_CR29","unstructured":"Siarohin, A., Lathuili\u00e8re, S., Tulyakov, S., Ricci, E., Sebe, N.: First order motion model for image animation. Adv. Neural Inf. Process. Syst. 32 (2019)"},{"key":"7_CR30","doi-asserted-by":"crossref","unstructured":"Tancik, M., et al.: Block-nerf: scalable large scene neural view synthesis. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8248\u20138258 (2022)","DOI":"10.1109\/CVPR52688.2022.00807"},{"key":"7_CR31","doi-asserted-by":"crossref","unstructured":"Tewari, A., et\u00a0al.: State of the art on neural rendering. In: Computer Graphics Forum, vol.\u00a039, pp. 701\u2013727. Wiley Online Library (2020)","DOI":"10.1111\/cgf.14022"},{"key":"7_CR32","doi-asserted-by":"crossref","unstructured":"Tewari, A., et\u00a0al.: Advances in neural rendering. In: Computer Graphics Forum, vol.\u00a041, pp. 703\u2013735. Wiley Online Library (2022)","DOI":"10.1111\/cgf.14507"},{"issue":"4","key":"7_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3306346.3323035","volume":"38","author":"J Thies","year":"2019","unstructured":"Thies, J., Zollh\u00f6fer, M., Nie\u00dfner, M.: Deferred neural rendering: image synthesis using neural textures. ACM Trans. Graph. 38(4), 1\u201312 (2019)","journal-title":"ACM Trans. Graph."},{"key":"7_CR34","doi-asserted-by":"crossref","unstructured":"Thies, J., Zollhofer, M., Stamminger, M., Theobalt, C., Nie\u00dfner, M.: Face2face: real-time face capture and reenactment of RGB videos. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2387\u20132395 (2016)","DOI":"10.1109\/CVPR.2016.262"},{"key":"7_CR35","doi-asserted-by":"crossref","unstructured":"Wang, T.C., Liu, M.Y., Zhu, J.Y., Tao, A., Kautz, J., Catanzaro, B.: High-resolution image synthesis and semantic manipulation with conditional GANs. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8798\u20138807 (2018)","DOI":"10.1109\/CVPR.2018.00917"},{"key":"7_CR36","doi-asserted-by":"crossref","unstructured":"Wang, Z., Bovik, A.C., Sheikh, H.R., Simoncelli, E.P.: Image quality assessment: from error visibility to structural similarity. In: TIP (2004)","DOI":"10.1109\/TIP.2003.819861"},{"key":"7_CR37","doi-asserted-by":"crossref","unstructured":"Weng, C.Y., Srinivasan, P.P., Curless, B., Kemelmacher-Shlizerman, I.: Personnerf: personalized reconstruction from photo collections. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 524\u2013533 (2023)","DOI":"10.1109\/CVPR52729.2023.00058"},{"key":"7_CR38","doi-asserted-by":"publisher","unstructured":"Yang, B., et al.: NeuMesh: learning disentangled neural mesh-based implicit field for\u00a0geometry and\u00a0texture editing. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022, Part XVI, pp. 597\u2013614. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19787-1_34","DOI":"10.1007\/978-3-031-19787-1_34"},{"key":"7_CR39","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"524","DOI":"10.1007\/978-3-030-58610-2_31","volume-title":"Computer Vision \u2013 ECCV 2020","author":"E Zakharov","year":"2020","unstructured":"Zakharov, E., Ivakhnenko, A., Shysheya, A., Lempitsky, V.: Fast bi-layer neural synthesis of one-shot realistic head avatars. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12357, pp. 524\u2013540. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58610-2_31"},{"key":"7_CR40","doi-asserted-by":"crossref","unstructured":"Zhang, B., et al.: Metaportrait: identity-preserving talking head generation with fast personalized adaptation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 22096\u201322105 (2023)","DOI":"10.1109\/CVPR52729.2023.02116"},{"key":"7_CR41","doi-asserted-by":"crossref","unstructured":"Zhang, R., Isola, P., Efros, A.A., Shechtman, E., Wang, O.: The unreasonable effectiveness of deep features as a perceptual metric. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00068"},{"key":"7_CR42","doi-asserted-by":"crossref","unstructured":"Zheng, Y., Abrevaya, V.F., B\u00fchler, M.C., Chen, X., Black, M.J., Hilliges, O.: Im avatar: implicit morphable head avatars from videos. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13545\u201313555 (2022)","DOI":"10.1109\/CVPR52688.2022.01318"},{"key":"7_CR43","doi-asserted-by":"crossref","unstructured":"Zielonka, W., Bolkart, T., Thies, J.: Towards metrical reconstruction of human faces. In: European Conference on Computer Vision, pp. 250\u2013269. Springer (2022)","DOI":"10.1007\/978-3-031-19778-9_15"},{"key":"7_CR44","doi-asserted-by":"crossref","unstructured":"Zielonka, W., Bolkart, T., Thies, J.: Instant volumetric head avatars. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4574\u20134584 (2023)","DOI":"10.1109\/CVPR52729.2023.00444"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72940-9_7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,16]],"date-time":"2024-11-16T21:32:17Z","timestamp":1731792737000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72940-9_7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,17]]},"ISBN":["9783031729393","9783031729409"],"references-count":44,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72940-9_7","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,11,17]]},"assertion":[{"value":"17 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}