{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T14:48:52Z","timestamp":1742914132390,"version":"3.40.3"},"publisher-location":"Cham","reference-count":45,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031546044"},{"type":"electronic","value":"9783031546051"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-3-031-54605-1_11","type":"book-chapter","created":{"date-parts":[[2024,3,7]],"date-time":"2024-03-07T11:43:10Z","timestamp":1709811790000},"page":"163-177","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["GenLayNeRF: Generalizable Layered Representations with\u00a03D Model Alignment for\u00a0Human View Synthesis"],"prefix":"10.1007","author":[{"given":"Youssef","family":"Abdelkareem","sequence":"first","affiliation":[]},{"given":"Shady","family":"Shehata","sequence":"additional","affiliation":[]},{"given":"Fakhri","family":"Karray","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,3,8]]},"reference":[{"key":"11_CR1","doi-asserted-by":"crossref","unstructured":"Aliev, K.A., Ulyanov, D., Lempitsky, V.S.: Neural point-based graphics. ArXiv abs\/1906.08240 (2020)","DOI":"10.1007\/978-3-030-58542-6_42"},{"key":"11_CR2","doi-asserted-by":"crossref","unstructured":"Bogo, F., Kanazawa, A., Lassner, C., Gehler, P., Romero, J., Black, M.J.: Keep it SMPL: automatic estimation of 3d human pose and shape from a single image. ArXiv abs\/1607.08128 (2016)","DOI":"10.1007\/978-3-319-46454-1_34"},{"key":"11_CR3","unstructured":"Cheng, W., et al.: Generalizable neural performer: learning robust radiance fields for human novel view synthesis. ArXiv abs\/2204.11798 (2022)"},{"key":"11_CR4","doi-asserted-by":"crossref","unstructured":"Chibane, J., Bansal, A., Lazova, V., Pons-Moll, G.: Stereo radiance fields (SRF): learning view synthesis from sparse views of novel scenes. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR). IEEE (2021)","DOI":"10.1109\/CVPR46437.2021.00782"},{"key":"11_CR5","doi-asserted-by":"crossref","unstructured":"Flynn, J., et al.: DeepView: view synthesis with learned gradient descent. In: 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2362\u20132371 (2019)","DOI":"10.1109\/CVPR.2019.00247"},{"key":"11_CR6","unstructured":"Gao, C., Shih, Y., Lai, W.S., Liang, C.K., Huang, J.B.: Portrait neural radiance fields from a single image. ArXiv abs\/2012.05903 (2020)"},{"key":"11_CR7","doi-asserted-by":"crossref","unstructured":"Graham, B., Engelcke, M., van der Maaten, L.: 3D semantic segmentation with submanifold sparse convolutional networks. In: 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9224\u20139232 (2018)","DOI":"10.1109\/CVPR.2018.00961"},{"key":"11_CR8","doi-asserted-by":"crossref","unstructured":"Guan, P., Weiss, A., Balan, A.O., Black, M.J.: Estimating human shape and pose from a single image. In: 2009 IEEE 12th International Conference on Computer Vision, pp. 1381\u20131388 (2009)","DOI":"10.1109\/ICCV.2009.5459300"},{"key":"11_CR9","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"11_CR10","doi-asserted-by":"crossref","unstructured":"Kocabas, M., Huang, C.H.P., Hilliges, O., Black, M.J.: PARE: part attention regressor for 3D human body estimation. In: 2021 IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 11107\u201311117 (2021)","DOI":"10.1109\/ICCV48922.2021.01094"},{"key":"11_CR11","doi-asserted-by":"crossref","unstructured":"Kundu, J.N., Rakesh, M., Jampani, V., Venkatesh, R.M., Babu, R.V.: Appearance consensus driven self-supervised human mesh recovery. ArXiv abs\/2008.01341 (2020)","DOI":"10.1007\/978-3-030-58452-8_46"},{"key":"11_CR12","unstructured":"Kwon, Y., Kim, D., Ceylan, D., Fuchs, H.: Neural human performer: learning generalizable radiance fields for human performance rendering. In: NeurIPS (2021)"},{"key":"11_CR13","doi-asserted-by":"crossref","unstructured":"Li, J., Feng, Z., She, Q., Ding, H., Wang, C., Lee, G.H.: MINE: towards continuous depth MPI with nerf for novel view synthesis. In: 2021 IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 12558\u201312568 (2021)","DOI":"10.1109\/ICCV48922.2021.01235"},{"key":"11_CR14","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3048039","author":"P Li","year":"2020","unstructured":"Li, P., Xu, Y., Wei, Y., Yang, Y.: Self-correction for human parsing. IEEE Trans. Pattern Anal. Mach. Intell. (2020). https:\/\/doi.org\/10.1109\/TPAMI.2020.3048039","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR15","unstructured":"Li, T., et al.: Neural 3D video synthesis. ArXiv abs\/2103.02597 (2021)"},{"key":"11_CR16","doi-asserted-by":"crossref","unstructured":"Lin, K., Wang, L., Liu, Z.: End-to-end human pose and mesh reconstruction with transformers. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1954\u20131963 (2020)","DOI":"10.1109\/CVPR46437.2021.00199"},{"key":"11_CR17","doi-asserted-by":"crossref","unstructured":"Lin, K., Wang, L., Liu, Z.: Mesh graphormer. In: 2021 IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 12919\u201312928 (2021)","DOI":"10.1109\/ICCV48922.2021.01270"},{"key":"11_CR18","doi-asserted-by":"crossref","unstructured":"Loper, M., Mahmood, N., Romero, J., Pons-Moll, G., Black, M.J.: SMPL: a skinned multi-person linear model. ACM Trans. Graphics (Proc. SIGGRAPH Asia) 34(6), 248:1\u2013248:16 (2015)","DOI":"10.1145\/2816795.2818013"},{"key":"11_CR19","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3414685.3417760","volume":"39","author":"E Lu","year":"2020","unstructured":"Lu, E., Cole, F., Dekel, T., Xie, W., Zisserman, A., Salesin, D., Freeman, W.T., Rubinstein, M.: Layered neural rendering for retiming people in video. ACM Trans. Graphics (TOG) 39, 1\u201314 (2020)","journal-title":"ACM Trans. Graphics (TOG)"},{"key":"11_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1007\/978-3-031-19784-0_11","volume-title":"Computer Vision - ECCV 2022","author":"M Mihajlovi\u0107","year":"2022","unstructured":"Mihajlovi\u0107, M., Bansal, A., Zollhoefer, M., Tang, S., Saito, S.: KeypointNeRF: generalizing image-based volumetric avatars using relative spatial encoding of keypoints. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022. LNCS, vol. 13675, pp. 179\u2013197. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19784-0_11"},{"key":"11_CR21","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1007\/978-3-030-58452-8_24","volume-title":"Computer Vision \u2013 ECCV 2020","author":"B Mildenhall","year":"2020","unstructured":"Mildenhall, B., Srinivasan, P.P., Tancik, M., Barron, J.T., Ramamoorthi, R., Ng, R.: NeRF: representing scenes as neural radiance fields for view synthesis. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12346, pp. 405\u2013421. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_24"},{"key":"11_CR22","doi-asserted-by":"crossref","unstructured":"Noh, H., Hong, S., Han, B.: Learning deconvolution network for semantic segmentation. In: 2015 IEEE International Conference on Computer Vision (ICCV), pp. 1520\u20131528 (2015)","DOI":"10.1109\/ICCV.2015.178"},{"key":"11_CR23","unstructured":"Park, K., et al.: Deformable neural radiance fields (2020). https:\/\/arxiv.org\/abs\/2011.12948"},{"key":"11_CR24","doi-asserted-by":"crossref","unstructured":"Pavlakos, G., et al.: Expressive body capture: 3D hands, face, and body from a single image. In: Proceedings IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10975\u201310985 (2019)","DOI":"10.1109\/CVPR.2019.01123"},{"key":"11_CR25","doi-asserted-by":"crossref","unstructured":"Peng, S., et al.: Neural body: implicit neural representations with structured latent codes for novel view synthesis of dynamic humans. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 9050\u20139059 (2021)","DOI":"10.1109\/CVPR46437.2021.00894"},{"key":"11_CR26","doi-asserted-by":"crossref","unstructured":"Pumarola, A., Corona, E., Pons-Moll, G., Moreno-Noguer, F.: D-NeRF: neural radiance fields for dynamic scenes (2020). https:\/\/arxiv.org\/abs\/2011.13961","DOI":"10.1109\/CVPR46437.2021.01018"},{"key":"11_CR27","doi-asserted-by":"crossref","unstructured":"Saito, S., Huang, Z., Natsume, R., Morishima, S., Kanazawa, A., Li, H.: PIFu: pixel-aligned implicit function for high-resolution clothed human digitization. In: 2019 IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 2304\u20132314 (2019)","DOI":"10.1109\/ICCV.2019.00239"},{"key":"11_CR28","doi-asserted-by":"crossref","unstructured":"Saito, S., Simon, T., Saragih, J.M., Joo, H.: PIFuHD: multi-level pixel-aligned implicit function for high-resolution 3D human digitization. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 81\u201390 (2020)","DOI":"10.1109\/CVPR42600.2020.00016"},{"key":"11_CR29","unstructured":"Shuai, Q., Geng, C., Fang, Q., Peng, S., Shen, W., Zhou, X., Bao, H.: EasyMocap - make human motion capture easier. Github (2021). https:\/\/github.com\/zju3dv\/EasyMocap"},{"key":"11_CR30","doi-asserted-by":"crossref","unstructured":"Shuai, Q., et al.: Novel view synthesis of human interactions from sparse multi-view videos. In: ACM SIGGRAPH (2022)","DOI":"10.1145\/3528233.3530704"},{"key":"11_CR31","unstructured":"Sigal, L., Balan, A.O., Black, M.J.: Combined discriminative and generative articulated pose and non-rigid shape estimation. In: NIPS (2007)"},{"key":"11_CR32","doi-asserted-by":"crossref","unstructured":"Sitzmann, V., Thies, J., Heide, F., Nie\u00dfner, M., Wetzstein, G., Zollh\u00f6fer, M.: DeepVoxels: learning persistent 3D feature embeddings. 2019 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2432\u20132441 (2019)","DOI":"10.1109\/CVPR.2019.00254"},{"key":"11_CR33","doi-asserted-by":"crossref","unstructured":"Thies, J., Zollh\u00f6fer, M., Nie\u00dfner, M.: Deferred neural rendering: image synthesis using neural textures. arXiv Computer Vision and Pattern Recognition (2019)","DOI":"10.1145\/3306346.3323035"},{"key":"11_CR34","doi-asserted-by":"crossref","unstructured":"Trevithick, A., Yang, B.: GRF: learning a general radiance field for 3D scene representation and rendering. ArXiv abs\/2010.04595 (2020)","DOI":"10.1109\/ICCV48922.2021.01490"},{"key":"11_CR35","doi-asserted-by":"crossref","unstructured":"Wang, Q., et al.: IBRNet: learning multi-view image-based rendering. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4688\u20134697 (2021)","DOI":"10.1109\/CVPR46437.2021.00466"},{"key":"11_CR36","doi-asserted-by":"crossref","unstructured":"Wu, M., Wang, Y., Hu, Q., Yu, J.: Multi-view neural human rendering. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1679\u20131688 (2020)","DOI":"10.1109\/CVPR42600.2020.00175"},{"key":"11_CR37","doi-asserted-by":"crossref","unstructured":"Xian, W., Huang, J.B., Kopf, J., Kim, C.: Space-time neural irradiance fields for free-viewpoint video. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 9416\u20139426 (2021)","DOI":"10.1109\/CVPR46437.2021.00930"},{"key":"11_CR38","unstructured":"Yan, X., Yang, J., Yumer, E., Guo, Y., Lee, H.: Perspective transformer nets: learning single-view 3D object reconstruction without 3D supervision. ArXiv abs\/1612.00814 (2016)"},{"key":"11_CR39","doi-asserted-by":"crossref","unstructured":"Yu, A., Ye, V., Tancik, M., Kanazawa, A.: pixelNeRF: neural radiance fields from one or few images. In: 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4576\u20134585 (2021)","DOI":"10.1109\/CVPR46437.2021.00455"},{"key":"11_CR40","doi-asserted-by":"crossref","unstructured":"Zanfir, A., Bazavan, E.G., Xu, H., Freeman, B., Sukthankar, R., Sminchisescu, C.: Weakly supervised 3D human pose and shape reconstruction with normalizing flows. ArXiv abs\/2003.10350 (2020)","DOI":"10.1007\/978-3-030-58539-6_28"},{"key":"11_CR41","doi-asserted-by":"crossref","unstructured":"Zhang, H., et al.: PyMAF: 3D human pose and shape regression with pyramidal mesh alignment feedback loop. In: 2021 IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 11426\u201311436 (2021)","DOI":"10.1109\/ICCV48922.2021.01125"},{"key":"11_CR42","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3478513.3480500","volume":"40","author":"J Zhang","year":"2021","unstructured":"Zhang, J., et al.: Editable free-viewpoint video using a layered neural representation. ACM Trans. Graphics 40, 1\u201318 (2021)","journal-title":"ACM Trans. Graphics"},{"key":"11_CR43","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Li, Z., An, L., Li, M., Yu, T., Liu, Y.: Lightweight multi-person total motion capture using sparse multi-view cameras. In: 2021 IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 5540\u20135549 (2021)","DOI":"10.1109\/ICCV48922.2021.00551"},{"key":"11_CR44","doi-asserted-by":"crossref","unstructured":"Zhao, F., et al.: HumanNeRF: generalizable neural human radiance field from sparse inputs. ArXiv abs\/2112.02789 (2021)","DOI":"10.1109\/CVPR52688.2022.00759"},{"key":"11_CR45","doi-asserted-by":"crossref","unstructured":"Zheng, Y., et al.: DeepMultiCap: performance capture of multiple characters using sparse multiview cameras. In: International Conference on Computer Vision (ICCV), pp. 6219\u20136229 (2021)","DOI":"10.1109\/ICCV48922.2021.00618"}],"container-title":["Lecture Notes in Computer Science","Pattern Recognition"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-54605-1_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,13]],"date-time":"2024-11-13T23:22:46Z","timestamp":1731540166000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-54605-1_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9783031546044","9783031546051"],"references-count":45,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-54605-1_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"8 March 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"DAGM GCPR","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"DAGM German Conference on Pattern Recognition","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Heidelberg","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19 September 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 September 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"45","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"dagm2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/www.dagm-gcpr.de\/year\/2023","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"76","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"40","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"53% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}