{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,17]],"date-time":"2026-03-17T22:42:51Z","timestamp":1773787371001,"version":"3.50.1"},"publisher-location":"Cham","reference-count":86,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031200854","type":"print"},{"value":"9783031200861","type":"electronic"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-20086-1_8","type":"book-chapter","created":{"date-parts":[[2022,11,10]],"date-time":"2022-11-10T10:31:55Z","timestamp":1668076315000},"page":"125-145","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":47,"title":["CHORE: Contact, Human and\u00a0Object Reconstruction from\u00a0a\u00a0Single RGB Image"],"prefix":"10.1007","author":[{"given":"Xianghui","family":"Xie","sequence":"first","affiliation":[]},{"given":"Bharat Lal","family":"Bhatnagar","sequence":"additional","affiliation":[]},{"given":"Gerard","family":"Pons-Moll","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,11,11]]},"reference":[{"key":"8_CR1","unstructured":"https:\/\/www.mturk.com"},{"key":"8_CR2","unstructured":"http:\/\/virtualhumans.mpi-inf.mpg.de\/people.html"},{"key":"8_CR3","doi-asserted-by":"crossref","unstructured":"Alldieck, T., Magnor, M., Bhatnagar, B.L., Theobalt, C., Pons-Moll, G.: Learning to reconstruct people in clothing from a single RGB camera. 
In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 1175\u20131186 (2019)","DOI":"10.1109\/CVPR.2019.00127"},{"key":"8_CR4","doi-asserted-by":"crossref","unstructured":"Alldieck, T., Magnor, M., Xu, W., Theobalt, C., Pons-Moll, G.: Detailed human avatars from monocular video. In: International Conference on 3D Vision, pp. 98\u2013109, September 2018","DOI":"10.1109\/3DV.2018.00022"},{"key":"8_CR5","doi-asserted-by":"crossref","unstructured":"Alldieck, T., Magnor, M., Xu, W., Theobalt, C., Pons-Moll, G.: Video based reconstruction of 3D people models. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 8387\u20138397 (2018)","DOI":"10.1109\/CVPR.2018.00875"},{"key":"8_CR6","doi-asserted-by":"crossref","unstructured":"Alldieck, T., Pons-Moll, G., Theobalt, C., Magnor, M.: Tex2shape: detailed full human body geometry from a single image. In: IEEE International Conference on Computer Vision (ICCV), pp. 2293\u20132303. IEEE, October 2019","DOI":"10.1109\/ICCV.2019.00238"},{"key":"8_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"311","DOI":"10.1007\/978-3-030-58536-5_19","volume-title":"Computer Vision \u2013 ECCV 2020","author":"BL Bhatnagar","year":"2020","unstructured":"Bhatnagar, B.L., Sminchisescu, C., Theobalt, C., Pons-Moll, G.: Combining implicit function learning and parametric models for 3D human reconstruction. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12347, pp. 311\u2013329. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58536-5_19"},{"key":"8_CR8","unstructured":"Bhatnagar, B.L., Sminchisescu, C., Theobalt, C., Pons-Moll, G.: Loopreg: self-supervised learning of implicit surface correspondences, pose and shape for 3D human mesh registration. 
In: Advances in Neural Information Processing Systems (NeurIPS), December 2020"},{"key":"8_CR9","doi-asserted-by":"crossref","unstructured":"Bhatnagar, B.L., Tiwari, G., Theobalt, C., Pons-Moll, G.: Multi-garment net: learning to dress 3D people from images. In: IEEE International Conference on Computer Vision (ICCV), pp. 5420\u20135430. IEEE, October 2019","DOI":"10.1109\/ICCV.2019.00552"},{"key":"8_CR10","doi-asserted-by":"crossref","unstructured":"Bhatnagar, B.L., Xie, X., Petrov, I., Sminchisescu, C., Theobalt, C., Pons-Moll, G.: Behave: dataset and method for tracking human object interactions. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 15935\u201315946, June 2022","DOI":"10.1109\/CVPR52688.2022.01547"},{"key":"8_CR11","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"561","DOI":"10.1007\/978-3-319-46454-1_34","volume-title":"Computer Vision \u2013 ECCV 2016","author":"F Bogo","year":"2016","unstructured":"Bogo, F., Kanazawa, A., Lassner, C., Gehler, P., Romero, J., Black, M.J.: Keep It SMPL: automatic estimation of 3D human pose and shape from a single image. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9909, pp. 561\u2013578. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46454-1_34"},{"key":"8_CR12","doi-asserted-by":"crossref","unstructured":"Brahmbhatt, S., Ham, C., Kemp, C.C., Hays, J.: ContactDB: analyzing and predicting grasp contact via thermal imaging. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 8709\u20138719 (2019). https:\/\/contactdb.cc.gatech.edu","DOI":"10.1109\/CVPR.2019.00891"},{"key":"8_CR13","doi-asserted-by":"crossref","unstructured":"Brahmbhatt, S., Handa, A., Hays, J., Fox, D.: Contactgrasp: functional multi-finger grasp synthesis from contact. In: IROS, pp. 
2386\u20132393 (04 2019)","DOI":"10.1109\/IROS40897.2019.8967960"},{"key":"8_CR14","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"361","DOI":"10.1007\/978-3-030-58601-0_22","volume-title":"Computer Vision \u2013 ECCV 2020","author":"S Brahmbhatt","year":"2020","unstructured":"Brahmbhatt, S., Tang, C., Twigg, C.D., Kemp, C.C., Hays, J.: ContactPose: a dataset of grasps with object contact and hand pose. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12358, pp. 361\u2013378. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58601-0_22"},{"key":"8_CR15","unstructured":"Chang, A.X., et al.: ShapeNet: an information-rich 3D model repository. Tech. Rep. arXiv:1512.03012 [cs.GR], Stanford University \u2013 Princeton University \u2013 Toyota Technological Institute at Chicago (2015)"},{"key":"8_CR16","doi-asserted-by":"crossref","unstructured":"Chen, Y., Huang, S., Yuan, T., Qi, S., Zhu, Y., Zhu, S.C.: Holistic++ scene understanding: single-view 3D holistic scene parsing and human pose estimation with human-object interaction and physical commonsense. In: The IEEE International Conference on Computer Vision (ICCV), pp. 8648\u20138657 (2019)","DOI":"10.1109\/ICCV.2019.00874"},{"key":"8_CR17","unstructured":"Chibane, J., Mir, A., Pons-Moll, G.: Neural unsigned distance fields for implicit function learning. In: Neural Information Processing Systems (NeurIPS), December 2020"},{"key":"8_CR18","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"628","DOI":"10.1007\/978-3-319-46484-8_38","volume-title":"Computer Vision \u2013 ECCV 2016","author":"CB Choy","year":"2016","unstructured":"Choy, C.B., Xu, D., Gwak, J.Y., Chen, K., Savarese, S.: 3D-R2N2: a unified approach for single and multi-view 3D object reconstruction. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9912, pp. 628\u2013644. Springer, Cham (2016). 
https:\/\/doi.org\/10.1007\/978-3-319-46484-8_38"},{"key":"8_CR19","doi-asserted-by":"crossref","unstructured":"Corona, E., Pons-Moll, G., Alenya, G., Moreno-Noguer, F.: Learned vertex descent: a new direction for 3D human model fitting. In: European Conference on Computer Vision (ECCV). Springer (October 2022)","DOI":"10.1007\/978-3-031-20086-1_9"},{"key":"8_CR20","doi-asserted-by":"crossref","unstructured":"Corona, E., Pumarola, A., Alenya, G., Moreno-Noguer, F., Rogez, G.: Ganhand: predicting human grasp affordances in multi-object scenes. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5031\u20135041, June 2020","DOI":"10.1109\/CVPR42600.2020.00508"},{"key":"8_CR21","doi-asserted-by":"crossref","unstructured":"Ehsani, K., Tulsiani, S., Gupta, S., Farhadi, A., Gupta, A.: Use the force, luke! learning to predict physical forces by simulating effects. In: CVPR, pp. 224\u2013233 (2020)","DOI":"10.1109\/CVPR42600.2020.00030"},{"key":"8_CR22","doi-asserted-by":"crossref","unstructured":"Fan, H., Su, H., Guibas, L.J.: A point set generation network for 3D object reconstruction from a single image. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 605\u2013613, July 2017","DOI":"10.1109\/CVPR.2017.264"},{"key":"8_CR23","unstructured":"Fieraru, M., Zanfir, M., Oneata, E., Popa, A., Olaru, V., Sminchisescu, C.: Learning complex 3D human self-contact. CoRR abs\/2012.10366 (2020). https:\/\/arxiv.org\/abs\/2012.10366"},{"key":"8_CR24","doi-asserted-by":"crossref","unstructured":"Fieraru, M., Zanfir, M., Oneata, E., Popa, A.I., Olaru, V., Sminchisescu, C.: Three-dimensional reconstruction of human interactions. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 
7214\u20137223, June 2020","DOI":"10.1109\/CVPR42600.2020.00724"},{"issue":"1","key":"8_CR25","doi-asserted-by":"publisher","first-page":"463","DOI":"10.1007\/s11042-020-09722-8","volume":"80","author":"K Fu","year":"2020","unstructured":"Fu, K., Peng, J., He, Q., Zhang, H.: Single image 3D object reconstruction based on deep learning: a review. Multimedia Tools Appl. 80(1), 463\u2013498 (2020). https:\/\/doi.org\/10.1007\/s11042-020-09722-8","journal-title":"Multimedia Tools Appl."},{"key":"8_CR26","doi-asserted-by":"crossref","unstructured":"Guler, R.A., Kokkinos, I.: Holopose: holistic 3D human reconstruction in-the-wild. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10884\u201310894, June 2019","DOI":"10.1109\/CVPR.2019.01114"},{"key":"8_CR27","doi-asserted-by":"crossref","unstructured":"Guo, C., Chen, X., Song, J., Hilliges, O.: Human performance capture from monocular video in the wild. In: 2021 International Conference on 3D Vision (3DV), pp. 889\u2013898. IEEE (2021)","DOI":"10.1109\/3DV53792.2021.00097"},{"key":"8_CR28","doi-asserted-by":"crossref","unstructured":"Habermann, M., Xu, W., Zollhoefer, M., Pons-Moll, G., Theobalt, C.: Deepcap: monocular human performance capture using weak supervision. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5052\u20135063. IEEE, June 2020","DOI":"10.1109\/CVPR42600.2020.00510"},{"key":"8_CR29","doi-asserted-by":"publisher","unstructured":"Habermann, M., Xu, W., Zollh\u00f6fer, M., Pons-Moll, G., Theobalt, C.: Livecap: real-time human performance capture from monocular video. ACM Trans. Graph. 38(2), 14:1\u201314:17, March 2019. https:\/\/doi.org\/10.1145\/3311970","DOI":"10.1145\/3311970"},{"key":"8_CR30","doi-asserted-by":"crossref","unstructured":"Hassan, M., Choutas, V., Tzionas, D., Black, M.J.: Resolving 3D human pose ambiguities with 3D scene constraints. In: International Conference on Computer Vision, pp. 
2282\u20132292 (2019)","DOI":"10.1109\/ICCV.2019.00237"},{"key":"8_CR31","doi-asserted-by":"crossref","unstructured":"Hassan, M., Ghosh, P., Tesch, J., Tzionas, D., Black, M.J.: Populating 3D scenes by learning human-scene interaction. In: Proceedings IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 14708\u201314718, June 2021","DOI":"10.1109\/CVPR46437.2021.01447"},{"key":"8_CR32","doi-asserted-by":"crossref","unstructured":"Hasson, Y., et al.: Learning joint reconstruction of hands and manipulated objects. In: CVPR, pp. 11807\u201311816 (2019)","DOI":"10.1109\/CVPR.2019.01208"},{"key":"8_CR33","doi-asserted-by":"crossref","unstructured":"Huang, C.H.P., et al.: Capturing and inferring dense full-body human-scene contact. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 13274\u201313285, June 2022","DOI":"10.1109\/CVPR52688.2022.01292"},{"key":"8_CR34","doi-asserted-by":"crossref","unstructured":"Huang, Z., Xu, Y., Lassner, C., Li, H., Tung, T.: Arch: animatable reconstruction of clothed humans. ArXiv abs\/2004.04572 (2020)","DOI":"10.1109\/CVPR42600.2020.00316"},{"key":"8_CR35","doi-asserted-by":"publisher","unstructured":"H\u00e4ne, C., Tulsiani, S., Malik, J.: Hierarchical surface prediction for 3D object reconstruction. In: 2017 International Conference on 3D Vision (3DV), pp. 412\u2013420 (2017). https:\/\/doi.org\/10.1109\/3DV.2017.00054","DOI":"10.1109\/3DV.2017.00054"},{"key":"8_CR36","doi-asserted-by":"publisher","unstructured":"Jiang, B., Zhang, J., Hong, Y., Luo, J., Liu, L., Bao, H.: Bcnet: learning body and cloth shape from a single image. In: European Conference on Computer Vision, pp. 18\u201335. Springer (2020). https:\/\/doi.org\/10.1007\/978-3-030-58565-5_2","DOI":"10.1007\/978-3-030-58565-5_2"},{"key":"8_CR37","doi-asserted-by":"crossref","unstructured":"Jiang, J., et al.: Avatarposer: articulated full-body pose tracking from sparse motion sensing. 
In: European Conference on Computer Vision (2022)","DOI":"10.1007\/978-3-031-20065-6_26"},{"key":"8_CR38","doi-asserted-by":"crossref","unstructured":"Jiang, W., Kolotouros, N., Pavlakos, G., Zhou, X., Daniilidis, K.: Coherent reconstruction of multiple humans from a single image. In: CVPR, pp. 5579\u20135588 (2020)","DOI":"10.1109\/CVPR42600.2020.00562"},{"key":"8_CR39","doi-asserted-by":"crossref","unstructured":"Jiang, Y., et al.: Neuralfusion: neural volumetric rendering under human-object interactions. arXiv preprint arXiv:2202.12825 (2022)","DOI":"10.1109\/CVPR52688.2022.00606"},{"key":"8_CR40","doi-asserted-by":"crossref","unstructured":"Kanazawa, A., Black, M.J., Jacobs, D.W., Malik, J.: End-to-end recovery of human shape and pose. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 7122\u20137131. IEEE Computer Society (2018)","DOI":"10.1109\/CVPR.2018.00744"},{"key":"8_CR41","doi-asserted-by":"crossref","unstructured":"Kar, A., Tulsiani, S., Malik, J.: Category-specific object reconstruction from a single image. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 1966\u20131974 (2015)","DOI":"10.1109\/CVPR.2015.7298807"},{"key":"8_CR42","doi-asserted-by":"publisher","unstructured":"Karunratanakul, K., Yang, J., Zhang, Y., Black, M., Muandet, K., Tang, S.: Grasping field: learning implicit representations for human grasps. In: 8th International Conference on 3D Vision, pp. 333\u2013344. IEEE, November 2020. https:\/\/doi.org\/10.1109\/3DV50981.2020.00043","DOI":"10.1109\/3DV50981.2020.00043"},{"key":"8_CR43","doi-asserted-by":"publisher","unstructured":"Kocabas, M., Athanasiou, N., Black, M.J.: Vibe: video inference for human body pose and shape estimation. In: Proceedings IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5252\u20135262. IEEE, June 2020. 
https:\/\/doi.org\/10.1109\/CVPR42600.2020.00530","DOI":"10.1109\/CVPR42600.2020.00530"},{"key":"8_CR44","doi-asserted-by":"crossref","unstructured":"Kolotouros, N., Pavlakos, G., Black, M.J., Daniilidis, K.: Learning to reconstruct 3D human pose and shape via model-fitting in the loop. In: ICCV, pp. 2252\u20132261 (2019)","DOI":"10.1109\/ICCV.2019.00234"},{"key":"8_CR45","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1007\/978-3-030-58523-5_8","volume-title":"Computer Vision \u2013 ECCV 2020","author":"J Lei","year":"2020","unstructured":"Lei, J., Sridhar, S., Guerrero, P., Sung, M., Mitra, N., Guibas, L.J.: Pix2Surf: learning parametric 3D surface models of objects from images. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12363, pp. 121\u2013138. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58523-5_8"},{"key":"8_CR46","doi-asserted-by":"crossref","unstructured":"Li, Z., Sedlar, J., Carpentier, J., Laptev, I., Mansard, N., Sivic, J.: Estimating 3D motion and forces of person-object interactions from monocular video. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 8640\u20138649, June 2019","DOI":"10.1109\/CVPR.2019.00884"},{"key":"8_CR47","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"740","DOI":"10.1007\/978-3-319-10602-1_48","volume-title":"Computer Vision \u2013 ECCV 2014","author":"T-Y Lin","year":"2014","unstructured":"Lin, T.-Y.: Microsoft COCO: common objects in context. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8693, pp. 740\u2013755. Springer, Cham (2014). 
https:\/\/doi.org\/10.1007\/978-3-319-10602-1_48"},{"issue":"10","key":"8_CR48","doi-asserted-by":"publisher","first-page":"2684","DOI":"10.1109\/TPAMI.2019.2916873","volume":"42","author":"J Liu","year":"2019","unstructured":"Liu, J., Shahroudy, A., Perez, M., Wang, G., Duan, L.Y., Kot, A.C.: Ntu rgb+d 120: a large-scale benchmark for 3D human activity understanding. IEEE Trans. Pattern Anal. Mach. Intell. 42(10), 2684\u20132701 (2019). https:\/\/doi.org\/10.1109\/TPAMI.2019.2916873","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"8_CR49","doi-asserted-by":"crossref","unstructured":"Loper, M., Mahmood, N., Romero, J., Pons-Moll, G., Black, M.J.: SMPL: A skinned multi-person linear model. In: ACM Trans. Graph. 34(6), 1\u201316. ACM (2015)","DOI":"10.1145\/2816795.2818013"},{"key":"8_CR50","doi-asserted-by":"crossref","unstructured":"Mescheder, L., Oechsle, M., Niemeyer, M., Nowozin, S., Geiger, A.: Occupancy networks: learning 3D reconstruction in function space. In: Proceedings IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4460\u20134470 (2019)","DOI":"10.1109\/CVPR.2019.00459"},{"key":"8_CR51","doi-asserted-by":"crossref","unstructured":"Monszpart, A., Guerrero, P., Ceylan, D., Yumer, E., Mitra, N.J.: iMapper: interaction-guided scene mapping from monocular videos. In: ACM SIGGRAPH (2019)","DOI":"10.1145\/3306346.3322961"},{"key":"8_CR52","doi-asserted-by":"crossref","unstructured":"M\u00fcller, L., Osman, A.A.A., Tang, S., Huang, C.H.P., Black, M.J.: On self-contact and human pose. In: Proceedings IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 9990\u20139999 (2021)","DOI":"10.1109\/CVPR46437.2021.00986"},{"key":"8_CR53","doi-asserted-by":"crossref","unstructured":"M\u00fcller, N., Wong, Y.S., Mitra, N.J., Dai, A., Niessner, M.: Seeing behind objects for 3D multi-object tracking in RGB-D sequences. In: Proceedings of the Computer Vision and Pattern Recognition (CVPR), pp. 6071\u20136080. 
IEEE (2021)","DOI":"10.1109\/CVPR46437.2021.00601"},{"key":"8_CR54","doi-asserted-by":"crossref","unstructured":"Omran, M., Lassner, C., Pons-Moll, G., Gehler, P., Schiele, B.: Neural body fitting: unifying deep learning and model based human pose and shape estimation. In: International Conference on 3D Vision, pp. 484\u2013494 (2018)","DOI":"10.1109\/3DV.2018.00062"},{"key":"8_CR55","doi-asserted-by":"crossref","unstructured":"Pavlakos, G., et al.: Expressive body capture: 3D hands, face, and body from a single image. In: Proceedings IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10975\u201310985 (2019)","DOI":"10.1109\/CVPR.2019.01123"},{"key":"8_CR56","doi-asserted-by":"crossref","unstructured":"Pavlakos, G., Zhu, L., Zhou, X., Daniilidis, K.: Learning to estimate 3D human pose and shape from a single color image. In: IEEE Conference on Computer Vision and Pattern Recognition, pp. 459\u2013468 (2018)","DOI":"10.1109\/CVPR.2018.00055"},{"key":"8_CR57","doi-asserted-by":"publisher","unstructured":"Pons-Moll, G., Rosenhahn, B.: Model-based pose estimation, chap. 9, pp. 139\u2013170. Springer (2011). https:\/\/doi.org\/10.1007\/978-0-85729-997-0_9","DOI":"10.1007\/978-0-85729-997-0_9"},{"key":"8_CR58","doi-asserted-by":"crossref","unstructured":"Pontes, J.K., Kong, C., Sridharan, S., Lucey, S., Eriksson, A., Fookes, C.: Image2mesh: a learning framework for single image 3D reconstruction. In: ACCV, pp. 365\u2013381. Springer International Publishing (2019)","DOI":"10.1007\/978-3-030-20887-5_23"},{"key":"8_CR59","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1007\/978-3-030-58558-7_5","volume-title":"Computer Vision \u2013 ECCV 2020","author":"D Rempe","year":"2020","unstructured":"Rempe, D., Guibas, L.J., Hertzmann, A., Russell, B., Villegas, R., Yang, J.: Contact and human dynamics from monocular video. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. 
LNCS, vol. 12350, pp. 71\u201387. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58558-7_5"},{"key":"8_CR60","doi-asserted-by":"crossref","unstructured":"Romero, J., Tzionas, D., Black, M.J.: Embodied hands: Modeling and capturing hands and bodies together. ACM Trans. Graphics, (Proc. SIGGRAPH Asia) 36(6) (2017)","DOI":"10.1145\/3130800.3130883"},{"key":"8_CR61","doi-asserted-by":"crossref","unstructured":"Rong, Y., Shiratori, T., Joo, H.: Frankmocap: a monocular 3D whole-body pose estimation system via regression and integration. In: IEEE International Conference on Computer Vision Workshops (2021)","DOI":"10.1109\/ICCVW54120.2021.00201"},{"key":"8_CR62","doi-asserted-by":"crossref","unstructured":"Saito, S., Huang, Z., Natsume, R., Morishima, S., Kanazawa, A., Li, H.: Pifu: pixel-aligned implicit function for high-resolution clothed human digitization. In: IEEE International Conference on Computer Vision (ICCV). IEEE (2019)","DOI":"10.1109\/ICCV.2019.00239"},{"key":"8_CR63","doi-asserted-by":"crossref","unstructured":"Saito, S., Simon, T., Saragih, J., Joo, H.: Pifuhd: multi-level pixel-aligned implicit function for high-resolution 3D human digitization. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (2020)","DOI":"10.1109\/CVPR42600.2020.00016"},{"key":"8_CR64","doi-asserted-by":"crossref","unstructured":"Savva, M., Chang, A.X., Hanrahan, P., Fisher, M., Nie\u00dfner, M.: PiGraphs: Learning Interaction Snapshots from Observations. ACM Trans. Graphics (TOG) 35(4) (2016)","DOI":"10.1145\/2897824.2925867"},{"key":"8_CR65","doi-asserted-by":"crossref","unstructured":"Sun, G., et al.: Neural free-viewpoint performance rendering under complex human-object interactions. In: Proceedings of the 29th ACM International Conference on Multimedia (2021)","DOI":"10.1145\/3474085.3475442"},{"key":"8_CR66","doi-asserted-by":"crossref","unstructured":"Sun, X., et al.: Pix3d: dataset and methods for single-image 3D shape modeling. 
In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2018)","DOI":"10.1109\/CVPR.2018.00314"},{"key":"8_CR67","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"581","DOI":"10.1007\/978-3-030-58548-8_34","volume-title":"Computer Vision \u2013 ECCV 2020","author":"O Taheri","year":"2020","unstructured":"Taheri, O., Ghorbani, N., Black, M.J., Tzionas, D.: GRAB: a dataset of whole-body human grasping of objects. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12349, pp. 581\u2013600. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58548-8_34"},{"key":"8_CR68","doi-asserted-by":"crossref","unstructured":"Tiwari, G., Antic, D., Lenssen, J.E., Sarafianos, N., Tung, T., Pons-Moll, G.: Pose-ndf: Modeling human pose manifolds with neural distance fields. In: European Conference on Computer Vision (ECCV). Springer, October 2022","DOI":"10.1007\/978-3-031-20065-6_33"},{"key":"8_CR69","doi-asserted-by":"publisher","unstructured":"Tiwari, G., Bhatnagar, B.L., Tung, T., Pons-Moll, G.: Sizer: A dataset and model for parsing 3d clothing and learning size sensitive 3D clothing. In: European Conference on Computer Vision (ECCV), pp. 1\u201318. Springer (August 2020). https:\/\/doi.org\/10.1007\/978-3-030-58580-8_1","DOI":"10.1007\/978-3-030-58580-8_1"},{"key":"8_CR70","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1007\/978-3-030-01252-6_4","volume-title":"Computer Vision \u2013 ECCV 2018","author":"N Wang","year":"2018","unstructured":"Wang, N., Zhang, Y., Li, Z., Fu, Y., Liu, W., Jiang, Y.-G.: Pixel2Mesh: generating 3D mesh models from single RGB images. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11215, pp. 55\u201371. Springer, Cham (2018). 
https:\/\/doi.org\/10.1007\/978-3-030-01252-6_4"},{"key":"8_CR71","doi-asserted-by":"crossref","unstructured":"Weng, Z., Yeung, S.: Holistic 3D human and scene mesh estimation from single view images. arXiv preprint arXiv:2012.01591 (2020)","DOI":"10.1109\/CVPR46437.2021.00040"},{"key":"8_CR72","unstructured":"Wu, J., Wang, Y., Xue, T., Sun, X., Freeman, W.T., Tenenbaum, J.B.: Marrnet: 3D shape reconstruction via 2.5D sketches. In: Advances In Neural Information Processing Systems (2017)"},{"key":"8_CR73","doi-asserted-by":"crossref","unstructured":"Wu, J., Zhang, C., Zhang, X., Zhang, Z., Freeman, W.T., Tenenbaum, J.B.: Learning 3D shape priors for shape completion and reconstruction. In: European Conference on Computer Vision (ECCV), pp. 646\u2013662 (2018)","DOI":"10.1007\/978-3-030-01252-6_40"},{"key":"8_CR74","doi-asserted-by":"publisher","unstructured":"Xiang, Y., et al.: Objectnet3D: a large scale database for 3D object recognition. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) Computer Vision - ECCV 2016, pp. 160\u2013176. Springer International Publishing (2016). https:\/\/doi.org\/10.1007\/978-3-319-46484-8_10","DOI":"10.1007\/978-3-319-46484-8_10"},{"key":"8_CR75","doi-asserted-by":"crossref","unstructured":"Xiu, Y., Yang, J., Tzionas, D., Black, M.J.: ICON: implicit clothed humans obtained from normals. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 13296\u201313306, Jun 2022","DOI":"10.1109\/CVPR52688.2022.01294"},{"key":"8_CR76","unstructured":"Xu, Q., Wang, W., Ceylan, D., Mech, R., Neumann, U.: Disn: deep implicit surface network for high-quality single-view 3D reconstruction. In: Wallach, H., Larochelle, H., Beygelzimer, A., d\u2019Alch\u00e9-Buc, F., Fox, E., Garnett, R. (eds.) Advances in Neural Information Processing Systems. vol. 32. Curran Associates, Inc. (2019). 
https:\/\/proceedings.neurips.cc\/paper\/2019\/file\/39059724f73a9969845dfe4146c5660e-Paper.pdf"},{"key":"8_CR77","doi-asserted-by":"crossref","unstructured":"Yang, L., Zhan, X., Li, K., Xu, W., Li, J., Lu, C.: CPF: learning a contact potential field to model the hand-object interaction. In: ICCV, pp. 11097\u201311106 (2021)","DOI":"10.1109\/ICCV48922.2021.01091"},{"key":"8_CR78","doi-asserted-by":"crossref","unstructured":"Yi, H., et al.: Human-aware object placement for visual environment reconstruction. In: IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 3959\u20133970, June 2022","DOI":"10.1109\/CVPR52688.2022.00393"},{"key":"8_CR79","doi-asserted-by":"publisher","unstructured":"Zhang, J.Y., Pepose, S., Joo, H., Ramanan, D., Malik, J., Kanazawa, A.: Perceiving 3D human-object spatial arrangements from a single image in the wild. In: European Conference on Computer Vision (ECCV), pp. 34\u201351 (2020). https:\/\/doi.org\/10.1007\/978-3-030-58610-2_3","DOI":"10.1007\/978-3-030-58610-2_3"},{"key":"8_CR80","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.cag.2021.04.035","volume":"98","author":"S Zhang","year":"2021","unstructured":"Zhang, S., Liu, J., Liu, Y., Ling, N.: Dimnet: dense implicit function network for 3D human body reconstruction. Comput. Graph. 98, 1\u201310 (2021). https:\/\/doi.org\/10.1016\/j.cag.2021.04.035","journal-title":"Comput. Graph."},{"key":"8_CR81","doi-asserted-by":"crossref","unstructured":"Zhang, S., Zhang, Y., Ma, Q., Black, M.J., Tang, S.: Place: proximity learning of articulation and contact in 3D environments. In: International Conference on 3D Vision (3DV), pp. 642\u2013651, November 2020","DOI":"10.1109\/3DV50981.2020.00074"},{"key":"8_CR82","doi-asserted-by":"crossref","unstructured":"Zhang, X., Bhatnagar, B.L., Guzov, V., Starke, S., Pons-Moll, G.: Couch: towards controllable human-chair interactions. 
arXiv preprint arXiv:2205.00541 (May 2022)","DOI":"10.1007\/978-3-031-20065-6_30"},{"key":"8_CR83","unstructured":"Zhang, X., Zhang, Z., Zhang, C., Tenenbaum, J.B., Freeman, W.T., Wu, J.: Learning to reconstruct shapes from unseen classes. In: Advances in Neural Information Processing Systems (NeurIPS) (2018)"},{"key":"8_CR84","doi-asserted-by":"crossref","unstructured":"Zhao, F., Wang, W., Liao, S., Shao, L.: Learning anchored unsigned distance functions with gradient direction alignment for single-view garment reconstruction. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 12674\u201312683 (2021)","DOI":"10.1109\/ICCV48922.2021.01244"},{"key":"8_CR85","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"387","DOI":"10.1007\/978-3-030-58452-8_23","volume-title":"Computer Vision \u2013 ECCV 2020","author":"Z Cao","year":"2020","unstructured":"Cao, Z., Gao, H., Mangalam, K., Cai, Q.-Z., Vo, M., Malik, J.: Long-term human motion prediction with scene context. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12346, pp. 387\u2013404. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58452-8_23"},{"key":"8_CR86","doi-asserted-by":"crossref","unstructured":"Zhou, K., Bhatnagar, B.L., Lenssen, J.E., Pons-Moll, G.: Toch: spatio-temporal object correspondence to hand for motion refinement. In: European Conference on Computer Vision (ECCV). 
Springer, October 2022","DOI":"10.1007\/978-3-031-20062-5_1"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2022"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-20086-1_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,3,11]],"date-time":"2023-03-11T18:48:17Z","timestamp":1678560497000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-20086-1_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031200854","9783031200861"],"references-count":86,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-20086-1_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"11 November 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Tel Aviv","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Israel","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 October 2022","order":7,"name":"conference_start_date","label":"Conference Start 
Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 October 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2022.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5804","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1645","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"28% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole 
number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.21","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.91","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}