{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,8]],"date-time":"2026-02-08T01:37:39Z","timestamp":1770514659941,"version":"3.49.0"},"publisher-location":"Cham","reference-count":62,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031729720","type":"print"},{"value":"9783031729737","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,1]],"date-time":"2024-11-01T00:00:00Z","timestamp":1730419200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-72973-7_1","type":"book-chapter","created":{"date-parts":[[2024,10,31]],"date-time":"2024-10-31T14:03:04Z","timestamp":1730383384000},"page":"1-19","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Revisit Human-Scene Interaction via\u00a0Space Occupancy"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7525-3243","authenticated-orcid":false,"given":"Xinpeng","family":"Liu","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0002-6944-0939","authenticated-orcid":false,"given":"Haowen","family":"Hou","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2447-7917","authenticated-orcid":false,"given":"Yanchao","family":"Yang","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0478-0692","authenticated-orcid":false,"given":"Yong-Lu","family":"Li","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1533-8576","authenticated-orcid":false,"given":"Cewu","family":"Lu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,1]]},"reference":[{"key":"1_CR1","doi-asserted-by":"crossref","unstructured":"Ara\u00fajo, J.P., et al.: Circle: capture in rich contextual environments. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 21211\u201321221 (2023)","DOI":"10.1109\/CVPR52729.2023.02032"},{"key":"1_CR2","doi-asserted-by":"crossref","unstructured":"Athanasiou, N., Petrovich, M., Black, M.J., Varol, G.: Teach: temporal action composition for 3d humans. In: 2022 International Conference on 3D Vision (3DV), pp. 414\u2013423. IEEE (2022)","DOI":"10.1109\/3DV57658.2022.00053"},{"key":"1_CR3","unstructured":"Bengio, S., Vinyals, O., Jaitly, N., Shazeer, N.: Scheduled sampling for sequence prediction with recurrent neural networks. Adv. Neural Inform. Process. Syst. 28 (2015)"},{"key":"1_CR4","doi-asserted-by":"publisher","first-page":"557","DOI":"10.1007\/978-3-031-20071-7_","volume-title":"Computer Vision - ECCV 2022","author":"Z Cai","year":"2022","unstructured":"Cai, Z., et al.: Humman: multi-modal 4d human dataset for versatile sensing and modeling. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) Computer Vision - ECCV 2022, pp. 557\u2013577. Springer Nature Switzerland, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-20071-7_"},{"key":"1_CR5","doi-asserted-by":"crossref","unstructured":"Chen, L., Ng, R.: On the marriage of lp-norms and edit distance. In: Proceedings of the Thirtieth International Conference on Very Large Data Bases, vol. 30, pp. 792\u2013803 (2004)","DOI":"10.1016\/B978-012088469-8.50070-X"},{"key":"1_CR6","doi-asserted-by":"crossref","unstructured":"Chen, X., Jiang, B., Liu, W., Huang, Z., Fu, B., Chen, T., Yu, G.: Executing your commands via motion diffusion in latent space. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18000\u201318010 (2023)","DOI":"10.1109\/CVPR52729.2023.01726"},{"key":"1_CR7","doi-asserted-by":"crossref","unstructured":"Guo, C., et al.: Generating diverse and natural 3d human motions from text. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5152\u20135161 (June 2022)","DOI":"10.1109\/CVPR52688.2022.00509"},{"key":"1_CR8","doi-asserted-by":"crossref","unstructured":"Guo, C., et al.: Action2motion: conditioned generation of 3d human motions. In: Proceedings of the 28th ACM International Conference on Multimedia, pp. 2021\u20132029 (2020)","DOI":"10.1145\/3394171.3413635"},{"key":"1_CR9","doi-asserted-by":"crossref","unstructured":"Guo, W., Du, Y., Shen, X., Lepetit, V., Alameda-Pineda, X., Moreno-Noguer, F.: Back to mlp: a simple baseline for human motion prediction. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 4809\u20134819 (2023)","DOI":"10.1109\/WACV56688.2023.00479"},{"issue":"4","key":"1_CR10","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1145\/3386569.3392480","volume":"39","author":"FG Harvey","year":"2020","unstructured":"Harvey, F.G., Yurick, M., Nowrouzezahrai, D., Pal, C.: Robust motion in-betweening. ACM Trans. Graph. (TOG) 39(4), 60\u20131 (2020)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"1_CR11","doi-asserted-by":"crossref","unstructured":"Hassan, M., et al.: Stochastic scene-aware motion prediction. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 11374\u201311384 (2021)","DOI":"10.1109\/ICCV48922.2021.01118"},{"key":"1_CR12","doi-asserted-by":"crossref","unstructured":"Hassan, M., Choutas, V., Tzionas, D., Black, M.J.: Resolving 3D human pose ambiguities with 3D scene constraints. In: International Conference on Computer Vision, pp. 2282\u20132292 (Oct 2019). https:\/\/prox.is.tue.mpg.de","DOI":"10.1109\/ICCV.2019.00237"},{"key":"1_CR13","doi-asserted-by":"crossref","unstructured":"Hassan, M., Ghosh, P., Tesch, J., Tzionas, D., Black, M.J.: Populating 3d scenes by learning human-scene interaction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14708\u201314718 (2021)","DOI":"10.1109\/CVPR46437.2021.01447"},{"key":"1_CR14","doi-asserted-by":"publisher","unstructured":"Hassan, M., Guo, Y., Wang, T., Black, M., Fidler, S., Peng, X.B.: Synthesizing physical character-scene interactions. In: ACM SIGGRAPH 2023 Conference Proceedings, SIGGRAPH 2023. Association for Computing Machinery, New York (2023). https:\/\/doi.org\/10.1145\/3588432.3591525","DOI":"10.1145\/3588432.3591525"},{"key":"1_CR15","doi-asserted-by":"crossref","unstructured":"Hernandez, A., Gall, J., Moreno-Noguer, F.: Human motion prediction via spatio-temporal inpainting. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 7134\u20137143 (2019)","DOI":"10.1109\/ICCV.2019.00723"},{"key":"1_CR16","doi-asserted-by":"crossref","unstructured":"Huang, S., et al.: Diffusion-based generation, optimization, and planning in 3d scenes. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 16750\u201316761 (2023)","DOI":"10.1109\/CVPR52729.2023.01607"},{"issue":"1","key":"1_CR17","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1109\/70.127236","volume":"8","author":"YK Hwang","year":"1992","unstructured":"Hwang, Y.K., Ahuja, N., et al.: A potential field approach to path planning. IEEE Trans. Robot. Autom. 8(1), 23\u201332 (1992)","journal-title":"IEEE Trans. Robot. Autom."},{"key":"1_CR18","doi-asserted-by":"crossref","unstructured":"Ji, Y., Xu, F., Yang, Y., Shen, F., Shen, H.T., Zheng, W.S.: A large-scale rgb-d database for arbitrary-view human action recognition. In: Proceedings of the 26th ACM international Conference on Multimedia, pp. 1510\u20131518 (2018)","DOI":"10.1145\/3240508.3240675"},{"key":"1_CR19","doi-asserted-by":"crossref","unstructured":"Lee, J., Joo, H.: Locomotion-action-manipulation: synthesizing human-scene interactions in complex 3d environments. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 9663\u20139674 (October 2023)","DOI":"10.1109\/ICCV51070.2023.00886"},{"issue":"6","key":"1_CR20","first-page":"1","volume":"42","author":"J Li","year":"2023","unstructured":"Li, J., Wu, J., Liu, C.K.: Object motion guided human motion synthesis. ACM Trans. Graph. (TOG) 42(6), 1\u201311 (2023)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"1_CR21","doi-asserted-by":"crossref","unstructured":"Li, R., Yang, S., Ross, D.A., Kanazawa, A.: Ai choreographer: music conditioned 3d dance generation with aist++. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 13401\u201313412 (2021)","DOI":"10.1109\/ICCV48922.2021.01315"},{"key":"1_CR22","unstructured":"Li, R., Yang, S., Ross, D.A., Kanazawa, A.: Learn to dance with aist++: Music conditioned 3d dance generation, vol. 2(3). arXiv preprint arXiv:2101.08779 (2021)"},{"key":"1_CR23","doi-asserted-by":"crossref","unstructured":"Li, Y.L., et al.: Detailed 2d-3d joint representation for human-object interaction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10166\u201310175 (2020)","DOI":"10.1109\/CVPR42600.2020.01018"},{"key":"1_CR24","unstructured":"Lin, J., et al.: Motion-x: A large-scale 3d expressive whole-body human motion dataset. arXiv preprint arXiv:2307.00818 (2023)"},{"issue":"6","key":"1_CR25","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2816795.2818013","volume":"34","author":"M Loper","year":"2015","unstructured":"Loper, M., Mahmood, N., Romero, J., Pons-Moll, G., Black, M.J.: Smpl: a skinned multi-person linear model. ACM Trans. Graph. (TOG) 34(6), 1\u201316 (2015)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"1_CR26","doi-asserted-by":"publisher","unstructured":"Lucas, T., Baradel, F., Weinzaepfel, P., Rogez, G.: Posegpt: quantization-based 3d human motion generation and forecasting. In: Computer Vision\u2013ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23\u201327, 2022, Proceedings, Part VI, pp. 417\u2013435. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-20068-7_24","DOI":"10.1007\/978-3-031-20068-7_24"},{"key":"1_CR27","doi-asserted-by":"crossref","unstructured":"Mahmood, N., Ghorbani, N., Troje, N.F., Pons-Moll, G., Black, M.J.: Amass: archive of motion capture as surface shapes. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 5442\u20135451 (2019)","DOI":"10.1109\/ICCV.2019.00554"},{"key":"1_CR28","doi-asserted-by":"publisher","unstructured":"Nie, Y., Dai, A., Han, X., Nie\u00dfner, M.: Pose2room: understanding 3d scenes from human activities. In: European Conference on Computer Vision, pp. 425\u2013443. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-19812-0_25","DOI":"10.1007\/978-3-031-19812-0_25"},{"key":"1_CR29","doi-asserted-by":"crossref","unstructured":"Pavlakos, G., et al.: Expressive body capture: 3D hands, face, and body from a single image. In: Proceedings IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 10975\u201310985 (2019)","DOI":"10.1109\/CVPR.2019.01123"},{"key":"1_CR30","doi-asserted-by":"crossref","unstructured":"Petrovich, M., Black, M.J., Varol, G.: Action-conditioned 3d human motion synthesis with transformer vae. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 10985\u201310995 (2021)","DOI":"10.1109\/ICCV48922.2021.01080"},{"key":"1_CR31","doi-asserted-by":"publisher","unstructured":"Petrovich, M., Black, M.J., Varol, G.: Temos: generating diverse human motions from textual descriptions. In: Computer Vision\u2013ECCV 2022: 17th European Conference, Tel Aviv, Israel, 23\u201327 October 2022, Proceedings, Part XXII, pp. 480\u2013497. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-20047-2_28","DOI":"10.1007\/978-3-031-20047-2_28"},{"key":"1_CR32","doi-asserted-by":"crossref","unstructured":"Petrovich, M., Black, M.J., Varol, G.: Tmr: Text-to-motion retrieval using contrastive 3d human motion synthesis. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 9488\u20139497 (October 2023)","DOI":"10.1109\/ICCV51070.2023.00870"},{"issue":"4","key":"1_CR33","doi-asserted-by":"publisher","first-page":"236","DOI":"10.1089\/big.2016.0028","volume":"4","author":"M Plappert","year":"2016","unstructured":"Plappert, M., Mandery, C., Asfour, T.: The kit motion-language dataset. Big Data 4(4), 236\u2013252 (2016)","journal-title":"Big Data"},{"key":"1_CR34","doi-asserted-by":"crossref","unstructured":"Prokudin, S., Lassner, C., Romero, J.: Efficient learning on point clouds with basis point sets. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 4332\u20134341 (2019)","DOI":"10.1109\/ICCV.2019.00443"},{"key":"1_CR35","unstructured":"Puig, X., et al.: Habitat 3.0: A co-habitat for humans, avatars and robots (2023)"},{"issue":"6","key":"1_CR36","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3355089.3356505","volume":"38","author":"S Starke","year":"2019","unstructured":"Starke, S., Zhang, H., Komura, T., Saito, J.: Neural state machine for character-scene interactions. ACM Trans. Graph. 38(6), 1\u2013209 (2019)","journal-title":"ACM Trans. Graph."},{"key":"1_CR37","unstructured":"Straub, J et\u00a0al.: The replica dataset: A digital replica of indoor spaces. arXiv preprint arXiv:1906.05797 (2019)"},{"key":"1_CR38","unstructured":"Szot, A., et al.: Habitat 2.0: training home assistants to rearrange their habitat. In: Advances in Neural Information Processing Systems (NeurIPS) (2021)"},{"key":"1_CR39","doi-asserted-by":"crossref","unstructured":"Taheri, O., Choutas, V., Black, M.J., Tzionas, D.: Goal: generating 4d whole-body motion for hand-object grasping. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13263\u201313273 (2022)","DOI":"10.1109\/CVPR52688.2022.01291"},{"key":"1_CR40","doi-asserted-by":"publisher","unstructured":"Tessler, C., Kasten, Y., Guo, Y., Mannor, S., Chechik, G., Peng, X.B.: Calm: conditional adversarial latent models for directable virtual characters. In: ACM SIGGRAPH 2023 Conference Proceedings, SIGGRAPH 2023, Association for Computing Machinery, New York (2023). https:\/\/doi.org\/10.1145\/3588432.3591541","DOI":"10.1145\/3588432.3591541"},{"key":"1_CR41","doi-asserted-by":"publisher","unstructured":"Tevet, G., Gordon, B., Hertz, A., Bermano, A.H., Cohen-Or, D.: Motionclip: Exposing human motion generation to clip space. In: Computer Vision\u2013ECCV 2022: 17th European Conference, Tel Aviv, Israel, 23\u201327 October 2022, Proceedings, Part XXII, pp. 358\u2013374. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-20047-2_2","DOI":"10.1007\/978-3-031-20047-2_2"},{"key":"1_CR42","unstructured":"Tevet, G., Raab, S., Gordon, B., Shafir, Y., Cohen-or, D., Bermano, A.H.: Human motion diffusion model. In: The Eleventh International Conference on Learning Representations (2022)"},{"key":"1_CR43","doi-asserted-by":"crossref","unstructured":"Wang, J., Xu, H., Xu, J., Liu, S., Wang, X.: Synthesizing long-term 3d human motion and interaction in 3d scenes. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9401\u20139411 (2021)","DOI":"10.1109\/CVPR46437.2021.00928"},{"key":"1_CR44","doi-asserted-by":"crossref","unstructured":"Wang, J., Rong, Y., Liu, J., Yan, S., Lin, D., Dai, B.: Towards diverse and natural scene-aware 3d human motion synthesis. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 20460\u201320469 (2022)","DOI":"10.1109\/CVPR52688.2022.01981"},{"key":"1_CR45","first-page":"14959","volume":"35","author":"Z Wang","year":"2022","unstructured":"Wang, Z., Chen, Y., Liu, T., Zhu, Y., Liang, W., Huang, S.: Humanise: language-conditioned human motion generation in 3d scenes. Adv. Neural. Inf. Process. Syst. 35, 14959\u201314971 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"1_CR46","doi-asserted-by":"publisher","unstructured":"Wu, Y., Wang, J., Zhang, Y., Zhang, S., Hilliges, O., Yu, F., Tang, S.: Saga: stochastic whole-body grasping with contact. In: European Conference on Computer Vision, pp. 257\u2013274. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-20068-7_1","DOI":"10.1007\/978-3-031-20068-7_1"},{"key":"1_CR47","doi-asserted-by":"crossref","unstructured":"Xu, L., et al.: Actformer: a gan-based transformer towards general action-conditioned 3d human motion generation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 2228\u20132238 (October 2023)","DOI":"10.1109\/ICCV51070.2023.00212"},{"key":"1_CR48","doi-asserted-by":"crossref","unstructured":"Ye, S., et al.: Scene synthesis from human motion. In: SIGGRAPH Asia 2022 Conference Papers (2022)","DOI":"10.1145\/3550469.3555426"},{"key":"1_CR49","doi-asserted-by":"crossref","unstructured":"Yi, H., Huang, C.H.P., Tripathi, S., Hering, L., Thies, J., Black, M.J.: Mime: human-aware 3d scene generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 12965\u201312976 (June 2023)","DOI":"10.1109\/CVPR52729.2023.01246"},{"key":"1_CR50","doi-asserted-by":"crossref","unstructured":"Yi, H., et al.: Human-aware object placement for visual environment reconstruction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3959\u20133970 (2022)","DOI":"10.1109\/CVPR52688.2022.00393"},{"key":"1_CR51","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1007\/978-3-030-58610-2_3","volume-title":"Computer Vision \u2013 ECCV 2020","author":"JY Zhang","year":"2020","unstructured":"Zhang, J.Y., Pepose, S., Joo, H., Ramanan, D., Malik, J., Kanazawa, A.: Perceiving 3D human-object spatial arrangements from a single image in the wild. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12357, pp. 34\u201351. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58610-2_3"},{"key":"1_CR52","doi-asserted-by":"crossref","unstructured":"Zhang, J., et al.: Generating human motion from textual descriptions with discrete representations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 14730\u201314740 (June 2023)","DOI":"10.1109\/CVPR52729.2023.01415"},{"key":"1_CR53","unstructured":"Zhang, M., et al.: Motiondiffuse: text-driven human motion generation with diffusion model. arXiv preprint arXiv:2208.15001 (2022)"},{"key":"1_CR54","doi-asserted-by":"crossref","unstructured":"Zhang, M., et al.: Remodiffuse: retrieval-augmented motion diffusion model. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 364\u2013373 (October 2023)","DOI":"10.1109\/ICCV51070.2023.00040"},{"key":"1_CR55","doi-asserted-by":"crossref","unstructured":"Zhang, S., Zhang, Y., Ma, Q., Black, M.J., Tang, S.: Place: proximity learning of articulation and contact in 3d environments. In: 2020 International Conference on 3D Vision (3DV), pp. 642\u2013651. IEEE (2020)","DOI":"10.1109\/3DV50981.2020.00074"},{"key":"1_CR56","doi-asserted-by":"publisher","unstructured":"Zhang, X., Bhatnagar, B.L., Starke, S., Guzov, V., Pons-Moll, G.: Couch: towards controllable human-chair interactions. In: European Conference on Computer Vision, pp. 518\u2013535. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-20065-6_3","DOI":"10.1007\/978-3-031-20065-6_3"},{"key":"1_CR57","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Hassan, M., Neumann, H., Black, M.J., Tang, S.: Generating 3d people in scenes without people. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6194\u20136204 (2020)","DOI":"10.1109\/CVPR42600.2020.00623"},{"key":"1_CR58","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Tang, S.: The wanderings of odysseus in 3d scenes. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 20481\u201320491 (2022)","DOI":"10.1109\/CVPR52688.2022.01983"},{"key":"1_CR59","doi-asserted-by":"crossref","unstructured":"Zhao, K., Wang, S., Zhang, Y., Beeler, T., Tang, S.: Compositional human-scene interaction synthesis with semantic control. In: European Conference on Computer Vision, pp. 311\u2013327. Springer (2022)","DOI":"10.1007\/978-3-031-20068-7_18"},{"key":"1_CR60","doi-asserted-by":"crossref","unstructured":"Zhao, K., Zhang, Y., Wang, S., Beeler, T., Tang, S.: Synthesizing diverse human motions in 3d indoor scenes. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 14738\u201314749 (October 2023)","DOI":"10.1109\/ICCV51070.2023.01354"},{"key":"1_CR61","doi-asserted-by":"publisher","unstructured":"Zheng, Y., et al.: Gimo: gaze-informed human motion prediction in context. In: European Conference on Computer Vision, pp. 676\u2013694. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-19778-9_39","DOI":"10.1007\/978-3-031-19778-9_39"},{"key":"1_CR62","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Barnes, C., Lu, J., Yang, J., Li, H.: On the continuity of rotation representations in neural networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5745\u20135753 (2019)","DOI":"10.1109\/CVPR.2019.00589"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72973-7_1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T12:24:44Z","timestamp":1737116684000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72973-7_1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,1]]},"ISBN":["9783031729720","9783031729737"],"references-count":62,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72973-7_1","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,1]]},"assertion":[{"value":"1 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}