{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,25]],"date-time":"2025-05-25T18:10:04Z","timestamp":1748196604474,"version":"3.41.0"},"publisher-location":"Cham","reference-count":37,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031915741","type":"print"},{"value":"9783031915758","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-91575-8_19","type":"book-chapter","created":{"date-parts":[[2025,5,25]],"date-time":"2025-05-25T17:57:44Z","timestamp":1748195864000},"page":"307-323","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Motion Reconstruction via\u00a0Human Anatomy Diffusion from\u00a0Sparse Tracking"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-1732-8627","authenticated-orcid":false,"given":"Zehai","family":"Niu","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0176-3088","authenticated-orcid":false,"given":"Ke","family":"Lu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0006-3714-1650","authenticated-orcid":false,"given":"Kun","family":"Dong","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9460-802X","authenticated-orcid":false,"given":"Jian","family":"Xue","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9720-3220","authenticated-orcid":false,"given":"Xiaoyu","family":"Qin","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5916-8965","authenticated-orcid":false,"given":"Jinbao","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,5,12]]},"reference":[{"key":"19_CR1","doi-asserted-by":"crossref","unstructured":"Ahuja, K., Ofek, E., Gonzalez-Franco, M., Holz, C., Wilson, A.D.: Coolmoves: user motion accentuation in virtual reality. In: Proceedings of the ACM on Interactive, Mobile, Wearable and Ubiquitous Technologies 5(2), pp. 1\u201323 (2021)","DOI":"10.1145\/3463499"},{"key":"19_CR2","doi-asserted-by":"crossref","unstructured":"Chen, X., Jiang, B., Liu, W., Huang, Z., Fu, B., Chen, T., Yu, G.: Executing your commands via motion diffusion in latent space. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 18000\u201318010 (2023)","DOI":"10.1109\/CVPR52729.2023.01726"},{"key":"19_CR3","doi-asserted-by":"crossref","unstructured":"Choi, J., Kim, S., Jeong, Y., Gwon, Y., Yoon, S.: Ilvr: conditioning method for denoising diffusion probabilistic models. arXiv preprint arXiv:2108.02938 (2021)","DOI":"10.1109\/ICCV48922.2021.01410"},{"key":"19_CR4","doi-asserted-by":"crossref","unstructured":"Dabral, R., Mughal, M.H., Golyanik, V., Theobalt, C.: Mofusion: A framework for denoising-diffusion-based motion synthesis. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 9760\u20139770 (2023)","DOI":"10.1109\/CVPR52729.2023.00941"},{"key":"19_CR5","doi-asserted-by":"crossref","unstructured":"Di, X., Dai, X., Zhang, X., Chen, X.: Dual attention poser: dual path body tracking based on attention. In: 2023 IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), pp. 2795\u20132804. IEEE (2023)","DOI":"10.1109\/CVPRW59228.2023.00280"},{"key":"19_CR6","doi-asserted-by":"crossref","unstructured":"Dittadi, A., Dziadzio, S., Cosker, D., Lundell, B., Cashman, T.J., Shotton, J.: Full-body motion from a single head-mounted device: generating smpl poses from partial observations. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 11687\u201311697 (2021)","DOI":"10.1109\/ICCV48922.2021.01148"},{"key":"19_CR7","doi-asserted-by":"crossref","unstructured":"Du, Y., Kips, R., Pumarola, A., Starke, S., Thabet, A., Sanakoyeu, A.: Avatars grow legs: generating smooth human motion from sparse tracking inputs with diffusion model. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 481\u2013490 (2023)","DOI":"10.1109\/CVPR52729.2023.00054"},{"key":"19_CR8","doi-asserted-by":"crossref","unstructured":"Flash, T., Hogan, N.: The coordination of arm movements: an experimentally confirmed mathematical model. J. Neurosci. (1985)","DOI":"10.1523\/JNEUROSCI.05-07-01688.1985"},{"key":"19_CR9","first-page":"6840","volume":"33","author":"J Ho","year":"2020","unstructured":"Ho, J., Jain, A., Abbeel, P.: Denoising diffusion probabilistic models. Adv. Neural. Inf. Process. Syst. 33, 6840\u20136851 (2020)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"issue":"6","key":"19_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3272127.3275108","volume":"37","author":"Y Huang","year":"2018","unstructured":"Huang, Y., Kaufmann, M., Aksan, E., Black, M.J., Hilliges, O., Pons-Moll, G.: Deep inertial poser: learning to reconstruct human pose from sparse inertial measurements in real time. ACM Trans. Graph. (TOG) 37(6), 1\u201315 (2018)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"19_CR11","doi-asserted-by":"crossref","unstructured":"Jiang, J., et al.: Avatarposer: articulated full-body pose tracking from sparse motion sensing. In: European Conference on Computer Vision, pp. 443\u2013460. Springer (2022)","DOI":"10.1007\/978-3-031-20065-6_26"},{"key":"19_CR12","doi-asserted-by":"crossref","unstructured":"Jin, Z., et al.: Holosinger: semantics and music driven motion generation with octahedral holographic projection. In: Proceedings of the 31st ACM International Conference on Multimedia, pp. 9393\u20139395 (2023)","DOI":"10.1145\/3581783.3612674"},{"key":"19_CR13","doi-asserted-by":"crossref","unstructured":"Kim, J., Kim, J., Choi, S.: Flame: free-form language-based motion synthesis & editing. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol.\u00a037, pp. 8255\u20138263 (2023)","DOI":"10.1609\/aaai.v37i7.25996"},{"key":"19_CR14","doi-asserted-by":"crossref","unstructured":"Lin, J., Zeng, A., Wang, H., Zhang, L., Li, Y.: One-stage 3d whole-body mesh recovery with component aware transformer. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 21159\u201321168 (2023)","DOI":"10.1109\/CVPR52729.2023.02027"},{"key":"19_CR15","doi-asserted-by":"crossref","unstructured":"Loper, M., Mahmood, N., Romero, J., Pons-Moll, G., Black, M.J.: Smpl: A skinned multi-person linear model. In: Seminal Graphics Papers: Pushing the Boundaries, vol. 2, pp. 851\u2013866 (2023)","DOI":"10.1145\/3596711.3596800"},{"key":"19_CR16","unstructured":"Lou, Y., Zhu, L., Wang, Y., Wang, X., Yang, Y.: Diversemotion: towards diverse human motion generation via discrete diffusion. arXiv preprint arXiv:2309.01372 (2023)"},{"key":"19_CR17","unstructured":"Lu, S., et al.: Humantomato: text-aligned whole-body motion generation. arXiv preprint arXiv:2310.12978 (2023)"},{"key":"19_CR18","unstructured":"Nichol, A., et al.: Glide: towards photorealistic image generation and editing with text-guided diffusion models. arXiv preprint arXiv:2112.10741 (2021)"},{"key":"19_CR19","unstructured":"Nichol, A.Q., Dhariwal, P.: Improved denoising diffusion probabilistic models. In: International Conference on Machine Learning, pp. 8162\u20138171. PMLR (2021)"},{"key":"19_CR20","doi-asserted-by":"crossref","unstructured":"Petrovich, M., Black, M.J., Varol, G.: TMR: text-to-motion retrieval using contrastive 3D human motion synthesis. In: International Conference on Computer Vision (ICCV) (2023)","DOI":"10.1109\/ICCV51070.2023.00870"},{"key":"19_CR21","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., Chu, C., Chen, M.: Hierarchical text-conditional image generation with clip latents. arXiv preprint arXiv:2204.061251(2), 3 (2022)"},{"key":"19_CR22","unstructured":"Roetenberg, D., Luinge, H., Slycke, P.J.: Xsens mvn: Full 6dof human motion tracking using miniature inertial sensors (2009)"},{"key":"19_CR23","unstructured":"Sohl-Dickstein, J., Weiss, E., Maheswaranathan, N., Ganguli, S.: Deep unsupervised learning using nonequilibrium thermodynamics. In: International Conference on Machine Learning, pp. 2256\u20132265. PMLR (2015)"},{"key":"19_CR24","doi-asserted-by":"crossref","unstructured":"Sun, Y., Bao, Q., Liu, W., Mei, T., Black, M.J.: Trace: 5d temporal regression of avatars with dynamic cameras in 3d environments. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8856\u20138866 (2023)","DOI":"10.1109\/CVPR52729.2023.00855"},{"key":"19_CR25","unstructured":"Tevet, G., Raab, S., Gordon, B., Shafir, Y., Cohen-Or, D., Bermano, A.H.: Human motion diffusion model. arXiv preprint arXiv:2209.14916 (2022)"},{"key":"19_CR26","doi-asserted-by":"crossref","unstructured":"Von\u00a0Marcard, T., Rosenhahn, B., Black, M.J., Pons-Moll, G.: Sparse inertial poser: automatic 3d human pose estimation from sparse imus. In: Computer Graphics Forum, vol.\u00a036, pp. 349\u2013360. Wiley Online Library (2017)","DOI":"10.1111\/cgf.13131"},{"key":"19_CR27","doi-asserted-by":"crossref","unstructured":"Wang, J., Liu, L., Xu, W., Sarkar, K., Luvizon, D., Theobalt, C.: Estimating egocentric 3d human pose in the wild with external weak supervision. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13157\u201313166 (2022)","DOI":"10.1109\/CVPR52688.2022.01281"},{"key":"19_CR28","doi-asserted-by":"crossref","unstructured":"Wang, J., Liu, L., Xu, W., Sarkar, K., Theobalt, C.: Estimating egocentric 3d human pose in global space. In: International Conference on Computer Vision (2021)","DOI":"10.1109\/ICCV48922.2021.01130"},{"key":"19_CR29","doi-asserted-by":"crossref","unstructured":"Wang, J., Luvizon, D., Xu, W., Liu, L., Sarkar, K., Theobalt, C.: Scene-aware egocentric 3d human pose estimation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13031\u201313040 (2023)","DOI":"10.1109\/CVPR52729.2023.01252"},{"key":"19_CR30","doi-asserted-by":"crossref","unstructured":"Yang, D., Kim, D., Lee, S.H.: Lobstr: real-time lower-body pose prediction from sparse upper-body tracking signals. In: Computer Graphics Forum, vol.\u00a040, pp. 265\u2013275. Wiley Online Library (2021)","DOI":"10.1111\/cgf.142631"},{"key":"19_CR31","doi-asserted-by":"crossref","unstructured":"Yi, H., Liang, H., Liu, Y., Cao, Q., Wen, Y., Bolkart, T., Tao, D., Black, M.J.: Generating holistic 3d human motion from speech. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 469\u2013480, June 2023","DOI":"10.1109\/CVPR52729.2023.00053"},{"key":"19_CR32","doi-asserted-by":"crossref","unstructured":"Yi, X., Zhou, Y., Habermann, M., Shimada, S., Golyanik, V., Theobalt, C., Xu, F.: Physical inertial poser (pip): Physics-aware real-time human motion tracking from sparse inertial sensors. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13167\u201313178 (2022)","DOI":"10.1109\/CVPR52688.2022.01282"},{"issue":"4","key":"19_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3450626.3459786","volume":"40","author":"X Yi","year":"2021","unstructured":"Yi, X., Zhou, Y., Xu, F.: Transpose: real-time 3d human translation and pose estimation with six inertial sensors. ACM Trans. Graph. (TOG) 40(4), 1\u201313 (2021)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"19_CR34","doi-asserted-by":"crossref","unstructured":"Zhang, J., et al.: T2m-gpt: generating human motion from textual descriptions with discrete representations. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2023)","DOI":"10.1109\/CVPR52729.2023.01415"},{"key":"19_CR35","unstructured":"Zhang, M., et al.: Motiondiffuse: text-driven human motion generation with diffusion model. arXiv preprint arXiv:2208.15001 (2022)"},{"key":"19_CR36","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Xia, S., Chu, L., Yang, J., Wu, Q., Pei, L.: Dynamic inertial poser (dynaip): Part-based motion dynamics learning for enhanced human pose estimation with sparse inertial sensors. arXiv preprint arXiv:2312.02196 (2023)","DOI":"10.1109\/CVPR52733.2024.00185"},{"key":"19_CR37","doi-asserted-by":"crossref","unstructured":"Zhu, W., Ma, X., Liu, Z., Liu, L., Wu, W., Wang, Y.: Motionbert: a unified perspective on learning human motion representations. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (2023)","DOI":"10.1109\/ICCV51070.2023.01385"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-91575-8_19","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,25]],"date-time":"2025-05-25T17:57:56Z","timestamp":1748195876000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-91575-8_19"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031915741","9783031915758"],"references-count":37,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-91575-8_19","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"12 May 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}