{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,8]],"date-time":"2026-01-08T07:00:27Z","timestamp":1767855627083,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":48,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,12,3]],"date-time":"2024-12-03T00:00:00Z","timestamp":1733184000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,12,3]]},"DOI":"10.1145\/3680528.3687703","type":"proceedings-article","created":{"date-parts":[[2024,12,3]],"date-time":"2024-12-03T08:14:37Z","timestamp":1733213677000},"page":"1-11","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":5,"title":["F\u00fcrElise: Capturing and Physically Synthesizing Hand Motion of Piano Performance"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-8404-6405","authenticated-orcid":false,"given":"Ruocheng","family":"Wang","sequence":"first","affiliation":[{"name":"Stanford University, Stanford, United States of America"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7851-3971","authenticated-orcid":false,"given":"Pei","family":"Xu","sequence":"additional","affiliation":[{"name":"Stanford University, Stanford, United States of America"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3604-465X","authenticated-orcid":false,"given":"Haochen","family":"Shi","sequence":"additional","affiliation":[{"name":"Stanford University, Stanford, United States of America"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-1331-2707","authenticated-orcid":false,"given":"Elizabeth","family":"Schumann","sequence":"additional","affiliation":[{"name":"Stanford University, Stanford, United States of America"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5926-0905","authenticated-orcid":false,"given":"C. Karen","family":"Liu","sequence":"additional","affiliation":[{"name":"Stanford University, Stanford, United States of America"}]}],"member":"320","published-online":{"date-parts":[[2024,12,3]]},"reference":[{"key":"e_1_3_3_1_2_1","doi-asserted-by":"crossref","unstructured":"Simon Alexanderson Rajmund Nagy Jonas Beskow and Gustav\u00a0Eje Henter. 2023. Listen denoise action! audio-driven motion synthesis with diffusion models. ACM Transactions on Graphics (TOG) 42 4 (2023) 1\u201320.","DOI":"10.1145\/3592458"},{"key":"e_1_3_3_1_3_1","doi-asserted-by":"crossref","unstructured":"OpenAI:\u00a0Marcin Andrychowicz Bowen Baker Maciek Chociej Rafal Jozefowicz Bob McGrew Jakub Pachocki Arthur Petron Matthias Plappert Glenn Powell Alex Ray et\u00a0al. 2020. Learning dexterous in-hand manipulation. The International Journal of Robotics Research 39 1 (2020) 3\u201320.","DOI":"10.1177\/0278364919887447"},{"key":"e_1_3_3_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00893"},{"key":"e_1_3_3_1_5_1","doi-asserted-by":"crossref","unstructured":"Jiali Chen Changjie Fan Zhimeng Zhang Gongzheng Li Zeng Zhao Zhigang Deng and Yu Ding. 2023a. A Music-Driven Deep Generative Adversarial Model for Guzheng Playing Animation. IEEE Transactions on Visualization and Computer Graphics 29 2 (2023) 1400\u20131414.","DOI":"10.1109\/TVCG.2021.3115902"},{"key":"e_1_3_3_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3588432.3591528"},{"key":"e_1_3_3_1_7_1","unstructured":"George ElKoura and Karan Singh. 2003. Handrix: Animating the Human Hand. (2003) 110\u2013119."},{"key":"e_1_3_3_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01244"},{"key":"e_1_3_3_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01834"},{"key":"e_1_3_3_1_10_1","first-page":"6840","volume-title":"Advances in Neural Information Processing Systems(NeurIPS)","author":"Ho Jonathan","year":"2020","unstructured":"Jonathan Ho, Ajay Jain, and Pieter Abbeel. 2020. Denoising diffusion probabilistic models. In Advances in Neural Information Processing Systems(NeurIPS) , Vol.\u00a033. 6840\u20136851."},{"key":"e_1_3_3_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413848"},{"key":"e_1_3_3_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/HUMANOIDS.2015.7363441"},{"key":"e_1_3_3_1_13_1","first-page":"218","volume-title":"ISMIR","author":"Li Bochen","year":"2018","unstructured":"Bochen Li, Akira Maezawa, and Zhiyao Duan. 2018. Skeleton Plays Piano: Online Generation of Pianist Body Movements from MIDI Performance.. In ISMIR. 218\u2013224."},{"key":"e_1_3_3_1_14_1","doi-asserted-by":"crossref","unstructured":"Jiaman Li Jiajun Wu and C\u00a0Karen Liu. 2023. Object motion guided human motion synthesis. ACM Transactions on Graphics (TOG) 42 6 (2023) 1\u201311.","DOI":"10.1145\/3618333"},{"key":"e_1_3_3_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01315"},{"key":"e_1_3_3_1_16_1","unstructured":"Jae\u00a0Hyun Lim and Jong\u00a0Chul Ye. 2017. Geometric gan. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1705.02894 (2017)."},{"key":"e_1_3_3_1_17_1","doi-asserted-by":"publisher","DOI":"10.5555\/1632592.1632616"},{"key":"e_1_3_3_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/1576246.1531365"},{"key":"e_1_3_3_1_19_1","doi-asserted-by":"crossref","unstructured":"Jun-Wei Liu Hung-Yi Lin Yu-Fen Huang Hsuan-Kai Kao and Li Su. 2020. Body Movement Generation for Expressive Violin Performance Applying Neural Networks. International Conference on Acoustics Speech and Signal Processing (ICASSP) (2020) 3787\u20133791.","DOI":"10.1109\/ICASSP40776.2020.9054463"},{"key":"e_1_3_3_1_20_1","volume-title":"International Conference on Learning Representations (ICLR)","author":"Liu Xueyi","year":"2024","unstructured":"Xueyi Liu and Li Yi. 2024. GeneOH Diffusion: Towards Generalizable Hand-Object Interaction Denoising via Denoising Diffusion. In International Conference on Learning Representations (ICLR)."},{"key":"e_1_3_3_1_21_1","unstructured":"Viktor Makoviychuk Lukasz Wawrzyniak Yunrong Guo Michelle Lu Kier Storey Miles Macklin David Hoeller Nikita Rudin Arthur Allshire Ankur Handa and Gavriel State. 2021. Isaac Gym: High Performance GPU-Based Physics Simulation For Robot Learning. arxiv:https:\/\/arXiv.org\/abs\/2108.10470\u00a0[cs.RO]"},{"key":"e_1_3_3_1_22_1","unstructured":"Josh Merel Yuval Tassa Dhruva TB Sriram Srinivasan Jay Lemmon Ziyu Wang Greg Wayne and Nicolas Heess. 2017. Learning human behaviors from motion capture by adversarial imitation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1707.02201 (2017)."},{"key":"e_1_3_3_1_23_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58565-5_33"},{"key":"e_1_3_3_1_24_1","doi-asserted-by":"publisher","DOI":"10.5555\/2422356.2422377"},{"key":"e_1_3_3_1_25_1","volume-title":"The art of piano playing","author":"Neuhaus Heinrich","year":"2008","unstructured":"Heinrich Neuhaus. 2008. The art of piano playing. Kahn and Averill."},{"key":"e_1_3_3_1_26_1","doi-asserted-by":"crossref","unstructured":"Georgios Pavlakos Dandan Shan Ilija Radosavovic Angjoo Kanazawa David Fouhey and Jitendra Malik. 2024. Reconstructing Hands in 3D with Transformers.","DOI":"10.1109\/CVPR52733.2024.00938"},{"key":"e_1_3_3_1_27_1","doi-asserted-by":"crossref","unstructured":"Xue\u00a0Bin Peng Yunrong Guo Lina Halper Sergey Levine and Sanja Fidler. 2022. ASE: Large-Scale Reusable Adversarial Skill Embeddings for Physically Simulated Characters. ACM Trans. Graph. 41 4 Article 94 (2022).","DOI":"10.1145\/3528223.3530110"},{"key":"e_1_3_3_1_28_1","doi-asserted-by":"crossref","unstructured":"Xue\u00a0Bin Peng Ze Ma Pieter Abbeel Sergey Levine and Angjoo Kanazawa. 2021. AMP: Adversarial Motion Priors for Stylized Physics-Based Character Control. ACM Trans. Graph. 40 4 Article 144 (2021).","DOI":"10.1145\/3476576.3476723"},{"key":"e_1_3_3_1_29_1","doi-asserted-by":"publisher","unstructured":"Javier Romero Dimitrios Tzionas and Michael\u00a0J. Black. 2017. Embodied hands: modeling and capturing hands and bodies together. ACM Trans. Graph. 36 6 Article 245 (nov 2017) 17\u00a0pages. 10.1145\/3130800.3130883https:\/\/dl.acm.org\/doi\/10.1145\/3130800.3130883","DOI":"10.1145\/3130800.3130883"},{"key":"e_1_3_3_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00790"},{"key":"e_1_3_3_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.494"},{"key":"e_1_3_3_1_32_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58548-8_34"},{"key":"e_1_3_3_1_33_1","volume-title":"International Conference on Learning Representations (ICLR)","author":"Tevet Guy","year":"2023","unstructured":"Guy Tevet, Sigal Raab, Brian Gordon, Yoni Shafir, Daniel Cohen-or, and Amit\u00a0Haim Bermano. 2023. Human Motion Diffusion Model. In International Conference on Learning Representations (ICLR). https:\/\/openreview.net\/forum?id=SJ1kSyO2jwu"},{"key":"e_1_3_3_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00051"},{"key":"e_1_3_3_1_35_1","doi-asserted-by":"crossref","unstructured":"Chen Wang Haochen Shi Weizhuo Wang Ruohan Zhang Li Fei-Fei and C.\u00a0Karen Liu. 2024. DexCap: Scalable and Portable Mocap Data Collection System for Dexterous Manipulation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.07788 (2024).","DOI":"10.15607\/RSS.2024.XX.043"},{"key":"e_1_3_3_1_36_1","doi-asserted-by":"crossref","unstructured":"Yangang Wang Jianyuan Min Jianjie Zhang Yebin Liu Feng Xu Qionghai Dai and Jinxiang Chai. 2013. Video-based hand manipulation capture through composite motion control. ACM Transactions on Graphics (TOG) 32 4 (2013) 1\u201314.","DOI":"10.1145\/2461912.2462000"},{"key":"e_1_3_3_1_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV56688.2023.00299"},{"key":"e_1_3_3_1_38_1","doi-asserted-by":"crossref","unstructured":"Zhaoming Xie Jonathan Tseng Sebastian Starke Michiel van\u00a0de Panne and C\u00a0Karen Liu. 2023. Hierarchical planning and control for box loco-manipulation. Proceedings of the ACM on Computer Graphics and Interactive Techniques 6 3 (2023) 1\u201318.","DOI":"10.1145\/3606931"},{"key":"e_1_3_3_1_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/IROS47612.2022.9981221"},{"key":"e_1_3_3_1_40_1","doi-asserted-by":"crossref","unstructured":"Pei Xu and Ioannis Karamouzas. 2021. A GAN-Like Approach for Physics-Based Imitation Learning and Interactive Character Control. Proc. of the ACM on Computer Graphics and Interactive Techniques 4 3 (2021).","DOI":"10.1145\/3480148"},{"key":"e_1_3_3_1_41_1","doi-asserted-by":"crossref","unstructured":"Pei Xu Xiumin Shang Victor Zordan and Ioannis Karamouzas. 2023. Composite Motion Learning with Task Control. ACM Transactions on Graphics 42 4 (2023).","DOI":"10.1145\/3592447"},{"key":"e_1_3_3_1_42_1","unstructured":"Yamaha. 2024. Yamaha Disklavier Pianos. https:\/\/usa.yamaha.com\/products\/musical_instruments\/pianos\/disklavier\/index.html."},{"key":"e_1_3_3_1_43_1","doi-asserted-by":"crossref","unstructured":"Zeshi Yang Kangkang Yin and Libin Liu. 2022. Learning to use chopsticks in diverse gripping styles. ACM Transactions on Graphics (TOG) 41 4 (2022) 1\u201317.","DOI":"10.1145\/3528223.3530057"},{"key":"e_1_3_3_1_44_1","doi-asserted-by":"crossref","unstructured":"Yuting Ye and C\u00a0Karen Liu. 2012. Synthesis of detailed hand manipulations using contact sampling. ACM Transactions on Graphics (ToG) 31 4 (2012) 1\u201310.","DOI":"10.1145\/2185520.2335392"},{"key":"e_1_3_3_1_45_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01467"},{"key":"e_1_3_3_1_46_1","volume-title":"Conference on Robot Learning (CoRL)","author":"Zakka Kevin","year":"2023","unstructured":"Kevin Zakka, Philipp Wu, Laura Smith, Nimrod Gileadi, Taylor Howell, Xue\u00a0Bin Peng, Sumeet Singh, Yuval Tassa, Pete Florence, Andy Zeng, et\u00a0al. 2023. Robopianist: Dexterous piano playing with deep reinforcement learning. In Conference on Robot Learning (CoRL)."},{"key":"e_1_3_3_1_47_1","doi-asserted-by":"crossref","unstructured":"H Zhang Y Ye T Shiratori and T Komura. 2021. ManipNet: neural manipulation synthesis with a hand-object spatial representation. ACM Transactions on Graphics (2021).","DOI":"10.1145\/3476576.3476690"},{"key":"e_1_3_3_1_48_1","doi-asserted-by":"crossref","unstructured":"Wenping Zhao Jianjie Zhang Jianyuan Min and Jinxiang Chai. 2013. Robust realtime physics-based motion control for human grasping. ACM Transactions on Graphics (TOG) 32 6 (2013) 1\u201312.","DOI":"10.1145\/2508363.2508412"},{"key":"e_1_3_3_1_49_1","doi-asserted-by":"crossref","unstructured":"Yuanfeng Zhu Ajay\u00a0Sundar Ramakrishnan Bernd Hamann and Michael Neff. 2013. A system for automatic animation of piano performances. Computer Animation and Virtual Worlds 24 5 (2013) 445\u2013457.","DOI":"10.1002\/cav.1477"}],"event":{"name":"SA '24: SIGGRAPH Asia 2024 Conference Papers","location":"Tokyo Japan","acronym":"SA '24","sponsor":["SIGGRAPH ACM Special Interest Group on Computer Graphics and Interactive Techniques"]},"container-title":["SIGGRAPH Asia 2024 Conference Papers"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3680528.3687703","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3680528.3687703","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:20Z","timestamp":1750295900000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3680528.3687703"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,3]]},"references-count":48,"alternative-id":["10.1145\/3680528.3687703","10.1145\/3680528"],"URL":"https:\/\/doi.org\/10.1145\/3680528.3687703","relation":{},"subject":[],"published":{"date-parts":[[2024,12,3]]},"assertion":[{"value":"2024-12-03","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}