{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,28]],"date-time":"2026-03-28T08:18:14Z","timestamp":1774685894021,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":58,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,7,13]],"date-time":"2024-07-13T00:00:00Z","timestamp":1720828800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"National Key R&D Program of China","award":["No.2023YFF0905103"],"award-info":[{"award-number":["No.2023YFF0905103"]}]},{"name":"NSFC of China","award":["No.62172013"],"award-info":[{"award-number":["No.62172013"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,7,13]]},"DOI":"10.1145\/3641519.3657493","type":"proceedings-article","created":{"date-parts":[[2024,7,12]],"date-time":"2024-07-12T10:39:28Z","timestamp":1720780768000},"page":"1-12","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["DiffSound: Differentiable Modal Sound Rendering and Inverse Rendering for Diverse Inference Tasks"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9017-4618","authenticated-orcid":false,"given":"Xutong","family":"Jin","sequence":"first","affiliation":[{"name":"School of Computer Science, Peking University, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-3102-6336","authenticated-orcid":false,"given":"Chenxi","family":"Xu","sequence":"additional","affiliation":[{"name":"School of Computer Science, Peking University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8346-1114","authenticated-orcid":false,"given":"Ruohan","family":"Gao","sequence":"additional","affiliation":[{"name":"University of Maryland College Park, United States of America and Stanford University, United States of America"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4176-343X","authenticated-orcid":false,"given":"Jiajun","family":"Wu","sequence":"additional","affiliation":[{"name":"Stanford University, United States of America"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7819-0076","authenticated-orcid":false,"given":"Guoping","family":"Wang","sequence":"additional","affiliation":[{"name":"School of Computer Science, Peking University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8901-2184","authenticated-orcid":false,"given":"Sheng","family":"Li","sequence":"additional","affiliation":[{"name":"School of Computer Science, Peking University, China"}]}],"member":"320","published-online":{"date-parts":[[2024,7,13]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/2567943"},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/2816795.2818108"},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/2185520.2185599"},{"key":"e_1_3_2_2_4_1","volume-title":"RealImpact: A Dataset of Impact Sound Fields for Real Objects. In Conference on Computer Vision and Pattern Recognition (CVPR).","author":"Clarke Samuel","year":"2023","unstructured":"Samuel Clarke, Ruohan Gao, Mason Wang, Mark Rau, Julia Xu, Mark Rau, Jui-Hsien Wang, Doug James, and Jiajun Wu. 2023. RealImpact: A Dataset of Impact Sound Fields for Real Objects. In Conference on Computer Vision and Pattern Recognition (CVPR)."},{"key":"e_1_3_2_2_5_1","volume-title":"DiffImpact: Differentiable Rendering and Identification of Impact Sounds. In 5th Annual Conference on Robot Learning.","author":"Clarke Samuel","year":"2021","unstructured":"Samuel Clarke, Negin Heravi, Mark Rau, Ruohan Gao, Jiajun Wu, Doug James, and Jeannette Bohg. 2021. DiffImpact: Differentiable Rendering and Identification of Impact Sounds. In 5th Annual Conference on Robot Learning."},{"key":"e_1_3_2_2_6_1","volume-title":"Differentiable Physics Simulation of Dynamics-Augmented Neural Objects. Robotics and Automation Letters (RA-L)","author":"Cleac\u2019h Simon\u00a0Le","year":"2023","unstructured":"Simon\u00a0Le Cleac\u2019h, Hong-Xing Yu, Michelle Guo, Taylor\u00a0A. Howell, Ruohan Gao, Jiajun Wu, Zachary Manchester, and Mac Schwager. 2023. Differentiable Physics Simulation of Dynamics-Augmented Neural Objects. Robotics and Automation Letters (RA-L) (2023)."},{"key":"e_1_3_2_2_7_1","unstructured":"COMSOL AB Stockholm Sweden. 2005. Comsol multiphysics user\u2019s guide."},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/2461912.2461986"},{"key":"e_1_3_2_2_9_1","volume-title":"Advances in Neural Information Processing Systems, S.\u00a0Bengio, H.\u00a0Wallach, H.\u00a0Larochelle, K.\u00a0Grauman, N.\u00a0Cesa-Bianchi, and R.\u00a0Garnett (Eds.). Vol.\u00a031. Curran Associates","author":"de Avila Belbute-Peres Filipe","unstructured":"Filipe de Avila Belbute-Peres, Kevin Smith, Kelsey Allen, Josh Tenenbaum, and J.\u00a0Zico Kolter. 2018. End-to-End Differentiable Physics for Learning and Control. In Advances in Neural Information Processing Systems, S.\u00a0Bengio, H.\u00a0Wallach, H.\u00a0Larochelle, K.\u00a0Grauman, N.\u00a0Cesa-Bianchi, and R.\u00a0Garnett (Eds.). Vol.\u00a031. Curran Associates, Inc."},{"key":"e_1_3_2_2_10_1","volume-title":"A differentiable physics engine for deep learning in robotics. Frontiers in neurorobotics","author":"Degrave Jonas","year":"2019","unstructured":"Jonas Degrave, Michiel Hermans, Joni Dambre, 2019. A differentiable physics engine for deep learning in robotics. Frontiers in neurorobotics (2019), 6."},{"key":"e_1_3_2_2_11_1","first-page":"214","article-title":"An efficient method of triangulating equi-valued surfaces by using tetrahedral cells","volume":"74","author":"Doi Akio","year":"1991","unstructured":"Akio Doi and Akio Koide. 1991. An efficient method of triangulating equi-valued surfaces by using tetrahedral cells. IEICE TRANSACTIONS on Information and Systems 74, 1 (1991), 214\u2013224.","journal-title":"IEICE TRANSACTIONS on Information and Systems"},{"key":"e_1_3_2_2_12_1","article-title":"DiffPD","volume":"41","author":"Du Tao","year":"2021","unstructured":"Tao Du, Kui Wu, Pingchuan Ma, Sebastien Wah, Andrew Spielberg, Daniela Rus, and Wojciech Matusik. 2021. DiffPD: Differentiable Projective Dynamics. ACM Trans. Graph. 41, 2, Article 13 (nov 2021), 21\u00a0pages.","journal-title":"Differentiable Projective Dynamics. ACM Trans. Graph."},{"key":"e_1_3_2_2_13_1","volume-title":"DDSP: Differentiable Digital Signal Processing. In International Conference on Learning Representations.","author":"Engel Jesse","year":"2020","unstructured":"Jesse Engel, Lamtharn\u00a0(Hanoi) Hantrakul, Chenjie Gu, and Adam Roberts. 2020. DDSP: Differentiable Digital Signal Processing. In International Conference on Learning Representations."},{"key":"e_1_3_2_2_14_1","volume-title":"The 22nd International Conference on Artificial Intelligence and Statistics. 2681\u20132690","author":"Feydy Jean","year":"2019","unstructured":"Jean Feydy, Thibault S\u00e9journ\u00e9, Fran\u00e7ois-Xavier Vialard, Shun-ichi Amari, Alain Trouve, and Gabriel Peyr\u00e9. 2019. Interpolating between Optimal Transport and MMD using Sinkhorn Divergences. In The 22nd International Conference on Artificial Intelligence and Statistics. 2681\u20132690."},{"key":"e_1_3_2_2_15_1","volume-title":"5th Annual Conference on Robot Learning.","author":"Gao Ruohan","year":"2021","unstructured":"Ruohan Gao, Yen-Yu Chang, Shivani Mall, Li Fei-Fei, and Jiajun Wu. 2021. ObjectFolder: A Dataset of Objects with Implicit Visual, Auditory, and Tactile Representations. In 5th Annual Conference on Robot Learning."},{"key":"e_1_3_2_2_16_1","unstructured":"Ruohan Gao Yiming Dou Hao Li Tanmay Agarwal Jeannette Bohg Yunzhu Li Li Fei-Fei and Jiajun Wu. 2023. The ObjectFolder Benchmark: Multisensory Object-Centric Learning with Neural and Real Objects. In CVPR."},{"key":"e_1_3_2_2_17_1","unstructured":"Ruohan Gao Zilin Si Yen-Yu Chang Samuel Clarke Jeannette Bohg Li Fei-Fei Wenzhen Yuan and Jiajun Wu. 2022. ObjectFolder 2.0: A Multisensory Object Dataset for Sim2Real Transfer. In CVPR."},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3414685.3417766"},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/3355089.3356548"},{"key":"e_1_3_2_2_20_1","volume-title":"International Conference on Learning Representations.","author":"Holl Philipp","year":"2020","unstructured":"Philipp Holl, Nils Thuerey, and Vladlen Koltun. 2020. Learning to Control PDEs with Differentiable Physics. In International Conference on Learning Representations."},{"key":"e_1_3_2_2_21_1","volume-title":"DiffTaichi: Differentiable Programming for Physical Simulation. ICLR","author":"Hu Yuanming","year":"2020","unstructured":"Yuanming Hu, Luke Anderson, Tzu-Mao Li, Qi Sun, Nathan Carr, Jonathan Ragan-Kelley, and Fr\u00e9do Durand. 2020. DiffTaichi: Differentiable Programming for Physical Simulation. ICLR (2020)."},{"key":"e_1_3_2_2_22_1","volume-title":"ChainQueen: A Real-Time Differentiable Physical Simulator for Soft Robotics. In 2019 International Conference on Robotics and Automation (ICRA) (Montreal, QC, Canada). IEEE Press, 6265\u20136271","author":"Hu Yuanming","year":"2019","unstructured":"Yuanming Hu, Jiancheng Liu, Andrew Spielberg, Joshua\u00a0B. Tenenbaum, William\u00a0T. Freeman, Jiajun Wu, Daniela Rus, and Wojciech Matusik. 2019. ChainQueen: A Real-Time Differentiable Physical Simulator for Soft Robotics. In 2019 International Conference on Robotics and Automation (ICRA) (Montreal, QC, Canada). IEEE Press, 6265\u20136271."},{"key":"e_1_3_2_2_23_1","volume-title":"The finite element method: linear static and dynamic finite element analysis","author":"Hughes JR","unstructured":"Thomas\u00a0JR Hughes. 2012. The finite element method: linear static and dynamic finite element analysis. Courier Corporation."},{"key":"e_1_3_2_2_24_1","volume-title":"Physically Based Sound for Computer Animation and Virtual Environments. In ACM SIGGRAPH 2016 Courses","author":"James L.","year":"2016","unstructured":"Doug\u00a0L. James. 2016. Physically Based Sound for Computer Animation and Virtual Environments. In ACM SIGGRAPH 2016 Courses (Anaheim, California) (SIGGRAPH \u201916). Association for Computing Machinery, New York, NY, USA, Article 22, 8\u00a0pages."},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/1141911.1141983"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413572"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3528223.3530184"},{"key":"e_1_3_2_2_28_1","volume-title":"Can one hear the shape of a drum?The american mathematical monthly 73, 4P2","author":"Kac Mark","year":"1966","unstructured":"Mark Kac. 1966. Can one hear the shape of a drum?The american mathematical monthly 73, 4P2 (1966), 1\u201323."},{"key":"e_1_3_2_2_29_1","unstructured":"Hao Li Yizhi Zhang Junzhe Zhu Shaoxiong Wang Michelle\u00a0A. Lee Huazhe Xu Edward Adelson Li Fei-Fei Ruohan Gao and Jiajun Wu. 2022b. See Hear and Feel: Smart Sensory Fusion for Robotic Manipulation. In CoRL."},{"key":"e_1_3_2_2_30_1","article-title":"DiffCloth: Differentiable Cloth Simulation with Dry Frictional Contact","volume":"42","author":"Li Yifei","year":"2022","unstructured":"Yifei Li, Tao Du, Kui Wu, Jie Xu, and Wojciech Matusik. 2022a. DiffCloth: Differentiable Cloth Simulation with Dry Frictional Contact. ACM Trans. Graph. 42, 1, Article 2 (oct 2022), 20\u00a0pages.","journal-title":"ACM Trans. Graph."},{"key":"e_1_3_2_2_31_1","volume-title":"Advances in Neural Information Processing Systems, H.\u00a0Wallach, H.\u00a0Larochelle, A.\u00a0Beygelzimer, F.\u00a0d'Alch\u00e9-Buc, E.\u00a0Fox, and R.\u00a0Garnett (Eds.). Vol.\u00a032. Curran Associates","author":"Liang Junbang","unstructured":"Junbang Liang, Ming Lin, and Vladlen Koltun. 2019. Differentiable Cloth Simulation for Inverse Problems. In Advances in Neural Information Processing Systems, H.\u00a0Wallach, H.\u00a0Larochelle, A.\u00a0Beygelzimer, F.\u00a0d'Alch\u00e9-Buc, E.\u00a0Fox, and R.\u00a0Garnett (Eds.). Vol.\u00a032. Curran Associates, Inc."},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/3414685.3417853"},{"key":"e_1_3_2_2_33_1","volume-title":"Fluid Control Using the Adjoint Method. 23, 3 (aug","author":"McNamara Antoine","year":"2004","unstructured":"Antoine McNamara, Adrien Treuille, Zoran Popovi\u0107, and Jos Stam. 2004. Fluid Control Using the Adjoint Method. 23, 3 (aug 2004), 449\u2013456."},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/1364901.1364915"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"crossref","unstructured":"Ben Mildenhall Pratul\u00a0P. Srinivasan Matthew Tancik Jonathan\u00a0T. Barron Ravi Ramamoorthi and Ren Ng. 2020. NeRF: Representing Scenes as Neural Radiance Fields for View Synthesis. In ECCV.","DOI":"10.1007\/978-3-030-58452-8_24"},{"key":"e_1_3_2_2_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00810"},{"key":"e_1_3_2_2_37_1","volume-title":"International Conference on Learning Representations.","author":"Murthy Krishna","year":"2021","unstructured":"J.\u00a0Krishna Murthy, Miles Macklin, Florian Golemo, Vikram Voleti, Linda Petrini, Martin Weiss, Breandan Considine, J\u00e9r\u00f4me Parent-L\u00e9vesque, Kevin Xie, Kenny Erleben, Liam Paull, Florian Shkurti, Derek Nowrouzezahrai, and Sanja Fidler. 2021. gradSim: Differentiable simulation for system identification and visuomotor control. In International Conference on Learning Representations."},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/545261.545290"},{"key":"e_1_3_2_2_39_1","unstructured":"Adam Paszke Sam Gross Soumith Chintala Gregory Chanan Edward Yang Zachary DeVito Zeming Lin Alban Desmaison Luca Antiga and Adam Lerer. 2017. Automatic differentiation in PyTorch. (2017)."},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/944020.944025"},{"key":"e_1_3_2_2_41_1","doi-asserted-by":"publisher","DOI":"10.5555\/3524938.3525665"},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/1111411.1111429"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/2421636.2421637"},{"key":"e_1_3_2_2_44_1","volume-title":"Conference on Robot Learning. PMLR, 317\u2013335","author":"Schenck Connor","year":"2018","unstructured":"Connor Schenck and Dieter Fox. 2018. Spnets: Differentiable fluid dynamics for deep neural networks. In Conference on Robot Learning. PMLR, 317\u2013335."},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/3313797"},{"key":"e_1_3_2_2_46_1","first-page":"6087","article-title":"Deep marching tetrahedra: a hybrid representation for high-resolution 3d shape synthesis","volume":"34","author":"Shen Tianchang","year":"2021","unstructured":"Tianchang Shen, Jun Gao, Kangxue Yin, Ming-Yu Liu, and Sanja Fidler. 2021. Deep marching tetrahedra: a hybrid representation for high-resolution 3d shape synthesis. Advances in Neural Information Processing Systems 34 (2021), 6087\u20136101.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.1145\/2343483.2343501"},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2019.2898822"},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2019\/869"},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"publisher","DOI":"10.1145\/882262.882337"},{"key":"e_1_3_2_2_51_1","doi-asserted-by":"publisher","DOI":"10.1145\/383259.383322"},{"key":"e_1_3_2_2_52_1","doi-asserted-by":"publisher","DOI":"10.1162\/105474698565794"},{"key":"e_1_3_2_2_53_1","doi-asserted-by":"publisher","DOI":"10.5555\/1218064.1218067"},{"key":"e_1_3_2_2_54_1","doi-asserted-by":"publisher","DOI":"10.1145\/3550454.3555479"},{"key":"e_1_3_2_2_55_1","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2021.XVII.008"},{"key":"e_1_3_2_2_56_1","doi-asserted-by":"publisher","DOI":"10.5555\/3294771.3294893"},{"key":"e_1_3_2_2_57_1","volume-title":"Toward High-Quality Modal Contact Sound. In ACM SIGGRAPH 2011 Papers","author":"Zheng Changxi","year":"2011","unstructured":"Changxi Zheng and Doug\u00a0L. James. 2011. Toward High-Quality Modal Contact Sound. In ACM SIGGRAPH 2011 Papers (Vancouver, British Columbia, Canada) (SIGGRAPH \u201911). Association for Computing Machinery, New York, NY, USA, Article 38, 12\u00a0pages."},{"key":"e_1_3_2_2_58_1","doi-asserted-by":"crossref","unstructured":"Bofang Zhu. 2018. The finite element method: fundamentals and applications in civil hydraulic mechanical and aeronautical engineering. (2018).","DOI":"10.1002\/9781119107323"}],"event":{"name":"SIGGRAPH '24: Special Interest Group on Computer Graphics and Interactive Techniques Conference","location":"Denver CO USA","acronym":"SIGGRAPH '24","sponsor":["SIGGRAPH ACM Special Interest Group on Computer Graphics and Interactive Techniques"]},"container-title":["Special Interest Group on Computer Graphics and Interactive Techniques Conference Conference Papers"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3641519.3657493","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3641519.3657493","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:05:50Z","timestamp":1750291550000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3641519.3657493"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,13]]},"references-count":58,"alternative-id":["10.1145\/3641519.3657493","10.1145\/3641519"],"URL":"https:\/\/doi.org\/10.1145\/3641519.3657493","relation":{},"subject":[],"published":{"date-parts":[[2024,7,13]]},"assertion":[{"value":"2024-07-13","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}