{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,8]],"date-time":"2026-07-08T14:53:44Z","timestamp":1783522424878,"version":"3.55.0"},"publisher-location":"New York, NY, USA","reference-count":48,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,10,12]],"date-time":"2020-10-12T00:00:00Z","timestamp":1602460800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"National Key Research and Development","award":["2017YFB0203002"],"award-info":[{"award-number":["2017YFB0203002"]}]},{"name":"National Natural Science Foundation of China","award":["61632003"],"award-info":[{"award-number":["61632003"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,10,12]]},"DOI":"10.1145\/3394171.3413572","type":"proceedings-article","created":{"date-parts":[[2020,10,12]],"date-time":"2020-10-12T12:27:35Z","timestamp":1602505655000},"page":"1171-1179","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":17,"title":["Deep-Modal: Real-Time Impact Sound Synthesis for Arbitrary Shapes"],"prefix":"10.1145","author":[{"given":"Xutong","family":"Jin","sequence":"first","affiliation":[{"name":"Peking University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Sheng","family":"Li","sequence":"additional","affiliation":[{"name":"Peking University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Tianshu","family":"Qu","sequence":"additional","affiliation":[{"name":"Peking University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Dinesh","family":"Manocha","sequence":"additional","affiliation":[{"name":"University of Maryland, College Park, MD, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Guoping","family":"Wang","sequence":"additional","affiliation":[{"name":"Peking University, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2020,10,12]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2011.76"},{"key":"e_1_3_2_2_2_1","volume-title":"Combined wave and ray based room acoustic simulations of small rooms","author":"Aretz Marc","unstructured":"Marc Aretz . 2012. Combined wave and ray based room acoustic simulations of small rooms . Vol. 12 . Logos Verlag Berlin GmbH. Marc Aretz. 2012. Combined wave and ray based room acoustic simulations of small rooms. Vol. 12. Logos Verlag Berlin GmbH."},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/1399504.1360623"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/2185520.2185599"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2871219"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3197517.3201357"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054091"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00685"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_2_10_1","volume-title":"Physically Based Sound for Computer Animation and Virtual Environments. ACM SIGGRAPH 2016 Course.","author":"James DL","year":"2016","unstructured":"DL James , TR Langlois , R Mehra , and C Zheng . 2016 . Physically Based Sound for Computer Animation and Virtual Environments. ACM SIGGRAPH 2016 Course. DL James, TR Langlois, R Mehra, and C Zheng. 2016. Physically Based Sound for Computer Animation and Virtual Environments. ACM SIGGRAPH 2016 Course."},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/1141911.1141983"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00526"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"crossref","unstructured":"Ignacio Llamas. 2007. Real-time voxelization of triangle meshes on the GPU. In SIGGRAPH Sketches. 18.  Ignacio Llamas. 2007. Real-time voxelization of triangle meshes on the GPU. In SIGGRAPH Sketches. 18.","DOI":"10.1145\/1278780.1278802"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2015.7353481"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/2451236.2451245"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46484-8_29"},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/545261.545290"},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.264"},{"key":"e_1_3_2_2_21_1","volume-title":"Proceedings of the IEEE conference on computer vision and pattern recognition. 652--660","author":"Qi Charles R","year":"2017","unstructured":"Charles R Qi , Hao Su , Kaichun Mo , and Leonidas J Guibas . 2017 . Pointnet: Deep learning on point sets for 3d classification and segmentation . In Proceedings of the IEEE conference on computer vision and pattern recognition. 652--660 . Charles R Qi, Hao Su, Kaichun Mo, and Leonidas J Guibas. 2017. Pointnet: Deep learning on point sets for 3d classification and segmentation. In Proceedings of the IEEE conference on computer vision and pattern recognition. 652--660."},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.609"},{"key":"e_1_3_2_2_23_1","unstructured":"Charles Ruizhongtai Qi Li Yi Hao Su and Leonidas J Guibas. 2017. Pointnet++: Deep hierarchical feature learning on point sets in a metric space. In Advances in neural information processing systems. 5099--5108.  Charles Ruizhongtai Qi Li Yi Hao Su and Leonidas J Guibas. 2017. Pointnet++: Deep hierarchical feature learning on point sets in a metric space. In Advances in neural information processing systems. 5099--5108."},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/1111411.1111429"},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2009.27"},{"key":"e_1_3_2_2_26_1","first-page":"1","article-title":"Example-guided physically based modal sound synthesis","volume":"32","author":"Ren Zhimin","year":"2013","unstructured":"Zhimin Ren , Hengchin Yeh , and Ming C Lin . 2013 . Example-guided physically based modal sound synthesis . ACM Transactions on Graphics (TOG) 32 , 1 (2013), 1 -- 16 . Zhimin Ren, Hengchin Yeh, and Ming C Lin. 2013. Example-guided physically based modal sound synthesis. ACM Transactions on Graphics (TOG) 32, 1 (2013), 1--16.","journal-title":"ACM Transactions on Graphics (TOG)"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"e_1_3_2_2_28_1","volume-title":"SynCoPation: Interactive synthesis-coupled sound propagation","author":"Rungta Atul","year":"2016","unstructured":"Atul Rungta , Carl Schissler , Ravish Mehra , Chris Malloy , Ming Lin , and Dinesh Manocha . 2016. SynCoPation: Interactive synthesis-coupled sound propagation . IEEE transactions on visualization and computer graphics 22, 4 ( 2016 ), 1346--1355. Atul Rungta, Carl Schissler, Ravish Mehra, Chris Malloy, Ming Lin, and Dinesh Manocha. 2016. SynCoPation: Interactive synthesis-coupled sound propagation. IEEE transactions on visualization and computer graphics 22, 4 (2016), 1346--1355."},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461368"},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/2856400.2856419"},{"key":"e_1_3_2_2_31_1","volume-title":"Audio-material reconstruction for virtualized reality using a probabilistic damping model","author":"Sterling Auston","year":"2019","unstructured":"Auston Sterling , Nicholas Rewkowski , Roberta L Klatzky , and Ming C Lin . 2019. Audio-material reconstruction for virtualized reality using a probabilistic damping model . IEEE transactions on visualization and computer graphics 25, 5 ( 2019 ), 1855--1864. Auston Sterling, Nicholas Rewkowski, Roberta L Klatzky, and Ming C Lin. 2019. Audio-material reconstruction for virtualized reality using a probabilistic damping model. IEEE transactions on visualization and computer graphics 25, 5 (2019), 1855--1864."},{"key":"e_1_3_2_2_32_1","volume-title":"Lin","author":"Sterling Auston","year":"2018","unstructured":"Auston Sterling , Justin Wilson , Sam Lowe , and Ming C . Lin . 2018 . ISNN : Impact Sound Neural Network for Audio-Visual Object Classification. In Computer Vision -- ECCV 2018, Vittorio Ferrari, Martial Hebert, Cristian Sminchisescu, and Yair Weiss (Eds.). Springer International Publishing , Cham, 578--595. Auston Sterling, Justin Wilson, Sam Lowe, and Ming C. Lin. 2018. ISNN: Impact Sound Neural Network for Audio-Visual Object Classification. In Computer Vision -- ECCV 2018, Vittorio Ferrari, Martial Hebert, Cristian Sminchisescu, and Yair Weiss (Eds.). Springer International Publishing, Cham, 578--595."},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.114"},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2020.2973058"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1111"},{"key":"e_1_3_2_2_36_1","volume-title":"Synthesis of shape dependent sounds with physical modeling","author":"van de Doel Kees","unstructured":"Kees van de Doel and Dinesh K Pai . 1996. Synthesis of shape dependent sounds with physical modeling . Georgia Institute of Technology . Kees van de Doel and Dinesh K Pai. 1996. Synthesis of shape dependent sounds with physical modeling. Georgia Institute of Technology."},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/383259.383322"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1162\/105474698565794"},{"key":"e_1_3_2_2_39_1","volume-title":"WaveNet: A Generative Model for Raw Audio. In 9th ISCA Speech Synthesis Workshop. 125--125","author":"van den Oord A\u00e4ron","unstructured":"A\u00e4ron van den Oord , Sander Dieleman , Heiga Zen , Karen Simonyan , Oriol Vinyals , Alex Graves , Nal Kalchbrenner , Andrew Senior , and Koray Kavukcuoglu . [n.d.]. WaveNet: A Generative Model for Raw Audio. In 9th ISCA Speech Synthesis Workshop. 125--125 . A\u00e4ron van den Oord, Sander Dieleman, Heiga Zen, Karen Simonyan, Oriol Vinyals, Alex Graves, Nal Kalchbrenner, Andrew Senior, and Koray Kavukcuoglu. [n.d.]. WaveNet: A Generative Model for Raw Audio. In 9th ISCA Speech Synthesis Workshop. 125--125."},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/3306346.3322976"},{"key":"e_1_3_2_2_41_1","doi-asserted-by":"publisher","DOI":"10.1145\/3197517.3201318"},{"key":"e_1_3_2_2_42_1","first-page":"4006","article-title":"Tacotron","volume":"2017","author":"Skerry-Ryan R.J.","year":"2017","unstructured":"YuxuanWang, R.J. Skerry-Ryan , Daisy Stanton , YonghuiWu, RonWeiss, Navdeep Jaitly , Zongheng Yang , Ying Xiao , Zhifeng Chen , Samy Bengio , Quoc Le , Yannis Agiomyrgiannakis , Rob Clark , and Rif Saurous . 2017 . Tacotron : Towards End-to- End Speech Synthesis. In Proc. Interspeech 2017. 4006 -- 4010 . YuxuanWang, R.J. Skerry-Ryan, Daisy Stanton, YonghuiWu, RonWeiss, Navdeep Jaitly, Zongheng Yang, Ying Xiao, Zhifeng Chen, Samy Bengio, Quoc Le, Yannis Agiomyrgiannakis, Rob Clark, and Rif Saurous. 2017. Tacotron: Towards End-to- End Speech Synthesis. In Proc. Interspeech 2017. 4006--4010.","journal-title":"Towards End-to- End Speech Synthesis. In Proc. Interspeech"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3326362","article-title":"Dynamic graph cnn for learning on point clouds","volume":"38","author":"Wang Yue","year":"2019","unstructured":"Yue Wang , Yongbin Sun , Ziwei Liu , Sanjay E Sarma , Michael M Bronstein , and Justin M Solomon . 2019 . Dynamic graph cnn for learning on point clouds . ACM Transactions On Graphics (TOG) 38 , 5 (2019), 1 -- 12 . Yue Wang, Yongbin Sun, Ziwei Liu, Sanjay E Sarma, Michael M Bronstein, and Justin M Solomon. 2019. Dynamic graph cnn for learning on point clouds. ACM Transactions On Graphics (TOG) 38, 5 (2019), 1--12.","journal-title":"ACM Transactions On Graphics (TOG)"},{"key":"e_1_3_2_2_44_1","volume-title":"Proceedings of the IEEE conference on computer vision and pattern recognition. 1912--1920","author":"Wu Zhirong","year":"2015","unstructured":"Zhirong Wu , Shuran Song , Aditya Khosla , Fisher Yu , Linguang Zhang , Xiaoou Tang , and Jianxiong Xiao . 2015 . 3D shapenets: A deep representation for volumetric shapes . In Proceedings of the IEEE conference on computer vision and pattern recognition. 1912--1920 . Zhirong Wu, Shuran Song, Aditya Khosla, Fisher Yu, Linguang Zhang, Xiaoou Tang, and Jianxiong Xiao. 2015. 3D shapenets: A deep representation for volumetric shapes. In Proceedings of the IEEE conference on computer vision and pattern recognition. 1912--1920."},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01231-1_29"},{"key":"e_1_3_2_2_46_1","doi-asserted-by":"publisher","DOI":"10.1007\/11558651_32"},{"key":"e_1_3_2_2_47_1","unstructured":"Zhoutong Zhang Qiujia Li Zhengjia Huang JiajunWu Josh Tenenbaum and Bill Freeman. 2017. Shape and material from sound. In Advances in Neural Information Processing Systems. 1278--1288.  Zhoutong Zhang Qiujia Li Zhengjia Huang JiajunWu Josh Tenenbaum and Bill Freeman. 2017. Shape and material from sound. In Advances in Neural Information Processing Systems. 1278--1288."},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1145\/1833349.1778806"},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/1964921.1964933"}],"event":{"name":"MM '20: The 28th ACM International Conference on Multimedia","location":"Seattle WA USA","acronym":"MM '20","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 28th ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3394171.3413572","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3394171.3413572","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:47:14Z","timestamp":1750193234000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3394171.3413572"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,10,12]]},"references-count":48,"alternative-id":["10.1145\/3394171.3413572","10.1145\/3394171"],"URL":"https:\/\/doi.org\/10.1145\/3394171.3413572","relation":{},"subject":[],"published":{"date-parts":[[2020,10,12]]},"assertion":[{"value":"2020-10-12","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}