{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,21]],"date-time":"2026-05-21T14:53:13Z","timestamp":1779375193486,"version":"3.53.1"},"reference-count":28,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,5,23]],"date-time":"2022-05-23T00:00:00Z","timestamp":1653264000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,5,23]],"date-time":"2022-05-23T00:00:00Z","timestamp":1653264000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,5,23]]},"DOI":"10.1109\/icassp43922.2022.9746754","type":"proceedings-article","created":{"date-parts":[[2022,4,27]],"date-time":"2022-04-27T19:50:34Z","timestamp":1651089034000},"page":"8872-8876","source":"Crossref","is-referenced-by-count":13,"title":["Spatial Data Augmentation with Simulated Room Impulse Responses for Sound Event Localization and Detection"],"prefix":"10.1109","author":[{"given":"Yuichiro","family":"Koyama","sequence":"first","affiliation":[{"name":"Sony Group Corporation,Tokyo,Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kazuhide","family":"Shigemi","sequence":"additional","affiliation":[{"name":"The University of Tokyo,Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Masafumi","family":"Takahashi","sequence":"additional","affiliation":[{"name":"Sony Group Corporation,Tokyo,Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kazuki","family":"Shimada","sequence":"additional","affiliation":[{"name":"Sony Group Corporation,Tokyo,Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Naoya","family":"Takahashi","sequence":"additional","affiliation":[{"name":"Sony Group Corporation,Tokyo,Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Emiru","family":"Tsunoo","sequence":"additional","affiliation":[{"name":"Sony Group Corporation,Tokyo,Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Shusuke","family":"Takahashi","sequence":"additional","affiliation":[{"name":"Sony Group Corporation,Tokyo,Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yuki","family":"Mitsufuji","sequence":"additional","affiliation":[{"name":"Sony Group Corporation,Tokyo,Japan"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.33682\/3qgs-e216"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8461310"},{"key":"ref12","first-page":"20","article-title":"3D sound field recording with higher order Ambisonics&#x2013;objective measurements and validation of a 4th order spherical microphone","author":"moreau","year":"2006","journal-title":"Audio Engineering Society Convention"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2017.8170028"},{"key":"ref14","first-page":"993","article-title":"Densely connected multi-dilated convolutional networks for dense prediction tasks","author":"takahashi","year":"2021","journal-title":"Proc of IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)"},{"key":"ref15","article-title":"Ensemble of ACCDOA-and EINV2-based Systems with D3Nets and Impulse Response Simulation for Sound Event Localization and Detection","author":"shimada","year":"2021"},{"key":"ref16","doi-asserted-by":"crossref","DOI":"10.21437\/Interspeech.2016-805","article-title":"Deep convolutional neural networks and data augmentation for acoustic event detection","author":"takahashi","year":"2016","journal-title":"Proc of Interspeech"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2751969"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-2680"},{"key":"ref19","first-page":"5210","article-title":"Robust MVDR beamforming using time-frequency masks for on-line\/offline ASR in noise","author":"higuchi","year":"2016","journal-title":"Proc of IEEE ICASSP"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2019.8937220"},{"key":"ref4","first-page":"71","article-title":"A sequence matching network for polyphonic sound event localization and detection","author":"nguyen","year":"2020","journal-title":"Proc of IEEE ICASSP"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003750"},{"key":"ref3","article-title":"A dataset of reverberant spatial sound scenes with moving sources for sound event localization and detection","author":"politis","year":"2020"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9413473"},{"key":"ref5","article-title":"A dataset of dynamic reverberant sound scenes with directional interferers for sound event localization and detection","author":"politis","year":"2021"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9413609"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414602"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.33682\/4jhy-bj81"},{"key":"ref9","article-title":"A four-stage data augmentation approach to ResNet-Conformer based acoustic modeling for sound event localization and detection","author":"wang","year":"2021"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2018.2885636"},{"key":"ref20","article-title":"Microphone array processing for parametric spatial audio techniques","author":"politis","year":"2016","journal-title":"PhD thesis"},{"key":"ref22","author":"williams","year":"1999","journal-title":"Fourier Acoustics Sound Radiation and Nearfield Acoustical Holography"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2020.3045528"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2009.2025790"},{"key":"ref23","article-title":"The NIGENS general sound events database","author":"trowitzsch","year":"2019"},{"key":"ref26","article-title":"Accurate, large minibatch sgd: Training imagenet in 1 hour","author":"goyal","year":"2017"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-2441"}],"event":{"name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Singapore, Singapore","start":{"date-parts":[[2022,5,23]]},"end":{"date-parts":[[2022,5,27]]}},"container-title":["ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9745891\/9746004\/09746754.pdf?arnumber=9746754","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,23]],"date-time":"2024-09-23T03:21:01Z","timestamp":1727061661000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9746754\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,5,23]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/icassp43922.2022.9746754","relation":{},"subject":[],"published":{"date-parts":[[2022,5,23]]}}}