{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T10:29:15Z","timestamp":1763202555094,"version":"3.28.0"},"reference-count":28,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,10,17]],"date-time":"2021-10-17T00:00:00Z","timestamp":1634428800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,10,17]],"date-time":"2021-10-17T00:00:00Z","timestamp":1634428800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,10,17]]},"DOI":"10.1109\/waspaa52581.2021.9632737","type":"proceedings-article","created":{"date-parts":[[2021,12,13]],"date-time":"2021-12-13T16:12:28Z","timestamp":1639411948000},"page":"336-340","source":"Crossref","is-referenced-by-count":9,"title":["Saladnet: Self-Attentive Multisource Localization in the Ambisonics Domain"],"prefix":"10.1109","author":[{"given":"Pierre-Amaury","family":"Grumiaux","sequence":"first","affiliation":[{"name":"Orange Labs.,Cesson-S&#x00E9;vign&#x00E9;,France"}]},{"given":"Srdan","family":"Kitic","sequence":"additional","affiliation":[{"name":"Orange Labs.,Cesson-S&#x00E9;vign&#x00E9;,France"}]},{"given":"Prerak","family":"Srivastava","sequence":"additional","affiliation":[{"name":"Univ. de Lorraine, Inria,Nancy,France"}]},{"given":"Laurent","family":"Girin","sequence":"additional","affiliation":[{"name":"Univ. Grenoble Alpes, GIPSA-lab, Grenoble-INP, CNRS,Grenoble,France"}]},{"given":"Alexandre","family":"Guerin","sequence":"additional","affiliation":[{"name":"Orange Labs.,Cesson-S&#x00E9;vign&#x00E9;,France"}]}],"member":"263","reference":[{"doi-asserted-by":"publisher","key":"ref10","DOI":"10.3390\/s18103418"},{"doi-asserted-by":"publisher","key":"ref11","DOI":"10.1109\/TAP.2018.2874430"},{"doi-asserted-by":"publisher","key":"ref12","DOI":"10.23919\/Eusipco47968.2020.9287224"},{"doi-asserted-by":"publisher","key":"ref13","DOI":"10.20965\/jrm.2017.p0037"},{"doi-asserted-by":"publisher","key":"ref14","DOI":"10.21437\/Interspeech.2020-2759"},{"year":"2019","author":"cao","journal-title":"Two-stage sound event localization and detection using intensity vector and generalized cross-correlation","key":"ref15"},{"year":"2021","author":"subramanian","journal-title":"Deep Learning based Multi-Source Localization with Source Splitting and its Effectiveness in Multi-Talker Speech Recognition","key":"ref16"},{"doi-asserted-by":"publisher","key":"ref17","DOI":"10.23919\/Eusipco47968.2020.9287344"},{"doi-asserted-by":"publisher","key":"ref18","DOI":"10.23919\/EUSIPCO54536.2021.9616124"},{"year":"2016","author":"bahdanau","journal-title":"Neural machine translation by jointly learning to align and translate","key":"ref19"},{"key":"ref28","article-title":"TRAMP: TRacking by a realtime AMbisonic-based Particle filter","author":"kitic","year":"0","journal-title":"LOCATA Challenge Workshop"},{"doi-asserted-by":"publisher","key":"ref4","DOI":"10.1109\/TAP.1986.1143830"},{"key":"ref27","article-title":"Incorporating Nesterov Momentum into Adam","author":"dozat","year":"0","journal-title":"ICLR 2016"},{"doi-asserted-by":"publisher","key":"ref3","DOI":"10.1109\/IROS.2016.7759437"},{"doi-asserted-by":"publisher","key":"ref6","DOI":"10.1109\/TASL.2007.906694"},{"doi-asserted-by":"publisher","key":"ref5","DOI":"10.1109\/TASSP.1976.1162830"},{"year":"2018","author":"adavanne","journal-title":"Direction of arrival estimation for multiple sound sources using convolutional recurrent neural network","key":"ref8"},{"doi-asserted-by":"publisher","key":"ref7","DOI":"10.1109\/MLSP.2016.7738817"},{"doi-asserted-by":"publisher","key":"ref2","DOI":"10.1109\/LSP.2016.2583658"},{"doi-asserted-by":"publisher","key":"ref9","DOI":"10.1109\/JSTSP.2019.2900164"},{"doi-asserted-by":"publisher","key":"ref1","DOI":"10.23919\/EUSIPCO.2019.8903121"},{"year":"2020","author":"phan","journal-title":"Audio Event Detection and Localization with Multitask Regression Network","key":"ref20"},{"key":"ref22","volume":"9","author":"jarrett","year":"2017","journal-title":"Theory and Applications of Spherical Microphone Array Processing ser Springer Topics in Signal Processing"},{"year":"2017","author":"vaswani","journal-title":"Attention is all you need","key":"ref21"},{"year":"2006","author":"habets","journal-title":"Room impulse response generator","key":"ref24"},{"doi-asserted-by":"publisher","key":"ref23","DOI":"10.1109\/ICASSP40776.2020.9054561"},{"year":"1993","author":"garofolo","journal-title":"TIMIT Acoustic-Phonetic Continuous Speech Corpus","key":"ref26"},{"doi-asserted-by":"publisher","key":"ref25","DOI":"10.1121\/1.382599"}],"event":{"name":"2021 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","start":{"date-parts":[[2021,10,17]]},"location":"New Paltz, NY, USA","end":{"date-parts":[[2021,10,20]]}},"container-title":["2021 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9632687\/9632666\/09632737.pdf?arnumber=9632737","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,2]],"date-time":"2022-08-02T19:57:42Z","timestamp":1659470262000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9632737\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,10,17]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/waspaa52581.2021.9632737","relation":{},"subject":[],"published":{"date-parts":[[2021,10,17]]}}}