{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,5]],"date-time":"2026-06-05T05:07:26Z","timestamp":1780636046088,"version":"3.54.1"},"reference-count":93,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,12,4]],"date-time":"2025-12-04T00:00:00Z","timestamp":1764806400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,1,12]],"date-time":"2026-01-12T00:00:00Z","timestamp":1768176000000},"content-version":"vor","delay-in-days":39,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"Repertorium","award":["1010950"],"award-info":[{"award-number":["1010950"]}]},{"name":"RESTART MUSA","award":["43C22003080001"],"award-info":[{"award-number":["43C22003080001"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J AUDIO SPEECH MUSIC PROC."],"DOI":"10.1186\/s13636-025-00437-y","type":"journal-article","created":{"date-parts":[[2025,12,4]],"date-time":"2025-12-04T04:03:59Z","timestamp":1764821039000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Parametric virtual microphone techniques for sound field reconstruction with early reflection modeling"],"prefix":"10.1186","volume":"2026","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-5094-4701","authenticated-orcid":false,"given":"Gioele","family":"Greco","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mirco","family":"Pezzoli","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Fabio","family":"Antonacci","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Augusto","family":"Sarti","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,12,4]]},"reference":[{"key":"437_CR1","doi-asserted-by":"publisher","unstructured":"J. Yang, M. Wu, L. Han, A review of sound field control. Appl. Sci. 12(14), (2022). https:\/\/doi.org\/10.3390\/app12147319","DOI":"10.3390\/app12147319"},{"issue":"9","key":"437_CR2","doi-asserted-by":"publisher","first-page":"1578","DOI":"10.1109\/JPROC.2021.3075390","volume":"109","author":"SR Quackenbush","year":"2021","unstructured":"S.R. Quackenbush, J. Herre, Mpeg standards for compressed representation of immersive audio. Proc. IEEE 109(9), 1578\u20131589 (2021). https:\/\/doi.org\/10.1109\/JPROC.2021.3075390","journal-title":"Proc. IEEE"},{"issue":"8","key":"437_CR3","doi-asserted-by":"publisher","first-page":"605","DOI":"10.1002\/jsid.2001","volume":"32","author":"AK Bhowmik","year":"2024","unstructured":"A.K. Bhowmik, Virtual and augmented reality: Human sensory-perceptual requirements and trends for immersive spatial computing experiences. J. Soc. Inf. Disp. 32(8), 605\u2013646 (2024). https:\/\/doi.org\/10.1002\/jsid.2001","journal-title":"J. Soc. Inf. Disp."},{"key":"437_CR4","unstructured":"J.G. Tylka, E.Y. Choueiri, in Audio Engineering Society Convention. Comparison of techniques for binaural navigation of higher-order ambisonic soundfields, (Audio Engineering Society, New York, NY, 2015) Paper 9421; Available from: https:\/\/aes2.org\/publications\/elibrary-page\/?id=17977"},{"issue":"7","key":"437_CR5","doi-asserted-by":"publisher","first-page":"3609","DOI":"10.1109\/TVCG.2023.3238662","volume":"30","author":"L Pisha","year":"2024","unstructured":"L. Pisha, S. Yadegari, Specular path generation and near-reflective diffraction in interactive acoustical simulations. IEEE Trans. Vis. Comput. Graph. 30(7), 3609\u20133621 (2024). https:\/\/doi.org\/10.1109\/TVCG.2023.3238662","journal-title":"IEEE Trans. Vis. Comput. Graph."},{"key":"437_CR6","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1109\/MSP.2017.2666081","volume":"34","author":"H Hac\u0131habibo\u011flu","year":"2017","unstructured":"H. Hac\u0131habibo\u011flu, E.D. Sena, Z. Cvetkovi\u0107, J.D. Johnston, J.O. Smith, Perceptual spatial audio recording, simulation, and rendering: An overview of spatial-audio techniques based on psychoacoustics. IEEE Signal Process. Mag. 34, 36\u201354 (2017). https:\/\/doi.org\/10.1109\/MSP.2017.2666081","journal-title":"IEEE Signal Process. Mag."},{"key":"437_CR7","doi-asserted-by":"publisher","first-page":"1023","DOI":"10.1109\/TASLPRO.2025.3536841","volume":"33","author":"T Sprunck","year":"2025","unstructured":"T. Sprunck, A. Deleforge, Y. Privat, C. Foy, Fully reversing the shoebox image source method: From impulse responses to room parameters. IEEE Trans. Audio Speech Lang. Process. 33, 1023\u20131033 (2025). https:\/\/doi.org\/10.1109\/TASLPRO.2025.3536841","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"437_CR8","doi-asserted-by":"publisher","first-page":"2667","DOI":"10.1109\/TASLP.2024.3398999","volume":"32","author":"S Damiano","year":"2024","unstructured":"S. Damiano, F. Borra, A. Bernardini, F. Antonacci, A. Sarti, A compressive sensing approach for the reconstruction of the soundfield produced by directive sources in reverberant rooms. IEEE\/ACM Trans. Audio Speech Lang. Process. 32, 2667\u20132679 (2024). https:\/\/doi.org\/10.1109\/TASLP.2024.3398999","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"437_CR9","doi-asserted-by":"publisher","unstructured":"A. Politis, L. Pajunen, J. Lepp\u00e4nen, S. Mate, A. Eronen, in 2023 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA). Wide-area 6dof rendering of multi-point ambisonic recordings based on interpolation of spatial parameters (2023), pp. 1\u20135. https:\/\/doi.org\/10.1109\/WASPAA58266.2023.10248142","DOI":"10.1109\/WASPAA58266.2023.10248142"},{"issue":"6","key":"437_CR10","first-page":"503","volume":"55","author":"V Pulkki","year":"2007","unstructured":"V. Pulkki, Spatial sound reproduction with directional audio coding. J. Audio Eng. Soc. 55(6), 503\u2013516 (2007)","journal-title":"J. Audio Eng. Soc."},{"issue":"9","key":"437_CR11","first-page":"709","volume":"57","author":"J Vilkamo","year":"2009","unstructured":"J. Vilkamo, T. Lokki, V. Pulkki, Directional audio coding: Virtual microphone-based synthesis and subjective evaluation. J. Audio Eng. Soc. 57(9), 709\u2013724 (2009)","journal-title":"J. Audio Eng. Soc."},{"key":"437_CR12","unstructured":"R. Schultz-Amling, F. Kuech, O. Thiergart, M. Kallinger, in Audio Engineering Society Convention. Acoustical zooming based on a parametric sound field representation, vol. 128 (Audio Engineering Society, New York, NY, 2010)"},{"key":"437_CR13","unstructured":"S. Berge, N. Barrett, in 2nd International Symposium on Ambisonics and Spherical Acoustics. High angular resolution planewave expansion (Proc. of the 2nd International Symposium on Ambisonics and Spherical Acoustics, Paris, France, 2010), pp. 6\u20137"},{"key":"437_CR14","doi-asserted-by":"crossref","unstructured":"G. Del\u00a0Galdo, O. Thiergart, T. Weller, E.A.P. Habets, in Hands-Free Speech Communication and Microphone Arrays (HSCMA). Generating virtual microphone signals using geometrical information gathered by distributed arrays (IEEE, Edinburgh, 2011), pp. 185\u2013190","DOI":"10.1109\/HSCMA.2011.5942394"},{"issue":"12","key":"437_CR15","doi-asserted-by":"publisher","first-page":"2583","DOI":"10.1109\/TASL.2013.2280210","volume":"21","author":"O Thiergart","year":"2013","unstructured":"O. Thiergart, G. Del Galdo, M. Taseska, E.A.P. Habets, Geometry-based spatial sound acquisition using distributed microphone arrays. IEEE Trans. Audio Speech Lang. Process. 21(12), 2583\u20132594 (2013)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"issue":"2","key":"437_CR16","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1109\/MSP.2014.2369531","volume":"32","author":"K Kowalczyk","year":"2015","unstructured":"K. Kowalczyk, O. Thiergart, M. Taseska, G. Del Galdo, V. Pulkki, E.A.P. Habets, Parametric spatial sound processing: A flexible and efficient solution to sound scene acquisition, modification, and reproduction. IEEE Signal Process. Mag. 32(2), 31\u201342 (2015)","journal-title":"IEEE Signal Process. Mag."},{"key":"437_CR17","unstructured":"A. Plinge, S.J. Schlecht, O. Thiergart, T. Robotham, O. Rummukainen, E.A.P. Habets, in Audio Engineering Society Conference: International Conference on Audio for Virtual and Augmented Reality. Six-degrees-of-freedom binaural audio reproduction of first-order ambisonics with distance information (Audio Engineering Society, Redmond, WA, USA, 2018), p. 11"},{"key":"437_CR18","doi-asserted-by":"crossref","unstructured":"M. Pezzoli, F. Borra, F. Antonacci, A. Sarti, S. Tubaro, in International Conference on Acoustics, Speech and Signal Processing, (ICASSP). Estimation of the sound field at arbitrary positions in distributed microphone networks based on distributed ray space transform (IEEE, Piscataway, NJ, 2018), pp. 186\u2013190.","DOI":"10.1109\/ICASSP.2018.8462634"},{"key":"437_CR19","doi-asserted-by":"crossref","unstructured":"M. Pezzoli, F. Borra, F. Antonacci, A. Sarti, S. Tubaro, in 26th European Signal Processing Conference (EUSIPCO). Reconstruction of the virtual microphone signal based on the distributed ray space transform (IEEE, Piscataway, NJ, 2018), pp. 1537\u20131541.","DOI":"10.23919\/EUSIPCO.2018.8553548"},{"key":"437_CR20","unstructured":"P. Samarasinghe, T.D. Abhayapala, M.A. Poletti, in International Workshop on Acoustic Signal Enhancement (IWAENC). 3D spatial soundfield recording over large regions (Institute of Electrical and Electronics Engineers Inc., Aachen, Germany, 2012), pp. 1\u20134"},{"issue":"3","key":"437_CR21","doi-asserted-by":"publisher","first-page":"647","DOI":"10.1109\/TASLP.2014.2300341","volume":"22","author":"P Samarasinghe","year":"2014","unstructured":"P. Samarasinghe, T.D. Abhayapala, M.A. Poletti, Wavefield analysis over large areas using distributed higher order microphones. IEEE\/ACM Trans. Audio Speech Lang. Process. 22(3), 647\u2013658 (2014)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"437_CR22","doi-asserted-by":"publisher","unstructured":"J.G. Tylka, E.Y. Choueiri, in Audio Engineering Society Conference: International Conference on Audio for Virtual and Augmented Reality. Soundfield navigation using an array of higher-order ambisonics microphones (Audio Engineering Society, 2016), p. 10. https:\/\/doi.org\/10.17743\/aesconf.2016.978-1-942220-10-7","DOI":"10.17743\/aesconf.2016.978-1-942220-10-7"},{"issue":"1","key":"437_CR23","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1109\/LSP.2017.2774351","volume":"25","author":"N Ueno","year":"2018","unstructured":"N. Ueno, S. Koyama, H. Saruwatari, Sound field recording using distributed microphones based on harmonic analysis of infinite order. IEEE Signal Process. Lett. 25(1), 135\u2013139 (2018). https:\/\/doi.org\/10.1109\/LSP.2017.2774351","journal-title":"IEEE Signal Process. Lett."},{"key":"437_CR24","doi-asserted-by":"publisher","unstructured":"Y. Takida, S. Koyama, H. Saruwataril, in 26th European Signal Processing Conference, (EUSIPCO). Exterior and interior sound field separation using convex optimization: Comparison of signal models (IEEE , 2018), pp. 2549\u20132553. https:\/\/doi.org\/10.23919\/EUSIPCO.2018.8553535","DOI":"10.23919\/EUSIPCO.2018.8553535"},{"issue":"1","key":"437_CR25","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1109\/JSTSP.2019.2901127","volume":"13","author":"S Koyama","year":"2019","unstructured":"S. Koyama, L. Daudet, Sparse representation of a spatial sound field in a reverberant environment. IEEE J. Sel. Top. Signal Process. 13(1), 172\u2013184 (2019)","journal-title":"IEEE J. Sel. Top. Signal Process."},{"key":"437_CR26","doi-asserted-by":"crossref","unstructured":"F. Borra, I.D. Gebru, D. Markovi\u0107, in International Conference on Acoustics, Speech and Signal Processing, (ICASSP). Soundfield reconstruction in reverberant environments using higher-order microphones and impulse response measurements (IEEE, Piscataway, NJ, 2019), pp. 281\u2013285.","DOI":"10.1109\/ICASSP.2019.8682961"},{"key":"437_CR27","doi-asserted-by":"crossref","unstructured":"F. Borra, I.D. Gebru, D. Markovi\u0107, in Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA). 1st-order microphone array system for large area sound field recording and reconstruction: Discussion and preliminary results (IEEE, 2019), p. 5","DOI":"10.1109\/WASPAA.2019.8937281"},{"key":"437_CR28","doi-asserted-by":"publisher","unstructured":"S. Damiano, F. Miotello, M. Pezzoli, A. Bernardini, F. Antonacci, A. Sarti, T. Van Waterschoot, in ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). A zero-shot physics-informed dictionary learning approach for sound field reconstruction (IEEE, Piscataway, NJ, 2025), pp. 1\u20135. https:\/\/doi.org\/10.1109\/ICASSP49660.2025.10888108","DOI":"10.1109\/ICASSP49660.2025.10888108"},{"issue":"6","key":"437_CR29","doi-asserted-by":"publisher","first-page":"1711","DOI":"10.1109\/TASL.2010.2097249","volume":"19","author":"YJ Wu","year":"2011","unstructured":"Y.J. Wu, T.D. Abhayapala, Spatial multizone soundfield reproduction: Theory and design. Trans. Audio Speech Lang. Proc. 19(6), 1711\u20131720 (2011). https:\/\/doi.org\/10.1109\/TASL.2010.2097249","journal-title":"Trans. Audio Speech Lang. Proc."},{"issue":"4","key":"437_CR30","doi-asserted-by":"publisher","first-page":"2100","DOI":"10.1121\/1.1863032","volume":"117","author":"T Betlehem","year":"2005","unstructured":"T. Betlehem, T.D. Abhayapala, Theory and design of sound field reproduction in reverberant rooms. J. Acoust. Soc. Am. 117(4), 2100\u20132111 (2005). https:\/\/doi.org\/10.1121\/1.1863032","journal-title":"J. Acoust. Soc. Am."},{"key":"437_CR31","doi-asserted-by":"publisher","unstructured":"W. Zhang, P.N. Samarasinghe, H. Chen, T.D. Abhayapala, Surround by sound: A review of spatial audio recording and reproduction. Appl. Sci. 7(5) (2017). https:\/\/doi.org\/10.3390\/app7050532","DOI":"10.3390\/app7050532"},{"key":"437_CR32","doi-asserted-by":"publisher","unstructured":"D.N. Zotkin, R. Duraiswami, N.A. Gumerov, in 2009 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics. Regularized hrtf fitting using spherical harmonics (2009), pp. 257\u2013260. https:\/\/doi.org\/10.1109\/ASPAA.2009.5346521","DOI":"10.1109\/ASPAA.2009.5346521"},{"key":"437_CR33","doi-asserted-by":"publisher","first-page":"78214","DOI":"10.1109\/ACCESS.2019.2921388","volume":"7","author":"H Liu","year":"2019","unstructured":"H. Liu, Y. Fang, Q. Huang, Efficient representation of head-related transfer functions with combination of spherical harmonics and spherical wavelets. IEEE Access 7, 78214\u201378222 (2019). https:\/\/doi.org\/10.1109\/ACCESS.2019.2921388","journal-title":"IEEE Access"},{"issue":"2","key":"437_CR34","doi-asserted-by":"publisher","first-page":"649","DOI":"10.1121\/10.0001687","volume":"148","author":"F Llu\u00eds","year":"2020","unstructured":"F. Llu\u00eds, P. Mart\u00ednez-Nuevo, M. Bo M\u00f8ller, S. Ewan Shepstone, Sound field reconstruction in rooms: Inpainting meets super-resolution. J. Acoust. Soc. Am. 148(2), 649\u2013659 (2020). https:\/\/doi.org\/10.1121\/10.0001687","journal-title":"J. Acoust. Soc. Am."},{"key":"437_CR35","doi-asserted-by":"publisher","unstructured":"S. Damiano, F. Borra, A. Bernardini, F. Antonacci, A. Sarti, in 2021 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA). Soundfield reconstruction in reverberant rooms based on compressive sensing and image-source models of early reflections (2021), pp. 366\u2013370. https:\/\/doi.org\/10.1109\/WASPAA52581.2021.9632746","DOI":"10.1109\/WASPAA52581.2021.9632746"},{"key":"437_CR36","doi-asserted-by":"crossref","unstructured":"S. Koyama, H. Saruwatari, in International Conference on Acoustics, Speech and Signal Processing (ICASSP). Sound field decomposition in reverberant environment using sparse and low-rank signal models (IEEE, Piscataway, NJ, 2016)","DOI":"10.1109\/ICASSP.2016.7471704"},{"key":"437_CR37","doi-asserted-by":"publisher","unstructured":"M. Pezzoli, M. Cobos, F. Antonacci, A. Sarti, in ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). Sparsity-based sound field separation in the spherical harmonics domain (2022), pp. 1051\u20131055. https:\/\/doi.org\/10.1109\/ICASSP43922.2022.9746391","DOI":"10.1109\/ICASSP43922.2022.9746391"},{"key":"437_CR38","doi-asserted-by":"publisher","first-page":"4369","DOI":"10.1109\/TASLP.2024.3467951","volume":"32","author":"JGC Ribeiro","year":"2024","unstructured":"J.G.C. Ribeiro, S. Koyama, R. Horiuchi, H. Saruwatari, Sound field estimation based on physics-constrained kernel interpolation adapted to environment. IEEE\/ACM Trans. Audio Speech Lang. Process. 32, 4369\u20134383 (2024). https:\/\/doi.org\/10.1109\/TASLP.2024.3467951","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"issue":"1","key":"437_CR39","doi-asserted-by":"publisher","first-page":"180","DOI":"10.1121\/10.0034833","volume":"157","author":"A Figueroa-Duran","year":"2025","unstructured":"A. Figueroa-Duran, E. Fernandez-Grande, Reconstruction of reverberant sound fields over large spatial domains. J. Acoust. Soc. Am. 157(1), 180\u2013190 (2025). https:\/\/doi.org\/10.1121\/10.0034833","journal-title":"J. Acoust. Soc. Am."},{"key":"437_CR40","doi-asserted-by":"publisher","unstructured":"F. Ronchini, L. Comanducci, M. Pezzoli, F. Antonacci, A. Sarti, in 2024 32nd European Signal Processing Conference (EUSIPCO). Room transfer function reconstruction using complex-valued neural networks and irregularly distributed microphones (2024), pp. 441\u2013445. https:\/\/doi.org\/10.23919\/EUSIPCO63174.2024.10715145","DOI":"10.23919\/EUSIPCO63174.2024.10715145"},{"key":"437_CR41","doi-asserted-by":"publisher","unstructured":"F. Miotello, L. Comanducci, M. Pezzoli, A. Bernardini, F. Antonacci, A. Sarti, in ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). Reconstruction of sound field through diffusion models (2024), pp. 1476\u20131480. https:\/\/doi.org\/10.1109\/ICASSP48485.2024.10446761","DOI":"10.1109\/ICASSP48485.2024.10446761"},{"key":"437_CR42","doi-asserted-by":"publisher","first-page":"686","DOI":"10.1016\/j.jcp.2018.10.045","volume":"378","author":"M Raissi","year":"2019","unstructured":"M. Raissi, P. Perdikaris, G.E. Karniadakis, Physics-informed neural networks: A deep learning framework for solving forward and inverse problems involving nonlinear partial differential equations. J. Comput. Phys. 378, 686\u2013707 (2019). https:\/\/doi.org\/10.1016\/j.jcp.2018.10.045","journal-title":"J. Comput. Phys."},{"issue":"6","key":"437_CR43","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1109\/MSP.2024.3465896","volume":"41","author":"S Koyama","year":"2024","unstructured":"S. Koyama, J.G.C. Ribeiro, T. Nakamura, N. Ueno, M. Pezzoli, Physics-informed machine learning for sound field estimation: Fundamentals, state of the art, and challenges. IEEE Signal Process. Mag. 41(6), 60\u201371 (2024). https:\/\/doi.org\/10.1109\/MSP.2024.3465896","journal-title":"IEEE Signal Process. Mag."},{"key":"437_CR44","doi-asserted-by":"publisher","first-page":"2333","DOI":"10.1109\/TASLP.2020.3012058","volume":"28","author":"M Pezzoli","year":"2020","unstructured":"M. Pezzoli, F. Borra, F. Antonacci, S. Tubaro, A. Sarti, A parametric approach to virtual miking for sources of arbitrary directivity. IEEE\/ACM Trans. Audio Speech Lang. Process. 28, 2333\u20132348 (2020). https:\/\/doi.org\/10.1109\/TASLP.2020.3012058","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"437_CR45","doi-asserted-by":"publisher","unstructured":"D. Albertini, G. Greco, A. Bernardini, A. Sarti, in ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). Diffusion-based sound source localization using networks of planar microphone arrays (2023), pp. 1\u20135. https:\/\/doi.org\/10.1109\/ICASSP49357.2023.10095405","DOI":"10.1109\/ICASSP49357.2023.10095405"},{"key":"437_CR46","doi-asserted-by":"publisher","unstructured":"D. Albertini, A. Bernardini, G. Greco, A. Sarti, Diffusion-based sound source localization using a distributed network of microphone arrays. Sensors 25(7) (2025). https:\/\/doi.org\/10.3390\/s25072078","DOI":"10.3390\/s25072078"},{"key":"437_CR47","doi-asserted-by":"publisher","first-page":"65883","DOI":"10.1109\/ACCESS.2024.3398351","volume":"12","author":"AM Molaei","year":"2024","unstructured":"A.M. Molaei, B. Zakeri, S.M.H. Andargoli, M.A.B. Abbasi, V. Fusco, O. Yurduseven, A comprehensive review of direction-of-arrival estimation and localization approaches in mixed-field sources scenario. IEEE Access 12, 65883\u201365918 (2024). https:\/\/doi.org\/10.1109\/ACCESS.2024.3398351","journal-title":"IEEE Access"},{"key":"437_CR48","doi-asserted-by":"publisher","unstructured":"Y. Sumura, D.D. Carlo, A. Arie\u00a0Nugraha, Y. Bando, K. Yoshii, in 2024 18th International Workshop on Acoustic Signal Enhancement (IWAENC). Joint audio source localization and separation with distributed microphone arrays based on spatially-regularized multichannel nmf (2024), pp. 145\u2013149. https:\/\/doi.org\/10.1109\/IWAENC61483.2024.10694042","DOI":"10.1109\/IWAENC61483.2024.10694042"},{"key":"437_CR49","doi-asserted-by":"publisher","unstructured":"F. Miotello, P. Ostan, M. Pezzoli, L. Comanducci, A. Bernardini, F. Antonacci, A. Sarti, in 2024 IEEE International Conference on Acoustics, Speech, and Signal Processing Workshops (ICASSPW). Homula-rir: A room impulse response dataset for teleconferencing and spatial audio applications acquired through higher-order microphones and uniform linear microphone arrays (2024), pp. 795\u2013799. https:\/\/doi.org\/10.1109\/ICASSPW62465.2024.10626753","DOI":"10.1109\/ICASSPW62465.2024.10626753"},{"issue":"6","key":"437_CR50","doi-asserted-by":"publisher","first-page":"1006","DOI":"10.1109\/TASLP.2015.2418571","volume":"23","author":"A Schwarz","year":"2015","unstructured":"A. Schwarz, W. Kellermann, Coherent-to-diffuse power ratio estimation for dereverberation. IEEE Trans. Audio Speech Lang. Process. 23(6), 1006\u20131018 (2015)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"issue":"4","key":"437_CR51","doi-asserted-by":"publisher","first-page":"943","DOI":"10.1121\/1.382599","volume":"65","author":"JB Allen","year":"1979","unstructured":"J.B. Allen, D.A. Berkley, Image method for efficiently simulating small-room acoustics. J. Acoust. Soc. Am. 65(4), 943\u2013950 (1979)","journal-title":"J. Acoust. Soc. Am."},{"key":"437_CR52","unstructured":"B. Loesch, B. Yang, in International Workshop on Acoustic Signal Enhancement (IWAENC). Source number estimation and clustering for underdetermined blind source separatio (IEEE, Piscataway, NJ, 2008)."},{"key":"437_CR53","doi-asserted-by":"crossref","unstructured":"S. Araki, T. Nakatani, H. Sawada, S. Makino, in Independent Component Analysis and Signal Separation, ed by T. Adali, C. Jutten, J.M.T. Romano, A.K. Barros. Stereo source separation and source counting with map estimation with Dirichlet prior considering spatial aliasing problem (Springer, Berlin, 2009), pp. 742\u2013750","DOI":"10.1007\/978-3-642-00599-2_93"},{"issue":"1","key":"437_CR54","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1109\/TSP.2009.2030854","volume":"58","author":"S Arberet","year":"2010","unstructured":"S. Arberet, R. Gribonval, F. Bimbot, A robust method to count and locate audio sources in a multichannel underdetermined mixture. IEEE Trans. Signal Process. 58(1), 121\u2013133 (2010)","journal-title":"IEEE Trans. Signal Process."},{"key":"437_CR55","doi-asserted-by":"crossref","unstructured":"D. Pavlidi, A. Griffin, M. Puigt, A. Mouchtaris, in Sensor Array and Multichannel Signal Processing Workshop (SAM). Source counting in real-time sound source localization using a circular microphone array (IEEE, 2012), pp. 521\u2013524. IEEE 445 Hoes Lane Piscataway, NJ 08854-4141 USA","DOI":"10.1109\/SAM.2012.6250555"},{"key":"437_CR56","doi-asserted-by":"crossref","unstructured":"O. Walter, L. Drude, R. Haeb-Umbach, in International Conference on Acoustics, Speech and Signal Processing (ICASSP). Source counting in speech mixtures by nonparametric bayesian estimation of an infinite gaussian mixture model (IEEE, Piscataway, NJ, 2015), pp. 459\u2013463","DOI":"10.1109\/ICASSP.2015.7178011"},{"key":"437_CR57","doi-asserted-by":"crossref","unstructured":"S. Pasha, J. Donley, C. Ritz, in Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). Blind speaker counting in highly reverberant environments by clustering coherence features (2017), pp. 1684\u20131687","DOI":"10.1109\/APSIPA.2017.8282303"},{"key":"437_CR58","doi-asserted-by":"publisher","unstructured":"C. Xu, S. Li, G. Liu, Y. Zhang, E. Miluzzo, Y.-F. Chen, J. Li, B. Firner, in ACM International Joint Conference on Pervasive and Ubiquitous Computing. Crowd++: Unsupervised speaker count with smartphones, UbiComp\u201913 (Association for Computing Machinery, New York, 2013), pp. 43\u201352. https:\/\/doi.org\/10.1145\/2493432.2493435","DOI":"10.1145\/2493432.2493435"},{"issue":"2","key":"437_CR59","doi-asserted-by":"publisher","first-page":"268","DOI":"10.1109\/TASLP.2018.2877892","volume":"27","author":"F St\u00f6ter","year":"2019","unstructured":"F. St\u00f6ter, S. Chakrabarty, B. Edler, E.A.P. Habets, Countnet: Estimating the number of concurrent speakers using supervised learning. IEEE\/ACM Trans. Audio Speech Lang. Process. 27(2), 268\u2013282 (2019)","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Process."},{"key":"437_CR60","doi-asserted-by":"publisher","unstructured":"M. Cobos, F. Antonacci, A. Alexandridis, A. Mouchtaris, B. Lee, A survey of sound source localization methods in wireless acoustic sensor networks. Wirel. Commun. Mob. Comput. 2017 (Wiley,2017) pp.1\u201324 https:\/\/doi.org\/10.1155\/2017\/3956282","DOI":"10.1155\/2017\/3956282"},{"issue":"1","key":"437_CR61","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1109\/TSP.2004.838930","volume":"53","author":"X Sheng","year":"2005","unstructured":"X. Sheng, Y.-H. Hu, Maximum likelihood multiple-source localization using acoustic energy measurements with wireless sensor networks. IEEE Trans. Signal Process. 53(1), 44\u201353 (2005)","journal-title":"IEEE Trans. Signal Process."},{"issue":"2","key":"437_CR62","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1109\/TASL.2012.2215601","volume":"21","author":"A Canclini","year":"2013","unstructured":"A. Canclini, F. Antonacci, A. Sarti, S. Tubaro, Acoustic source localization with distributed asynchronous microphone networks. IEEE Trans. Audio Speech Lang. Process. 21(2), 439\u2013443 (2013)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"437_CR63","unstructured":"F. Borra, M. Pezzoli, L. Comanducci, A. Bernardini, F. Antonacci, S. Tubaro, A. Sarti, in 28th European Signal Processing Conference (EUSIPCO). A fast ray space transform for wave field processing using acoustic arrays (IEEE, Piscataway, NJ, 2020)"},{"key":"437_CR64","doi-asserted-by":"crossref","unstructured":"DiBiase, J.H.: A high-accuracy, low-latency technique for talker localization in reverberant environments using microphone arrays. PhD thesis (Brown University, 2000)","DOI":"10.1007\/978-3-662-04619-7_8"},{"key":"437_CR65","unstructured":"H. Teutsch, W. Kellermann, in 2008 IEEE International Conference on Acoustics, Speech and Signal Processing. Acoustic source detection and localization based on wavefield decomposition using circular microphone arrays (IEEE, Piscataway, NJ, 2008), pp. 273\u2013276."},{"issue":"1","key":"437_CR66","doi-asserted-by":"publisher","first-page":"34","DOI":"10.1109\/JSTSP.2018.2885636","volume":"13","author":"S Adavanne","year":"2019","unstructured":"S. Adavanne, A. Politis, J. Nikunen, T. Virtanen, Sound event localization and detection of overlapping sources using convolutional recurrent neural networks. IEEE J. Sel. Top. Signal Process. 13(1), 34\u201348 (2019)","journal-title":"IEEE J. Sel. Top. Signal Process."},{"issue":"7","key":"437_CR67","doi-asserted-by":"publisher","first-page":"3428","DOI":"10.3390\/app12073428","volume":"12","author":"L Chen","year":"2022","unstructured":"L. Chen, G. Chen, L. Huang, Y.-S. Choy, W. Sun, Multiple sound source localization, separation, and reconstruction by microphone array: A dnn-based approach. Appl. Sci. 12(7), 3428 (2022)","journal-title":"Appl. Sci."},{"key":"437_CR68","doi-asserted-by":"crossref","unstructured":"Y. Gong, S. Liu, X.-L. Zhang, APSIPA Annual Summit and Conference.  End-to-end two-dimensional sound source localization with ad-hoc microphone arrays. (Proceedings of 2022 APSIPA Annual Summit and Conference, Chiang Mai, Thailand, 2022).","DOI":"10.23919\/APSIPAASC55919.2022.9980181"},{"key":"437_CR69","doi-asserted-by":"crossref","unstructured":"G. Greco, S. Messana, M. Pezzoli, M. Cobos, F. Antonacci, in 2025 34nd European Signal Processing Conference (EUSIPCO). Dereverberation of relative harmonic coefficients via CNNs for acoustic source DOA estimation (IEEE, Palermo, 2025)","DOI":"10.23919\/EUSIPCO63237.2025.11226374"},{"issue":"2","key":"437_CR70","doi-asserted-by":"publisher","first-page":"145","DOI":"10.1109\/29.1509","volume":"36","author":"M Miyoshi","year":"1988","unstructured":"M. Miyoshi, Y. Kaneda, Inverse filtering of room acoustics. IEEE Trans. Acoust. Speech Signal Process. 36(2), 145\u2013152 (1988)","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"issue":"2","key":"437_CR71","doi-asserted-by":"publisher","first-page":"430","DOI":"10.1109\/TASL.2006.881698","volume":"15","author":"M Delcroix","year":"2007","unstructured":"M. Delcroix, T. Hikichi, M. Miyoshi, Precise dereverberation using multichannel linear prediction. IEEE Trans. Audio Speech Lang. Process. 15(2), 430\u2013440 (2007)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"437_CR72","doi-asserted-by":"crossref","unstructured":"H. Buchner, R. Aichner, W. Kellermann, in International Conference on Acoustics, Speech and Signal Processing, (ICASSP). TRINICON: A versatile framework for multichannel blind signal processing, vol. 3 (IEEE, Piscataway, NJ, 2004), p. 889.","DOI":"10.1109\/ICASSP.2004.1326688"},{"issue":"4","key":"437_CR73","doi-asserted-by":"publisher","first-page":"2337","DOI":"10.1121\/1.4750493","volume":"132","author":"O Thiergart","year":"2012","unstructured":"O. Thiergart, G. Del Galdo, E.A.P. Habets, On the spatial coherence in mixed sound fields and its application to signal-to-diffuse ratio estimation. J. Acoust. Soc. Am. 132(4), 2337\u20132346 (2012)","journal-title":"J. Acoust. Soc. Am."},{"key":"437_CR74","doi-asserted-by":"crossref","unstructured":"S.V. Vaseghi, Advanced Digital Signal Processing and Noise Reduction (Wiley, Hoboken, NJ, 2008)","DOI":"10.1002\/9780470740156"},{"issue":"1","key":"437_CR75","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/97.736233","volume":"6","author":"J Sohn","year":"1999","unstructured":"J. Sohn, N.S. Kim, W. Sung, A statistical model-based voice activity detection. IEEE Signal Process. Lett. 6(1), 1\u20133 (1999)","journal-title":"IEEE Signal Process. Lett."},{"key":"437_CR76","doi-asserted-by":"crossref","unstructured":"R. Zelinski, in International Conference on Acoustics, Speech, and Signal Processing, (ICASSP). A microphone array with adaptive post-filtering for noise reduction in reverberant rooms, vol. 5, (IEEE, Piscataway, NJ, 1988), pp. 2578\u20132581.","DOI":"10.1109\/ICASSP.1988.197172"},{"issue":"6","key":"437_CR77","doi-asserted-by":"publisher","first-page":"709","DOI":"10.1109\/TSA.2003.818212","volume":"11","author":"IA McCowan","year":"2003","unstructured":"I.A. McCowan, H. Bourlard, Microphone array post-filter based on noise field coherence. IEEE Trans. Speech Audio Process. 11(6), 709\u2013716 (2003)","journal-title":"IEEE Trans. Speech Audio Process."},{"issue":"1","key":"437_CR78","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1109\/TAES.1970.310015","volume":"AES\u20136","author":"RJ Polge","year":"1970","unstructured":"R.J. Polge, E.M. Mitchell, Impulse response determination by cross correlation. IEEE Trans. Aerosp. Electron. Syst. AES\u20136(1), 91\u201397 (1970). https:\/\/doi.org\/10.1109\/TAES.1970.310015","journal-title":"IEEE Trans. Aerosp. Electron. Syst."},{"issue":"4","key":"437_CR79","doi-asserted-by":"publisher","first-page":"4141","DOI":"10.1109\/TIE.2023.3279569","volume":"71","author":"J Cao","year":"2024","unstructured":"J. Cao, Z. Yang, X. Chen, R. Yan, From pseudo to real: Generalized subspace method for power spectrum reconstruction. IEEE Trans. Ind. Electron. 71(4), 4141\u20134150 (2024). https:\/\/doi.org\/10.1109\/TIE.2023.3279569","journal-title":"IEEE Trans. Ind. Electron."},{"key":"437_CR80","unstructured":"M. Ester, H.-P. Kriegel, J. Sander, X. Xu, in Proceedings of the Second International Conference on Knowledge Discovery and Data Mining (KDD). A density-based algorithm for discovering clusters in large spatial databases with noise (AAAI Press, Portland, 1996), pp. 226\u2013231"},{"issue":"11","key":"437_CR81","first-page":"1","volume":"2025","author":"L Madmoni","year":"2025","unstructured":"L. Madmoni, Z. Ben-Hur, J. Donley, V. Tourbabin, B. Rafaely, Design and analysis of binaural signal matching with arbitrary microphone arrays and listener head rotations. EURASIP J. Audio Speech Music Process. 2025(11), 1\u201318 (2025)","journal-title":"EURASIP J. Audio Speech Music Process."},{"key":"437_CR82","doi-asserted-by":"publisher","first-page":"233121652091957","DOI":"10.1177\/2331216520919573","volume":"24","author":"N G\u00f6\u00dfling","year":"2020","unstructured":"N. G\u00f6\u00dfling, D. Marquardt, S. Doclo, Perceptual evaluation of binaural mvdr-based algorithms to preserve the interaural coherence of diffuse noise fields. Trends Hear. 24, 2331216520919573 (2020)","journal-title":"Trends Hear."},{"key":"437_CR83","doi-asserted-by":"publisher","unstructured":"Hardin, R.H., Sloane, N.J.A. McLaren\u2019s improved snub cube and other new spherical designs in three dimensions. Discrete Comput Geom 15, 429\u2013441 (SpringerNature, 1996). https:\/\/doi.org\/10.1007\/BF02711518","DOI":"10.1007\/BF02711518"},{"key":"437_CR84","unstructured":"European Broadcasting Union: Sound quality assessment material recording for subjective tests. Technical report, European Broadcasting Union (2008). European Broadcasting Union.(Accessed: February 10, 2025) https:\/\/tech.ebu.ch\/publications\/sqamcd"},{"key":"437_CR85","unstructured":"Habets, E.A.P.: Room impulse response generator. Technical Report 2.4, Technische Universiteit Eindhoven, Tech. Rep (2006)"},{"issue":"10","key":"437_CR86","doi-asserted-by":"publisher","first-page":"1796","DOI":"10.1109\/TASLP.2016.2585862","volume":"24","author":"N Epain","year":"2016","unstructured":"N. Epain, C.T. Jin, Spherical harmonic signal covariance and sound field diffuseness. IEEE\/ACM Trans. Audio Speech Lang. Proc. 24(10), 1796\u20131807 (2016). https:\/\/doi.org\/10.1109\/TASLP.2016.2585862","journal-title":"IEEE\/ACM Trans. Audio Speech Lang. Proc."},{"issue":"10","key":"437_CR87","doi-asserted-by":"publisher","first-page":"713","DOI":"10.1016\/j.apacoust.2011.04.004","volume":"72","author":"JS Bradley","year":"2011","unstructured":"J.S. Bradley, Review of objective room acoustics measures and future needs. Appl. Acoust. 72(10), 713\u2013720 (2011). https:\/\/doi.org\/10.1016\/j.apacoust.2011.04.004","journal-title":"Appl. Acoust."},{"key":"437_CR88","doi-asserted-by":"publisher","unstructured":"T.D. Abhayapala, D.B. Ward, in 2002 IEEE International Conference on Acoustics, Speech, and Signal Processing. Theory and design of high order sound field microphones using spherical microphone array, vol. 2 (2002), pp. 1949\u20131952. https:\/\/doi.org\/10.1109\/ICASSP.2002.5745011","DOI":"10.1109\/ICASSP.2002.5745011"},{"key":"437_CR89","doi-asserted-by":"publisher","unstructured":"J. Richter, Y.-C. Wu, S. Krenn, S. Welker, B. Lay, S. Watanabe, A. Richard, T. Gerkmann, in ISCA Interspeech. EARS: An anechoic fullband speech dataset benchmarked for speech enhancement and dereverberation (Proc. Interspeech, Kos, Grece, 2024), pp. 4873\u20134877.\u00a0https:\/\/doi.org\/10.21437\/Interspeech.2024-1532024","DOI":"10.21437\/Interspeech.2024-1532024"},{"issue":"2","key":"437_CR90","doi-asserted-by":"publisher","first-page":"522","DOI":"10.1109\/TMM.2018.2856090","volume":"21","author":"B Li","year":"2019","unstructured":"B. Li, X. Liu, K. Dinesh, Z. Duan, G. Sharma, Creating a multitrack classical music performance dataset for multimodal music analysis: Challenges, insights, and applications. IEEE Trans. Multimed. 21(2), 522\u2013535 (2019). https:\/\/doi.org\/10.1109\/TMM.2018.2856090","journal-title":"IEEE Trans. Multimed."},{"key":"437_CR91","doi-asserted-by":"crossref","unstructured":"P. Ostan, F.D. Gaudio, F. Miotello, M. Pezzoli, F. Antonacci, in Proceedings of the Forum Acusticum. VR-PTOLEMAIC: A virtual environment for the perceptual testing of spatial audio algorithms, vol 2025 (EAA, Malaga, Spain, 2025)","DOI":"10.61782\/fa.2025.0965"},{"key":"437_CR92","unstructured":"O.S. Rummukainen, T. Robotham, S.J. Schlecht, A. Plinge, J. Herre, E.A.P. Habets, in AES International Conference on Audio for Virtual and Augmented Reality. Audio quality evaluation in virtual reality: Multiple stimulus ranking with behavior tracking (2018), pp. 1\u201310. (Accessed: February 10, 2025) https:\/\/www.aes.org\/e-lib\/browse.cfm?elib=19678"},{"key":"437_CR93","doi-asserted-by":"publisher","unstructured":"A. Carlini, C. Bordeau, M. Ambard, Auditory localization: a comprehensive practical review. Front. Psychol. Volume 15 - 2024 (2024). https:\/\/doi.org\/10.3389\/fpsyg.2024.1408073","DOI":"10.3389\/fpsyg.2024.1408073"}],"container-title":["EURASIP Journal on Audio, Speech, and Music Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13636-025-00437-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s13636-025-00437-y","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s13636-025-00437-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,12]],"date-time":"2026-01-12T12:05:11Z","timestamp":1768219511000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1186\/s13636-025-00437-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,4]]},"references-count":93,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2026,12]]}},"alternative-id":["437"],"URL":"https:\/\/doi.org\/10.1186\/s13636-025-00437-y","relation":{},"ISSN":["1687-4722"],"issn-type":[{"value":"1687-4722","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12,4]]},"assertion":[{"value":"4 June 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 November 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 December 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"4"}}