{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T17:57:21Z","timestamp":1743098241230,"version":"3.40.3"},"publisher-location":"Cham","reference-count":17,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319181639"},{"type":"electronic","value":"9783319181646"}],"license":[{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2015,1,1]],"date-time":"2015-01-01T00:00:00Z","timestamp":1420070400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015]]},"DOI":"10.1007\/978-3-319-18164-6_15","type":"book-chapter","created":{"date-parts":[[2015,6,5]],"date-time":"2015-06-05T08:55:38Z","timestamp":1433494538000},"page":"149-157","source":"Crossref","is-referenced-by-count":0,"title":["Integration of Audio and Video Clues for Source Localization by a Robotic Head"],"prefix":"10.1007","author":[{"given":"Raffaele","family":"Parisi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Danilo","family":"Comminiello","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Michele","family":"Scarpiniti","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Aurelio","family":"Uncini","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"15_CR1","doi-asserted-by":"publisher","first-page":"214","DOI":"10.1080\/14786440709463595","volume":"13","author":"L. Rayleigh","year":"1907","unstructured":"Rayleigh, L.: On our perception of sound direction. Phil. Mag.\u00a013, 214\u2013232 (1907)","journal-title":"Phil. Mag."},{"key":"15_CR2","doi-asserted-by":"crossref","unstructured":"Blauert, J.: Spatial Hearing - The Psychophysics of Human Sound Localization. MIT Press (1996)","DOI":"10.7551\/mitpress\/6391.001.0001"},{"issue":"1","key":"15_CR3","doi-asserted-by":"publisher","first-page":"68","DOI":"10.1109\/TASL.2009.2023644","volume":"18","author":"M. Raspaud","year":"2010","unstructured":"Raspaud, M., Viste, H., Evangelista, G.: Binaural source localization by joint estimation of ILD and ITD. IEEE Trans. on Audio, Speech and Language Processing\u00a018(1), 68\u201377 (2010)","journal-title":"IEEE Trans. on Audio, Speech and Language Processing"},{"issue":"9","key":"15_CR4","doi-asserted-by":"publisher","first-page":"2272","DOI":"10.1109\/TIP.2007.901813","volume":"16","author":"G. Monaci","year":"2007","unstructured":"Monaci, G., Jost, P., Vandergheynst, P., Mail\u00e9, B., Lesage, S., Gribonval, R.: Learning multimodal dictionaries. IEEE Trans. on Image Processing\u00a016(9), 2272\u20132283 (2007)","journal-title":"IEEE Trans. on Image Processing"},{"issue":"8","key":"15_CR5","doi-asserted-by":"publisher","first-page":"1541","DOI":"10.1109\/TMM.2008.2007344","volume":"10","author":"C. Zhang","year":"2008","unstructured":"Zhang, C., Yin, P., Rui, Y., Cutler, R., Viola, P., Sun, X., Pinto, N., Zhang, Z.: Boosting-based multimodal speaker detection for distributed meeting videos. IEEE Trans. on Multimedia\u00a010(8), 1541\u20131552 (2008)","journal-title":"IEEE Trans. on Multimedia"},{"issue":"5","key":"15_CR6","doi-asserted-by":"publisher","first-page":"845","DOI":"10.1109\/JSTSP.2010.2050519","volume":"4","author":"J. Schmalenstroeer","year":"2010","unstructured":"Schmalenstroeer, J., Haeb-Umbach, R.: Online diarization of streaming audio-visual data for smart envirnments. IEEE Journ. of Selected Topics in Signal Processing\u00a04(5), 845\u2013856 (2010)","journal-title":"IEEE Journ. of Selected Topics in Signal Processing"},{"issue":"5","key":"15_CR7","doi-asserted-by":"publisher","first-page":"466","DOI":"10.1049\/iet-spr.2011.0124","volume":"6","author":"S.M. Naqvi","year":"2012","unstructured":"Naqvi, S.M., Wang, W., Khan, M.S., Barnard, M., Chambers, J.A.: Multimodal (audio-visual) source separation exploiting multi-speaker tracking, robust beamforming and time-frequency masking. IET Signal Processing\u00a06(5), 466\u2013477 (2012)","journal-title":"IET Signal Processing"},{"issue":"4","key":"15_CR8","doi-asserted-by":"publisher","first-page":"1032","DOI":"10.1109\/TMM.2014.2305632","volume":"16","author":"V.P. Minotto","year":"2014","unstructured":"Minotto, V.P., Jung, C.R., Lee, B.: Simultaneous-speaker voice activity detection and localization using mid-fusion of svm and hmms. IEEE Trans. on Multimedia\u00a016(4), 1032\u20131044 (2014)","journal-title":"IEEE Trans. on Multimedia"},{"key":"15_CR9","unstructured":"Wang, D., Brown, G.J.: Computational Auditory Scene Analysis - Principles, Algorithms, and Applications. IEEE Press, Wiley Interscience (2006)"},{"key":"15_CR10","unstructured":"Algazi, V.R., Duda, R.O., Thompson, D.M., Avendano, C.: The CIPIC HRTF database. In: 2001 IEEE Workshop on Applications of Digital Signal Processing to Audio and Acoustics (2001)"},{"key":"15_CR11","unstructured":"Kuttruff, H.: Room Acoustics, 4th edn. Taylor & Francis (2000)"},{"issue":"3","key":"15_CR12","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1016\/S0165-1684(97)00051-0","volume":"59","author":"A. St\u00e9phenne","year":"1997","unstructured":"St\u00e9phenne, A., Champagne, B.: A new cepstral prefiltering technique for estimating time delay under reverberant conditions. Signal Processing\u00a059(3), 253\u2013266 (1997)","journal-title":"Signal Processing"},{"key":"15_CR13","doi-asserted-by":"crossref","unstructured":"Parisi, R., Gazzetta, R., Di Claudio, E.: Prefiltering approaches for time delay estimation in reverberant environments. In: Proceedings of ICASSP, vol.\u00a03, pp. III-2997\u2013III-3000 (2002)","DOI":"10.1109\/ICASSP.2002.1005317"},{"key":"15_CR14","doi-asserted-by":"crossref","unstructured":"Zannini, C.M., Parisi, R., Uncini, A.: Binaural sound source localization in the presence of reverberation. In: Proc. of the 17th International Conference on Digital Signal Processing (July 2011)","DOI":"10.1109\/ICDSP.2011.6004954"},{"issue":"2","key":"15_CR15","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1109\/LSP.2011.2180376","volume":"19","author":"R. Parisi","year":"2012","unstructured":"Parisi, R., Camoes, F., Scarpiniti, M., Uncini, A.: Cepstrum prefiltering for binaural source localization in reverberant environments. IEEE Signal Processing Letters\u00a019(2), 99\u2013102 (2012)","journal-title":"IEEE Signal Processing Letters"},{"issue":"2","key":"15_CR16","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1023\/B:VISI.0000013087.49260.fb","volume":"57","author":"P. Viola","year":"2004","unstructured":"Viola, P., Jones, M.J.: Robust real-time face detection. Int. J. of Computer Vision\u00a057(2), 137\u2013154 (2004)","journal-title":"Int. J. of Computer Vision"},{"issue":"1","key":"15_CR17","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1006\/jcss.1997.1504","volume":"55","author":"Y.Y. Freund","year":"1997","unstructured":"Freund, Y.Y., Schapire, R.E.: A decision-theoretic generalization of on-line learning and an application to boosting. Journal of Computer and System Sciences\u00a055(1), 119\u2013139 (1997)","journal-title":"Journal of Computer and System Sciences"}],"container-title":["Smart Innovation, Systems and Technologies","Advances in Neural Networks: Computational and Theoretical Issues"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-18164-6_15","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,31]],"date-time":"2023-01-31T03:55:16Z","timestamp":1675137316000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-18164-6_15"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015]]},"ISBN":["9783319181639","9783319181646"],"references-count":17,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-18164-6_15","relation":{},"ISSN":["2190-3018","2190-3026"],"issn-type":[{"type":"print","value":"2190-3018"},{"type":"electronic","value":"2190-3026"}],"subject":[],"published":{"date-parts":[[2015]]}}}