{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T04:52:24Z","timestamp":1725511944819},"publisher-location":"Berlin, Heidelberg","reference-count":19,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540695677"},{"type":"electronic","value":"9783540695684"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-69568-4_4","type":"book-chapter","created":{"date-parts":[[2007,5,17]],"date-time":"2007-05-17T19:03:17Z","timestamp":1179428597000},"page":"69-80","source":"Crossref","is-referenced-by-count":3,"title":["An Audio-Visual Particle Filter for Speaker Tracking on the CLEAR\u201906 Evaluation Dataset"],"prefix":"10.1007","author":[{"given":"Kai","family":"Nickel","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tobias","family":"Gehrig","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hazim K.","family":"Ekenel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"John","family":"McDonough","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rainer","family":"Stiefelhagen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"4_CR1","unstructured":"CLEAR 2006 Evaluation and Workshop Campaign, April 6-7, Southampton, UK (2006), http:\/\/clear-evaluation.org"},{"key":"4_CR2","unstructured":"Brandstein, M.S.: A framework for speech source localization using sensor arrays. PhD thesis, Brown University, Providence, RI (May 1995)"},{"issue":"1","key":"4_CR3","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1109\/89.554268","volume":"5","author":"M.S. Brandstein","year":"1997","unstructured":"Brandstein, M.S., Adcock, J.E., Silverman, H.F.: A closed-form location estimator for use with room environment microphone arrays. IEEE Trans. Speech Audio Proc.\u00a05(1), 45\u201350 (1997)","journal-title":"IEEE Trans. Speech Audio Proc."},{"key":"4_CR4","doi-asserted-by":"crossref","unstructured":"Checka, N., Wilson, K., Rangarajan, V., Darrell, T.: A probabilistic framework for multi-modal multi-person tracking. In: IEEE Workshop on Multi-Object Tracking (in conjunction with CVPR) (2003)","DOI":"10.1109\/CVPRW.2003.10099"},{"issue":"6","key":"4_CR5","doi-asserted-by":"publisher","first-page":"549","DOI":"10.1109\/TSA.2003.818025","volume":"11","author":"J. Chen","year":"2003","unstructured":"Chen, J., Benesty, J., Huang, Y.A.: Robust time delay estimation exploiting redundancy among multiple microphones. IEEE Trans. Speech Audio Proc.\u00a011(6), 549\u2013557 (2003)","journal-title":"IEEE Trans. Speech Audio Proc."},{"key":"4_CR6","unstructured":"Gatica-Perez, D., Lathoud, G., McCowan, I., Odobez, J.-M.: A mixed-state i-particle filter for multi-camera speaker tracking. In: Proc. IEEE ICCV Workshop on Multimedia Technologies in E-Learning and Collaboration (ICCV-WOMTEC) (2003)"},{"issue":"8","key":"4_CR7","doi-asserted-by":"publisher","first-page":"943","DOI":"10.1109\/89.966097","volume":"9","author":"Y. Huang","year":"2001","unstructured":"Huang, Y., Benesty, J., Elko, G.W., Mersereau, R.M.: Real-time passive source localization: A practical linear-correction least-squares approach. IEEE Trans. Speech Audio Proc.\u00a09(8), 943\u2013956 (2001)","journal-title":"IEEE Trans. Speech Audio Proc."},{"issue":"1","key":"4_CR8","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1008078328650","volume":"29","author":"M. Isard","year":"1998","unstructured":"Isard, M., Blake, A.: Condensation\u2013conditional density propagation for visual tracking. International Journal of Computer Vision\u00a029(1), 5\u201328 (1998)","journal-title":"International Journal of Computer Vision"},{"key":"4_CR9","doi-asserted-by":"crossref","unstructured":"Gehrig, T., Nickel, K., Ekenel, H.K., Klee, U., McDonough, J.: Kalman filters for audio-video source localization. In: IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (Oct. 2005)","DOI":"10.1109\/ASPAA.2005.1540183"},{"key":"4_CR10","unstructured":"Klee, U., Gehrig, T., McDonough, J.: Kalman filters for time delay of arrival-based source localization. EURASIP Special Issue on Multichannel Speech Processing, submitted for publication"},{"key":"4_CR11","unstructured":"Kruppa, H., Castrillon-Santana, M., Schiele, B.: Fast and robust face finding via local context. In: IEEE Intl. Workshop on Visual Surveillance and Performance Evaluation of Tracking and Surveillance (Oct. 2003)"},{"key":"4_CR12","doi-asserted-by":"crossref","unstructured":"Lienhart, R., Maydt, J.: An extended set of haar-like features for rapid object detection. In: ICIP, vol.\u00a01, pp. 900\u2013903 (Sept. 2002)","DOI":"10.1109\/ICIP.2002.1038171"},{"key":"4_CR13","unstructured":"Mikic, I., Santini, S., Jain, R.: Tracking objects in 3d using multiple camera views. In: ACCV (2000)"},{"key":"4_CR14","first-page":"273","volume":"2","author":"M. Omologo","year":"1994","unstructured":"Omologo, M., Svaizer, P.: Acoustic event localization using a crosspower-spectrum phase based technique. Proc. ICASSP\u00a02, 273\u2013276 (1994)","journal-title":"Proc. ICASSP"},{"key":"4_CR15","doi-asserted-by":"crossref","first-page":"741","DOI":"10.1109\/ICCV.2001.937600","volume":"1","author":"J. Vermaak","year":"2001","unstructured":"Vermaak, J., Gangnet, M., Blake, A., P\u00e9rez, P.: Sequential monte carlo fusion of sound and vision for speaker tracking. Proc. IEEE Intl. Conf. on Computer Vision\u00a01, 741\u2013746 (2001)","journal-title":"Proc. IEEE Intl. Conf. on Computer Vision"},{"key":"4_CR16","unstructured":"Viola, P., Jones, M.: Robust real-time object detection. In: ICCV Workshop on Statistical and Computation Theories of Vision (July 2001)"},{"issue":"6","key":"4_CR17","doi-asserted-by":"publisher","first-page":"826","DOI":"10.1109\/TSA.2003.818112","volume":"11","author":"D.B. Ward","year":"2003","unstructured":"Ward, D.B., Lehmann, E.A., Williamson, R.C.: Particle filtering algorithms for tracking an acoustic source in a reverberant environment. IEEE Trans. Speech Audio Proc.\u00a011(6), 826\u2013836 (2003)","journal-title":"IEEE Trans. Speech Audio Proc."},{"key":"4_CR18","unstructured":"W\u00f6lfel, M., Nickel, K., McDonough, J.: Microphone Array Driven Speech Recognition: Influence of Localization on the Word Error Rate. In: 2nd Joint Workshop on Multimodal Interaction and Related Machine Learning Algorithms, Edinburgh, 11-13 July (2005)"},{"key":"4_CR19","doi-asserted-by":"crossref","unstructured":"Zotkin, D., Duraiswami, R., Davis, L.: Joint audio-visual tracking using particle filters. EURASIP journal on Applied Signal Processing\u00a011 (2002)","DOI":"10.1155\/S1110865702206058"}],"container-title":["Lecture Notes in Computer Science","Multimodal Technologies for Perception of Humans"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-69568-4_4.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,11,19]],"date-time":"2020-11-19T05:01:35Z","timestamp":1605762095000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-69568-4_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540695677","9783540695684"],"references-count":19,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-69568-4_4","relation":{},"subject":[]}}