{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:24:24Z","timestamp":1750307064332,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":17,"publisher":"ACM","license":[{"start":{"date-parts":[[2012,10,22]],"date-time":"2012-10-22T00:00:00Z","timestamp":1350864000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2012,10,22]]},"DOI":"10.1145\/2388676.2388760","type":"proceedings-article","created":{"date-parts":[[2012,10,24]],"date-time":"2012-10-24T18:44:56Z","timestamp":1351104296000},"page":"371-378","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Audio-visual robot command recognition"],"prefix":"10.1145","author":[{"given":"Jordi","family":"Sanchez-Riera","sequence":"first","affiliation":[{"name":"INRIA Rhone Alpes, Montbonnot, France"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xavier","family":"Alameda-Pineda","sequence":"additional","affiliation":[{"name":"INRIA Rhone Alpes, Montbonnot, France"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Radu","family":"Horaud","sequence":"additional","affiliation":[{"name":"INRIA Rhone Alpes, Montbonnor, France"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2012,10,22]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/2070481.2070527"},{"key":"e_1_3_2_1_2_1","volume-title":"Journal of Multimodal User Interfaces","author":"Alameda-Pineda Xavier","year":"2012","unstructured":"Xavier Alameda-Pineda , Jordi Sanchez-Riera , Vojtech Franc , Johannes Wienke , Jan \u010cech , Kaustubh Kulkarni , Antoine Deleforge , and Radu P. Horaud . Ravel: An annotated corpus for training robots with audio visual abilities . Journal of Multimodal User Interfaces , 2012 . Xavier Alameda-Pineda, Jordi Sanchez-Riera, Vojtech Franc, Johannes Wienke, Jan \u010cech, Kaustubh Kulkarni, Antoine Deleforge, and Radu P. Horaud. Ravel: An annotated corpus for training robots with audio visual abilities. Journal of Multimodal User Interfaces, 2012."},{"key":"e_1_3_2_1_3_1","volume-title":"Pattern Recognition and Machine Learning (Information Science and Statistics)","author":"Bishop Christopher M.","year":"2006","unstructured":"Christopher M. Bishop . Pattern Recognition and Machine Learning (Information Science and Statistics) . Springer-Verlag New York, Inc. , Secaucus, NJ, USA , 2006 . Christopher M. Bishop. Pattern Recognition and Machine Learning (Information Science and Statistics). Springer-Verlag New York, Inc., Secaucus, NJ, USA, 2006."},{"key":"e_1_3_2_1_4_1","unstructured":"Mike Brookes. VOICEBOX: Speech processing toolbox for MATLAB. http:\/\/www.ee.ic.ac.uk\/hp\/staff\/dmb\/voicebox\/voicebox.html.  Mike Brookes. VOICEBOX: Speech processing toolbox for MATLAB. http:\/\/www.ee.ic.ac.uk\/hp\/staff\/dmb\/voicebox\/voicebox.html."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/1631272.1631277"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1162\/NECO_a_00074"},{"key":"e_1_3_2_1_7_1","volume-title":"Proceedings of the IEEE\/RSJ International Conference on Intelligent Robots and Systems","author":"Lacheze L.","year":"2009","unstructured":"L. Lacheze , Y. Guo , R. Benosman , B. Gas , and C. Couverture . Audio\/video fusion for objects recognition . In Proceedings of the IEEE\/RSJ International Conference on Intelligent Robots and Systems , 2009 . L. Lacheze, Y. Guo, R. Benosman, B. Gas, and C. Couverture. Audio\/video fusion for objects recognition. In Proceedings of the IEEE\/RSJ International Conference on Intelligent Robots and Systems, 2009."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-005-1838-7"},{"key":"e_1_3_2_1_9_1","volume-title":"Proceedings of the IEEE International Conference on Audio Speech and Signal Processing","author":"Liu Ming","year":"2008","unstructured":"Ming Liu , Yun Fu , and Thomas S. Huang . An audio-visual fusion framework with joint dimensionality reduction . In Proceedings of the IEEE International Conference on Audio Speech and Signal Processing , 2008 . Ming Liu, Yun Fu, and Thomas S. Huang. An audio-visual fusion framework with joint dimensionality reduction. In Proceedings of the IEEE International Conference on Audio Speech and Signal Processing, 2008."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1007\/11875581_99"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.5555\/1788524.1788584"},{"key":"e_1_3_2_1_12_1","volume-title":"Pearson","author":"Rabiner Lawrence R","year":"2011","unstructured":"Lawrence R Rabiner and Ronald W Schafer . Theory and Applications of Digital Speech Processing . Pearson , 2011 . Lawrence R Rabiner and Ronald W Schafer. Theory and Applications of Digital Speech Processing. Pearson, 2011."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5946966"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.5555\/1787422.1787428"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33863-2_33"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995442"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10044-005-0244-7"}],"event":{"name":"ICMI '12: INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"],"location":"Santa Monica California USA","acronym":"ICMI '12"},"container-title":["Proceedings of the 14th ACM international conference on Multimodal interaction"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2388676.2388760","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2388676.2388760","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T09:21:20Z","timestamp":1750238480000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2388676.2388760"}},"subtitle":["D-META'12 grand challenge"],"short-title":[],"issued":{"date-parts":[[2012,10,22]]},"references-count":17,"alternative-id":["10.1145\/2388676.2388760","10.1145\/2388676"],"URL":"https:\/\/doi.org\/10.1145\/2388676.2388760","relation":{},"subject":[],"published":{"date-parts":[[2012,10,22]]},"assertion":[{"value":"2012-10-22","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}