{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,17]],"date-time":"2025-10-17T00:04:23Z","timestamp":1760659463455,"version":"build-2065373602"},"publisher-location":"New York, NY, USA","reference-count":29,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,11,4]],"date-time":"2024-11-04T00:00:00Z","timestamp":1730678400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,11,4]]},"DOI":"10.1145\/3686215.3690153","type":"proceedings-article","created":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T12:17:01Z","timestamp":1730290621000},"page":"51-55","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Levels of Multimodal Interaction"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-9231-603X","authenticated-orcid":false,"given":"Anoop K.","family":"Sinha","sequence":"first","affiliation":[{"name":"Google, United States"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4922-6601","authenticated-orcid":false,"given":"Chinmay","family":"Kulkarni","sequence":"additional","affiliation":[{"name":"Google, United States"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7772-0530","authenticated-orcid":false,"given":"Alex","family":"Olwal","sequence":"additional","affiliation":[{"name":"Google, United States"}]}],"member":"320","published-online":{"date-parts":[[2024,11,4]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"Adobe. 2024. Adobe Firefly. https:\/\/www.adobe.com\/products\/firefly.html"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.73"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2798607"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/800250.807503"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/266180.266328"},{"key":"e_1_3_2_1_6_1","volume-title":"Gemini: A Family of Highly Capable Multimodal Models. arXiv [cs.CL].","author":"Gemini Team","year":"2023","unstructured":"Gemini Team. 2023. Gemini: A Family of Highly Capable Multimodal Models. arXiv [cs.CL]. Retrieved from http:\/\/arxiv.org\/abs\/2312.11805"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-49457-4_1"},{"key":"e_1_3_2_1_8_1","volume-title":"Proceedings of the 2nd international conference on Intelligent user interfaces, 61\u201368","author":"Douglas B.","year":"1997","unstructured":"Douglas B. Moran, Adam J. Cheyer, Luc E. Julia, David L. Martin, and Sangkyu Park. 1997. Multimodal user interfaces in the Open Agent Architecture. In Proceedings of the 2nd international conference on Intelligent user interfaces, 61\u201368."},{"key":"e_1_3_2_1_9_1","volume-title":"Multimodal Interfaces: A Special Issue of Human Computer Interaction","author":"Thomas Moran","year":"1997","unstructured":"Thomas Moran. 1997. Multimodal Interfaces: A Special Issue of Human Computer Interaction. CRC Press. Retrieved from https:\/\/books.google.com\/books\/about\/Multimodal_Interfaces.html?hl=&id=lQsUPQAACAAJ"},{"key":"e_1_3_2_1_10_1","volume-title":"Brubaker","author":"Meredith Ringel Morris R","year":"2024","unstructured":"Meredith Ringel Morris and Jed R. Brubaker. 2024. Generative Ghosts: Anticipating Benefits and Risks of AI Afterlives. arXiv [cs.CY]. Retrieved from http:\/\/arxiv.org\/abs\/2402.01662"},{"key":"e_1_3_2_1_11_1","unstructured":"Meredith Ringel Morris Jascha Sohl-dickstein Noah Fiedel Tris Warkentin Allan Dafoe Aleksandra Faust Clement Farabet and Shane Legg. 2023. Levels of AGI: Operationalizing Progress on the Path to AGI. arXiv [cs.AI]. Retrieved from http:\/\/arxiv.org\/abs\/2311.02462"},{"key":"e_1_3_2_1_12_1","unstructured":"OpenAI. 2023. GPT-4 Technical Report. arXiv [cs.CL]. Retrieved from http:\/\/arxiv.org\/abs\/2303.08774"},{"key":"e_1_3_2_1_13_1","volume-title":"Cohen","author":"Sharon Oviatt R","year":"2015","unstructured":"Sharon Oviatt and Philip R. Cohen. 2015. The paradigm shift to multimodality in contemporary computer interfaces. Springer Nature."},{"key":"e_1_3_2_1_14_1","volume-title":"Retrieved","author":"Seymour A.","year":"1966","unstructured":"Seymour A. Papert. 1966. The Summer Vision Project. Retrieved May 21, 2024 from https:\/\/dspace.mit.edu\/handle\/1721.1\/6125?show=full"},{"volume-title":"Affective computing","author":"Rosalind W.","key":"e_1_3_2_1_15_1","unstructured":"Rosalind W. Picard. 2000. Affective computing. MIT press."},{"key":"e_1_3_2_1_16_1","volume-title":"Machine perception of three-dimensional solids","author":"Lawrence G.","year":"2024","unstructured":"Lawrence G. Roberts. 1963. Machine perception of three-dimensional solids. Massachusetts Institute of Technology. Retrieved May 21, 2024 from https:\/\/dspace.mit.edu\/handle\/1721.1\/11589?show=full"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/1461551.1461591"},{"key":"e_1_3_2_1_18_1","unstructured":"Yudai Tanaka Angela Vujic Pattie Maes Robert J. K. Jacob Olaf Blanke Sho Nakagome and Pedro Lopes. Panel: NeuroCHI: Are We Prepared for the Integration of the Brain with Computing? Retrieved from https:\/\/www.youtube.com\/watch?v=IDGRn0PHEgo"},{"key":"e_1_3_2_1_19_1","unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan N. Gomez Lukasz Kaiser and Illia Polosukhin. 2017. Attention Is All You Need. arXiv [cs.CL]. Retrieved from http:\/\/arxiv.org\/abs\/1706.03762"},{"volume-title":"The Free Encyclopedia.","author":"Wikipedia","key":"e_1_3_2_1_20_1","unstructured":"Wikipedia contributors. 2023. Timeline of speech and voice recognition. Wikipedia, The Free Encyclopedia. Retrieved from https:\/\/en.wikipedia.org\/w\/index.php?title=Timeline_of_speech_and_voice_recognition&oldid=1168514805"},{"volume-title":"International Conference on Multimodal Interaction. ICMI.","key":"e_1_3_2_1_21_1","unstructured":"2002. International Conference on Multimodal Interaction. ICMI. Retrieved from https:\/\/dl.acm.org\/conference\/icmi-mlmi"},{"key":"e_1_3_2_1_22_1","unstructured":"2023. GPT4. OpenAI. https:\/\/platform.openai.com\/docs\/models\/gpt-4-turbo-and-gpt-4"},{"key":"e_1_3_2_1_23_1","unstructured":"2024. GPT-4o. Retrieved from https:\/\/openai.com\/index\/hello-gpt-4o\/"},{"key":"e_1_3_2_1_24_1","unstructured":"2024. Gemini Flash. Google DeepMind. Retrieved from https:\/\/deepmind.google\/technologies\/gemini\/flash\/"},{"key":"e_1_3_2_1_25_1","unstructured":"J3016_202104: Taxonomy and Definitions for Terms Related to Driving Automation Systems for On-Road Motor Vehicles - SAE International. Retrieved from https:\/\/www.sae.org\/standards\/content\/j3016_202104\/"},{"key":"e_1_3_2_1_26_1","unstructured":"Gemini Ultra. Google DeepMind. https:\/\/deepmind.google\/technologies\/gemini\/ultra\/"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/191666.191703"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41598-023-30938-9"},{"key":"e_1_3_2_1_29_1","volume-title":"Proceedings of the 15th Conference on Creativity and Cognition (pp. 75-87)","author":"Chang M.","year":"2023","unstructured":"Chang, M., Druga, S., Fiannaca, A. J., Vergani, P., Kulkarni, C., Cai, C. J., & Terry, M. (2023, June). The prompt artists. In Proceedings of the 15th Conference on Creativity and Cognition (pp. 75-87)."}],"event":{"name":"ICMI '24: INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"],"location":"San Jose Costa Rica","acronym":"ICMI '24"},"container-title":["Companion Proceedings of the 26th International Conference on Multimodal Interaction"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3686215.3690153","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3686215.3690153","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,15]],"date-time":"2025-10-15T16:21:32Z","timestamp":1760545292000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3686215.3690153"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,4]]},"references-count":29,"alternative-id":["10.1145\/3686215.3690153","10.1145\/3686215"],"URL":"https:\/\/doi.org\/10.1145\/3686215.3690153","relation":{},"subject":[],"published":{"date-parts":[[2024,11,4]]},"assertion":[{"value":"2024-11-04","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}