{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,9]],"date-time":"2026-03-09T23:32:52Z","timestamp":1773099172089,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":68,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,4,21]],"date-time":"2020-04-21T00:00:00Z","timestamp":1587427200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"the Natural Science Foundation of China","award":["61521002 61672314 and 61572276"],"award-info":[{"award-number":["61521002 61672314 and 61572276"]}]},{"name":"the National Key Research and Development Plan","award":["2016YFB1001200"],"award-info":[{"award-number":["2016YFB1001200"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,4,21]]},"DOI":"10.1145\/3313831.3376810","type":"proceedings-article","created":{"date-parts":[[2020,5,27]],"date-time":"2020-05-27T19:28:08Z","timestamp":1590607688000},"page":"1-14","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":23,"title":["FrownOnError: Interrupting Responses from Smart Speakers by Facial Expressions"],"prefix":"10.1145","author":[{"given":"Yukang","family":"Yan","sequence":"first","affiliation":[{"name":"Tsinghua University, Beijing, China"}]},{"given":"Chun","family":"Yu","sequence":"additional","affiliation":[{"name":"Tsinghua University; Ministry of Education, Beijing, China"}]},{"given":"Wengrui","family":"Zheng","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}]},{"given":"Ruining","family":"Tang","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}]},{"given":"Xuhai","family":"Xu","sequence":"additional","affiliation":[{"name":"Tsinghua University, Beijing, China"}]},{"given":"Yuanchun","family":"Shi","sequence":"additional","affiliation":[{"name":"Tsinghua University; Ministry of Education, Beijing, China"}]}],"member":"320","published-online":{"date-parts":[[2020,4,23]]},"reference":[{"key":"e_1_3_2_2_1_1","volume-title":"Retrieved","author":"Echo Amazon","year":"2019","unstructured":"2019a. Amazon Echo. Website. (2019). Retrieved September 3, 2019 from https:\/\/www.amazon.com\/gp\/ help\/customer\/display.html?nodeId=201399130."},{"key":"e_1_3_2_2_2_1","volume-title":"Retrieved December 27th","year":"2019","unstructured":"2019b. Baidu Text-To-Speech online tool. Website. (2019). Retrieved December 27th, 2019 from https:\/\/ai.baidu.com\/tech\/speech\/tts."},{"key":"e_1_3_2_2_3_1","volume-title":"Retrieved","author":"Home Google","year":"2019","unstructured":"2019c. Google Home. Website. (2019). Retrieved September 3, 2019 from https:\/\/store.google.com\/product\/google_home."},{"key":"e_1_3_2_2_4_1","volume-title":"Retrieved December 27th","year":"2019","unstructured":"2019d. Online tutorial of fcal action coding systme. Website. (2019). Retrieved December 27th, 2019 from https:\/\/imotions.com\/blog\/facial-action-coding-system\/."},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/NCVPRIPG.2015.7490026"},{"key":"e_1_3_2_2_6_1","volume-title":"2016 IEEE Winter Conference on Applications of Computer Vision (WACV). IEEE, 1--10","author":"Tadas","year":"2016","unstructured":"Tadas Baltru?aitis, Peter Robinson, and Louis-Philippe Morency. 2016. Openface: an open source facial behavior analysis toolkit. In 2016 IEEE Winter Conference on Applications of Computer Vision (WACV). IEEE, 1--10."},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300473"},{"key":"e_1_3_2_2_8_1","volume-title":"Evaluating user experience in games: Concepts and methods","author":"Bernhaupt Regina","unstructured":"Regina Bernhaupt. 2010. Evaluating user experience in games: Concepts and methods. Springer."},{"key":"e_1_3_2_2_10_1","volume-title":"6th SIGdial workshop on discourse and dialogue.","author":"Bohus Dan","year":"2005","unstructured":"Dan Bohus and Alexander I Rudnicky. 2005. Sorry, I didn't catch that!-An investigation of non-understanding errors and recovery strategies. In 6th SIGdial workshop on discourse and dialogue."},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"publisher","DOI":"10.1007\/978--1--4020--6821--8_6"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300270"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3202185.3202749"},{"key":"e_1_3_2_2_14_1","volume-title":"The State of Speech in HCI: Trends, Themes and Challenges. arXiv preprint arXiv:1810.06828","author":"Clark Leigh","year":"2018","unstructured":"Leigh Clark, Phillip Doyle, Diego Garaialde, Emer Gilmartin, Stephan Schl\u00f6gl, Jens Edlund, Matthew Aylett, Jo\u00e3o Cabral, Cosmin Munteanu, and Benjamin Cowan. 2018. The State of Speech in HCI: Trends, Themes and Challenges. arXiv preprint arXiv:1810.06828 (2018)."},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.92.22.9921"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/3098279.3098539"},{"key":"e_1_3_2_2_17_1","volume-title":"Facial expression and emotion. American psychologist 48, 4","author":"Ekman Paul","year":"1993","unstructured":"Paul Ekman. 1993. Facial expression and emotion. American psychologist 48, 4 (1993), 384."},{"key":"e_1_3_2_2_18_1","volume-title":"Friesen","author":"Ekman Paul","year":"1978","unstructured":"Paul Ekman and Wallace V. Friesen. 1978. Facial action coding system: a technique for the measurement of facial movement."},{"key":"e_1_3_2_2_19_1","volume-title":"Universal facial expressions of emotion","author":"Ekman Paul","year":"1997","unstructured":"Paul Ekman and Dacher Keltner. 1997. Universal facial expressions of emotion. Segerstrale U, P. Molnar P, eds. Nonverbal communication: Where nature meets culture (1997), 27--46."},{"key":"e_1_3_2_2_20_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2016.01.010"},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3242587.3242603"},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2014.2313557"},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/765891.765958"},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1"},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.entcom.2014.04.005"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/2911451.2911521"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3290607.3313062"},{"key":"e_1_3_2_2_28_1","unstructured":"Margarita Kotti Alexandros Papangelis and Yannis Stylianou. 2017. Will this dialogue be unsuccessful? prediction using audio features. (2017)."},{"key":"e_1_3_2_2_29_1","volume-title":"International journal of speech technology 4, 1","author":"Krahmer Emiel","year":"2001","unstructured":"Emiel Krahmer, Marc Swerts, Mariet Theune, and Mieke Weegels. 2001. Error detection in spoken human-machine interaction. International journal of speech technology 4, 1 (2001), 19--30."},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2010.5543264"},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/1501750.1501809"},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/3274371"},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/2556288.2557370"},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/3311823.3311869"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3173577"},{"key":"e_1_3_2_2_36_1","volume-title":"2010 IEEE 11th International Conference on Computer-Aided Industrial Design & Conceptual Design 1","volume":"1","author":"Liu Weiyuan","year":"2010","unstructured":"Weiyuan Liu. 2010. Natural user interface-next mainstream product user interface. In 2010 IEEE 11th International Conference on Computer-Aided Industrial Design & Conceptual Design 1, Vol. 1. IEEE, 203--205."},{"key":"e_1_3_2_2_37_1","volume-title":"Prediction of Dialogue Success with Spectral and Rhythm Acoustic Features Using DNNS and SVMS. In 2018 IEEE Spoken Language Technology Workshop (SLT). IEEE, 838--845","author":"Lykartsis Athanasios","year":"2018","unstructured":"Athanasios Lykartsis, Margarita Kotti, Alexandros Papangelis, and Yannis Stylianou. 2018. Prediction of Dialogue Success with Spectral and Rhythm Acoustic Features Using DNNS and SVMS. In 2018 IEEE Spoken Language Technology Workshop (SLT). IEEE, 838--845."},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/169059.169215"},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/2851581.2890247"},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W15-4647"},{"key":"e_1_3_2_2_41_1","doi-asserted-by":"publisher","DOI":"10.1145\/3132847.3133001"},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3299819.3299840"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2010-206"},{"key":"e_1_3_2_2_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/1690388.1690403"},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/506443.506528"},{"key":"e_1_3_2_2_46_1","volume-title":"Aaron Adler, Krzysztof Z Gajos, Louis-Philippe Morency, and Trevor Darrell.","author":"Oh Alice","year":"2002","unstructured":"Alice Oh, Harold Fox, Max Van Kleek, Aaron Adler, Krzysztof Z Gajos, Louis-Philippe Morency, and Trevor Darrell. 2002b. Evaluating look-to-talk. (2002)."},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7953110"},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3174214"},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00779-011-0470-5"},{"key":"e_1_3_2_2_50_1","unstructured":"David Reitter and Johanna D Moore. 2007. Predicting success in dialogue. (2007)."},{"key":"e_1_3_2_2_51_1","doi-asserted-by":"publisher","DOI":"10.1037\/1528-3542.3.1.68"},{"key":"e_1_3_2_2_52_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2004.11.005"},{"key":"e_1_3_2_2_53_1","unstructured":"Gabriel Skantze and Jens Edlund. 2004. Early error detection on word level. In COST278 and ISCA Tutorial and Research Workshop (ITRW) on Robustness Issues in Conversational Interaction."},{"key":"e_1_3_2_2_54_1","doi-asserted-by":"publisher","DOI":"10.1145\/3173574.3173914"},{"key":"e_1_3_2_2_55_1","doi-asserted-by":"publisher","DOI":"10.1145\/2317956.2318068"},{"key":"e_1_3_2_2_56_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-30120-2_79"},{"key":"e_1_3_2_2_57_1","doi-asserted-by":"publisher","DOI":"10.1145\/3242587.3242599"},{"key":"e_1_3_2_2_58_1","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2006-507"},{"key":"e_1_3_2_2_59_1","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2016.7846319"},{"key":"e_1_3_2_2_60_1","doi-asserted-by":"publisher","DOI":"10.1109\/VSMM.2017.8346263"},{"key":"e_1_3_2_2_61_1","doi-asserted-by":"publisher","DOI":"10.1145\/3152832.3156628"},{"key":"e_1_3_2_2_62_1","volume-title":"Proceedings of the 1st North American chapter of the Association for Computational Linguistics conference. Association for Computational Linguistics, 210--217","author":"Walker Marilyn","year":"2000","unstructured":"Marilyn Walker, Irene Langkilde, Jerry Wright, Allen Gorin, and Diane Litman. 2000. Learning to predict problematic situations in a spoken dialogue system: experiments with how may i help you?. In Proceedings of the 1st North American chapter of the Association for Computational Linguistics conference. Association for Computational Linguistics, 210--217."},{"key":"e_1_3_2_2_63_1","doi-asserted-by":"publisher","DOI":"10.1145\/3229434.3229449"},{"key":"e_1_3_2_2_64_1","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376836"},{"key":"e_1_3_2_2_65_1","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300505"},{"key":"e_1_3_2_2_66_1","doi-asserted-by":"publisher","DOI":"10.1145\/3332165.3347950"},{"key":"e_1_3_2_2_67_1","volume-title":"Smile with Angry Birds: Two Smile-Interface Implementations. In 2018 Nicograph International (NicoInt)","author":"Yang Changeun","unstructured":"Changeun Yang, Yuxuan Jiang, Pujana Paliyawan, Tomohiro Harada, and Ruck Thawonmas. 2018. Smile with Angry Birds: Two Smile-Interface Implementations. In 2018 Nicograph International (NicoInt). IEEE, 80--80."},{"key":"e_1_3_2_2_68_1","volume-title":"Thirteenth Symposium on Usable Privacy and Security ({SOUPS}","author":"Zeng Eric","year":"2017","unstructured":"Eric Zeng, Shrirang Mare, and Franziska Roesner. 2017. End user security and privacy concerns with smart homes. In Thirteenth Symposium on Usable Privacy and Security ({SOUPS} 2017). 65--80."},{"key":"e_1_3_2_2_69_1","volume-title":"Proceedings of AAAI Fall Symposium on Psychological Models of Communication in Collaborative Systems. 132--139","author":"Zollo Teresa","year":"1999","unstructured":"Teresa Zollo. 1999. A study of human dialogue strategies in the presence of speech recognition errors. In Proceedings of AAAI Fall Symposium on Psychological Models of Communication in Collaborative Systems. 132--139."}],"event":{"name":"CHI '20: CHI Conference on Human Factors in Computing Systems","location":"Honolulu HI USA","acronym":"CHI '20","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"]},"container-title":["Proceedings of the 2020 CHI Conference on Human Factors in Computing Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3313831.3376810","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3313831.3376810","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T22:32:47Z","timestamp":1750199567000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3313831.3376810"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,4,21]]},"references-count":68,"alternative-id":["10.1145\/3313831.3376810","10.1145\/3313831"],"URL":"https:\/\/doi.org\/10.1145\/3313831.3376810","relation":{},"subject":[],"published":{"date-parts":[[2020,4,21]]},"assertion":[{"value":"2020-04-23","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}