{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,15]],"date-time":"2026-04-15T18:08:32Z","timestamp":1776276512393,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":62,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,5,11]],"date-time":"2024-05-11T00:00:00Z","timestamp":1715385600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,5,11]]},"DOI":"10.1145\/3613904.3641904","type":"proceedings-article","created":{"date-parts":[[2024,5,11]],"date-time":"2024-05-11T08:39:12Z","timestamp":1715416752000},"page":"1-18","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":30,"title":["RELIC: Investigating Large Language Model Responses using Self-Consistency"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2329-6126","authenticated-orcid":false,"given":"Furui","family":"Cheng","sequence":"first","affiliation":[{"name":"ETH Z\u00fcrich, Switzerland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9874-2069","authenticated-orcid":false,"given":"Vil\u00e9m","family":"Zouhar","sequence":"additional","affiliation":[{"name":"ETH Z\u00fcrich, Switzerland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-7044-4689","authenticated-orcid":false,"given":"Simran","family":"Arora","sequence":"additional","affiliation":[{"name":"Stanford University, United States"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8787-8681","authenticated-orcid":false,"given":"Mrinmaya","family":"Sachan","sequence":"additional","affiliation":[{"name":"ETH Z\u00fcrich, Switzerland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8995-1683","authenticated-orcid":false,"given":"Hendrik","family":"Strobelt","sequence":"additional","affiliation":[{"name":"IBM Research AI, United States"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8526-2613","authenticated-orcid":false,"given":"Mennatallah","family":"El-Assady","sequence":"additional","affiliation":[{"name":"ETH Z\u00fcrich, Switzerland"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2024,5,11]]},"reference":[{"key":"e_1_3_3_2_1_1","volume-title":"Proceedings of the 2021 AAAI\/ACM Conference on AI, Ethics, and Society. 401\u2013413","author":"Bhatt Umang","unstructured":"Umang Bhatt, Javier Antor\u00e1n, Yunfeng Zhang, Q\u00a0Vera Liao, Prasanna Sattigeri, Riccardo Fogliato, Gabrielle Melan\u00e7on, Ranganath Krishnan, Jason Stanley, Omesh Tickoo, Uncertainty as a form of transparency: Measuring, communicating, and using uncertainty. In Proceedings of the 2021 AAAI\/ACM Conference on AI, Ethics, and Society. 401\u2013413."},{"key":"e_1_3_3_2_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2011.185"},{"key":"e_1_3_3_2_3_1","volume-title":"Polyphony: an Interactive Transfer Learning Framework for Single-Cell Data Analysis","author":"Cheng Furui","year":"2022","unstructured":"Furui Cheng, Mark\u00a0S Keller, Huamin Qu, Nils Gehlenborg, and Qianwen Wang. 2022. Polyphony: an Interactive Transfer Learning Framework for Single-Cell Data Analysis. IEEE transactions on visualization and computer graphics 29, 1 (2022), 591\u2013601."},{"key":"e_1_3_3_2_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2021.3114836"},{"key":"e_1_3_3_2_5_1","doi-asserted-by":"crossref","unstructured":"Ruijia Cheng Alison Smith-Renner Ke Zhang Joel Tetreault and Alejandro Jaimes-Larrarte. Mapping the Design Space of Human-AI Interaction in Text Summarization. In Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 431\u2013455.","DOI":"10.18653\/v1\/2022.naacl-main.33"},{"key":"e_1_3_3_2_6_1","doi-asserted-by":"publisher","DOI":"10.2196\/47184"},{"key":"e_1_3_3_2_7_1","volume-title":"Daniel Buschek. Beyond Text Generation: Supporting Writers with Continuous Automatic Text Summaries. In Proceedings of the 35th Annual ACM Symposium on User Interface Software and Technology","author":"Dang Hai","unstructured":"Hai Dang, Karim Benharrak, Florian Lehmann, and Daniel Buschek. Beyond Text Generation: Supporting Writers with Continuous Automatic Text Summaries. In Proceedings of the 35th Annual ACM Symposium on User Interface Software and Technology (Bend, OR, USA) (UIST \u201922). Article 98, 13\u00a0pages."},{"key":"e_1_3_3_2_8_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2022.103219"},{"key":"e_1_3_3_2_9_1","unstructured":"Zijian Ding and Joel Chan. 2023. Mapping the Design Space of Interactions in Human-AI Text Co-creation Tasks. arxiv:2303.06430"},{"key":"e_1_3_3_2_10_1","volume-title":"Improving Factuality and Reasoning in Language Models through Multiagent Debate. arXiv preprint arXiv:2305.14325","author":"Du Yilun","year":"2023","unstructured":"Yilun Du, Shuang Li, Antonio Torralba, Joshua\u00a0B Tenenbaum, and Igor Mordatch. 2023. Improving Factuality and Reasoning in Language Models through Multiagent Debate. arXiv preprint arXiv:2305.14325 (2023)."},{"key":"e_1_3_3_2_11_1","unstructured":"Tao Fang Shu Yang Kaixin Lan Derek\u00a0F. Wong Jinpeng Hu Lidia\u00a0S. Chao and Yue Zhang. 2023. Is ChatGPT a Highly Fluent Grammatical Error Correction System? A Comprehensive Evaluation. arxiv:2304.01746"},{"key":"e_1_3_3_2_12_1","doi-asserted-by":"crossref","unstructured":"Patrick Fernandes Aman Madaan Emmy Liu Ant\u00f3nio Farinhas Pedro\u00a0Henrique Martins Amanda Bertsch Jos\u00e9\u00a0GC de Souza Shuyan Zhou Tongshuang Wu Graham Neubig 2023. Bridging the gap: A survey on integrating (human) feedback for natural language generation. arxiv:2305.00955","DOI":"10.1162\/tacl_a_00626"},{"key":"e_1_3_3_2_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2014.2346435"},{"key":"e_1_3_3_2_14_1","volume-title":"CRITIC: Large language models can self-correct with tool-interactive critiquing. arxiv:2305.11738","author":"Gou Zhibin","year":"2023","unstructured":"Zhibin Gou, Zhihong Shao, Yeyun Gong, Yelong Shen, Yujiu Yang, Nan Duan, and Weizhu Chen. 2023. CRITIC: Large language models can self-correct with tool-interactive critiquing. arxiv:2305.11738"},{"key":"e_1_3_3_2_15_1","volume-title":"Weizhu Chen. DeBERTa: Decoding-Ehanced BERT with Disentangled Attention. In International Conference on Learning Representations.","author":"He Pengcheng","unstructured":"Pengcheng He, Xiaodong Liu, Jianfeng Gao, and Weizhu Chen. DeBERTa: Decoding-Ehanced BERT with Disentangled Attention. In International Conference on Learning Representations."},{"key":"e_1_3_3_2_16_1","unstructured":"Matthew Honnibal Ines Montani Sofie\u00a0Van Landeghem and Adriane Boyd. 2020. spaCy: Industrial-strength Natural Language Processing in Python. Explosion. https:\/\/github.com\/explosion\/spaCy"},{"key":"e_1_3_3_2_17_1","unstructured":"Daphne Ippolito Ann Yuan Andy Coenen and Sehmon Burnam. 2022. Creative Writing with an AI-Powered Writing Assistant: Perspectives from Professional Writers. arxiv:2211.05030"},{"key":"e_1_3_3_2_18_1","volume-title":"Article 248","author":"Ji Ziwei","year":"2023","unstructured":"Ziwei Ji, Nayeon Lee, Rita Frieske, Tiezheng Yu, Dan Su, Yan Xu, Etsuko Ishii, Ye\u00a0Jin Bang, Andrea Madotto, and Pascale Fung. 2023. Survey of Hallucination in Natural Language Generation. ACM Comput. Surv. 55, 12, Article 248 (2023), 38\u00a0pages."},{"key":"e_1_3_3_2_19_1","volume-title":"CHI Conference on Human Factors in Computing Systems Extended Abstracts. 1\u20138.","author":"Jiang Ellen","unstructured":"Ellen Jiang, Kristen Olson, Edwin Toh, Alejandra Molina, Aaron Donsbach, Michael Terry, and Carrie\u00a0J Cai. Promptmaker: Prompt-based prototyping with large language models. In CHI Conference on Human Factors in Computing Systems Extended Abstracts. 1\u20138."},{"key":"e_1_3_3_2_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3586183.3606737"},{"key":"e_1_3_3_2_21_1","doi-asserted-by":"publisher","DOI":"10.5555\/3618408.3619049"},{"key":"e_1_3_3_2_22_1","volume-title":"Sebastian Farquhar. Semantic Uncertainty: Linguistic Invariances for Uncertainty Estimation in Natural Language Generation. In The Eleventh International Conference on Learning Representations.","author":"Kuhn Lorenz","unstructured":"Lorenz Kuhn, Yarin Gal, and Sebastian Farquhar. Semantic Uncertainty: Linguistic Invariances for Uncertainty Estimation in Natural Language Generation. In The Eleventh International Conference on Learning Representations."},{"key":"e_1_3_3_2_23_1","volume-title":"Proceedings of the 2022 CHI conference on human factors in computing systems. 1\u201319","author":"Lee Mina","unstructured":"Mina Lee, Percy Liang, and Qian Yang. Coauthor: Designing a human-ai collaborative writing dataset for exploring language model capabilities. In Proceedings of the 2022 CHI conference on human factors in computing systems. 1\u201319."},{"key":"e_1_3_3_2_24_1","volume-title":"Tim Rockt\u00e4schel, Sebastian Riedel, and Douwe Kiela.","author":"Lewis Patrick","year":"2021","unstructured":"Patrick Lewis, Ethan Perez, Aleksandra Piktus, Fabio Petroni, Vladimir Karpukhin, Naman Goyal, Heinrich K\u00fcttler, Mike Lewis, Wen tau Yih, Tim Rockt\u00e4schel, Sebastian Riedel, and Douwe Kiela. 2021. Retrieval-Augmented Generation for Knowledge-Intensive NLP Tasks. arxiv:2005.11401"},{"key":"e_1_3_3_2_25_1","doi-asserted-by":"crossref","unstructured":"Q\u00a0Vera Liao and Jennifer\u00a0Wortman Vaughan. 2023. AI Transparency in the Age of LLMs: A Human-Centered Research Roadmap. arxiv:2306.01941","DOI":"10.1162\/99608f92.8036d03b"},{"key":"e_1_3_3_2_26_1","volume-title":"The mythos of model interpretability: In machine learning, the concept of interpretability is both important and slippery.Queue 16, 3","author":"Lipton C","year":"2018","unstructured":"Zachary\u00a0C Lipton. 2018. The mythos of model interpretability: In machine learning, the concept of interpretability is both important and slippery.Queue 16, 3 (2018), 31\u201357."},{"key":"e_1_3_3_2_27_1","volume-title":"RoBERTa: A Robustly Optimized BERT Pretraining Approach. CoRR","author":"Liu Yinhan","year":"2019","unstructured":"Yinhan Liu, Myle Ott, Naman Goyal, Jingfei Du, Mandar Joshi, Danqi Chen, Omer Levy, Mike Lewis, Luke Zettlemoyer, and Veselin Stoyanov. 2019. RoBERTa: A Robustly Optimized BERT Pretraining Approach. CoRR (2019)."},{"key":"e_1_3_3_2_28_1","volume-title":"\u00a0F. Gales","author":"Manakul Potsawee","year":"2023","unstructured":"Potsawee Manakul, Adian Liusie, and Mark J.\u00a0F. Gales. 2023. SelfCheckGPT: Zero-Resource Black-Box Hallucination Detection for Generative Large Language Models. arxiv:2303.08896"},{"key":"e_1_3_3_2_29_1","volume-title":"Pang\u00a0Wei Koh, Mohit Iyyer, Luke Zettlemoyer, and Hannaneh Hajishirzi.","author":"Min Sewon","year":"2023","unstructured":"Sewon Min, Kalpesh Krishna, Xinxi Lyu, Mike Lewis, Wen tau Yih, Pang\u00a0Wei Koh, Mohit Iyyer, Luke Zettlemoyer, and Hannaneh Hajishirzi. 2023. FActScore: Fine-grained Atomic Evaluation of Factual Precision in Long Form Text Generation. arxiv:2305.14251"},{"key":"e_1_3_3_2_30_1","volume-title":"ProtoSteer: Steering Deep Sequence Model with Prototypes","author":"Ming Yao","year":"2019","unstructured":"Yao Ming, Panpan Xu, Furui Cheng, Huamin Qu, and Liu Ren. 2019. ProtoSteer: Steering Deep Sequence Model with Prototypes. IEEE transactions on visualization and computer graphics 26, 1 (2019), 238\u2013248."},{"key":"e_1_3_3_2_31_1","unstructured":"Niels M\u00fcndler Jingxuan He Slobodan Jenko and Martin Vechev. 2023. Self-contradictory Hallucinations of Large Language Models: Evaluation Detection and Mitigation. arxiv:2305.15852"},{"key":"e_1_3_3_2_32_1","volume-title":"Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems. 1\u201316","author":"Petridis Savvas","unstructured":"Savvas Petridis, Nicholas Diakopoulos, Kevin Crowston, Mark Hansen, Keren Henderson, Stan Jastrzebski, Jeffrey\u00a0V Nickerson, and Lydia\u00a0B Chilton. Anglekindling: Supporting journalistic angle ideation with large language models. In Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems. 1\u201316."},{"key":"e_1_3_3_2_33_1","doi-asserted-by":"publisher","DOI":"10.1038\/s42256-023-00726-1"},{"key":"e_1_3_3_2_34_1","volume-title":"Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining. 1135\u20131144","author":"Ribeiro Marco\u00a0Tulio","unstructured":"Marco\u00a0Tulio Ribeiro, Sameer Singh, and Carlos Guestrin. \"Why should i trust you?\" Explaining the predictions of any classifier. In Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining. 1135\u20131144."},{"key":"e_1_3_3_2_35_1","first-page":"1178","article-title":"Visual comparison of language model adaptation","volume":"29","author":"Sevastjanova Rita","year":"2022","unstructured":"Rita Sevastjanova, Eren Cakmak, Shauli Ravfogel, Ryan Cotterell, and Mennatallah El-Assady. 2022. Visual comparison of language model adaptation. IEEE Transactions on Visualization and Computer Graphics 29, 1 (2022), 1178\u20131188.","journal-title":"IEEE Transactions on Visualization and Computer Graphics"},{"key":"e_1_3_3_2_36_1","unstructured":"Rita Sevastjanova and Mennatallah El-Assady. 2022. Beware the rationalization trap! when language model explainability diverges from our mental models of language. arxiv:2207.06897"},{"key":"e_1_3_3_2_37_1","volume-title":"Computer Graphics Forum","author":"Sevastjanova Rita","unstructured":"Rita Sevastjanova, A Kalouli, Christin Beck, Hanna Hauptmann, and Mennatallah El-Assady. LMFingerprints: Visual explanations of language model embedding spaces through layerwise contextualization scores. In Computer Graphics Forum. Wiley Online Library, 295\u2013307."},{"key":"e_1_3_3_2_38_1","first-page":"1064","article-title":"explAIner: A visual analytics framework for interactive and explainable machine learning","volume":"26","author":"Spinner Thilo","year":"2019","unstructured":"Thilo Spinner, Udo Schlegel, Hanna Sch\u00e4fer, and Mennatallah El-Assady. 2019. explAIner: A visual analytics framework for interactive and explainable machine learning. IEEE Transactions on Visualization and computer graphics 26, 1 (2019), 1064\u20131074.","journal-title":"IEEE Transactions on Visualization and computer graphics"},{"key":"e_1_3_3_2_39_1","volume-title":"Seq2seq-vis: A visual debugging tool for sequence-to-sequence models","author":"Strobelt Hendrik","year":"2018","unstructured":"Hendrik Strobelt, Sebastian Gehrmann, Michael Behrisch, Adam Perer, Hanspeter Pfister, and Alexander\u00a0M Rush. 2018. Seq2seq-vis: A visual debugging tool for sequence-to-sequence models. IEEE transactions on visualization and computer graphics 25, 1 (2018), 353\u2013363."},{"key":"e_1_3_3_2_40_1","volume-title":"Lstmvis: A tool for visual analysis of hidden state dynamics in recurrent neural networks","author":"Strobelt Hendrik","year":"2017","unstructured":"Hendrik Strobelt, Sebastian Gehrmann, Hanspeter Pfister, and Alexander\u00a0M Rush. 2017. Lstmvis: A tool for visual analysis of hidden state dynamics in recurrent neural networks. IEEE transactions on visualization and computer graphics 24, 1 (2017), 667\u2013676."},{"key":"e_1_3_3_2_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2022.3209479"},{"key":"e_1_3_3_2_42_1","volume-title":"Haijun Xia. Sensecape: Enabling Multilevel Exploration and Sensemaking with Large Language Models. In Proceedings of the 36th Annual ACM Symposium on User Interface Software and Technology(UIST \u201923)","author":"Suh Sangho","unstructured":"Sangho Suh, Bryan Min, Srishti Palani, and Haijun Xia. Sensecape: Enabling Multilevel Exploration and Sensemaking with Large Language Models. In Proceedings of the 36th Annual ACM Symposium on User Interface Software and Technology(UIST \u201923). Article 1, 18\u00a0pages."},{"key":"e_1_3_3_2_43_1","volume-title":"Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations. 107\u2013118","author":"Tenney Ian","unstructured":"Ian Tenney, James Wexler, Jasmijn Bastings, Tolga Bolukbasi, Andy Coenen, Sebastian Gehrmann, Ellen Jiang, Mahima Pushkarna, Carey Radebaugh, Emily Reif, The Language Interpretability Tool: Extensible, Interactive Visualizations and Analysis for NLP Models. In Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations. 107\u2013118."},{"key":"e_1_3_3_2_44_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1"},{"key":"e_1_3_3_2_45_1","volume-title":"Fine-tuning Language Models for Factuality. arXiv preprint arXiv:2311.08401","author":"Tian Katherine","year":"2023","unstructured":"Katherine Tian, Eric Mitchell, Huaxiu Yao, Christopher\u00a0D Manning, and Chelsea Finn. 2023. Fine-tuning Language Models for Factuality. arXiv preprint arXiv:2311.08401 (2023)."},{"key":"e_1_3_3_2_46_1","volume-title":"Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processin.","author":"Wallace Eric","unstructured":"Eric Wallace, Yizhong Wang, Sujian Li, and Sameer\u00a0Singh andMatt Gardner. Do NLP Models Know Numbers? Probing Numeracy in Embeddings. In Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processin."},{"key":"e_1_3_3_2_47_1","volume-title":"Survey on factuality in large language models: Knowledge, retrieval and domain-specificity. arXiv preprint arXiv:2310.07521","author":"Wang Cunxiang","year":"2023","unstructured":"Cunxiang Wang, Xiaoze Liu, Yuanhao Yue, Xiangru Tang, Tianhang Zhang, Cheng Jiayang, Yunzhi Yao, Wenyang Gao, Xuming Hu, Zehan Qi, 2023. Survey on factuality in large language models: Knowledge, retrieval and domain-specificity. arXiv preprint arXiv:2310.07521 (2023)."},{"key":"e_1_3_3_2_48_1","volume-title":"Proceedings of the 2019 CHI conference on human factors in computing systems. 1\u201315","author":"Wang Danding","unstructured":"Danding Wang, Qian Yang, Ashraf Abdul, and Brian\u00a0Y Lim. Designing theory-driven user-centric explainable AI. In Proceedings of the 2019 CHI conference on human factors in computing systems. 1\u201315."},{"key":"e_1_3_3_2_49_1","volume-title":"Denny Zhou. Self-Consistency Improves Chain of Thought Reasoning in Language Models. In The Eleventh International Conference on Learning Representations.","author":"Wang Xuezhi","unstructured":"Xuezhi Wang, Jason Wei, Dale Schuurmans, Quoc\u00a0V Le, Ed\u00a0H. Chi, Sharan Narang, Aakanksha Chowdhery, and Denny Zhou. Self-Consistency Improves Chain of Thought Reasoning in Language Models. In The Eleventh International Conference on Learning Representations."},{"key":"e_1_3_3_2_50_1","first-page":"24824","article-title":"Chain-of-thought prompting elicits reasoning in large language models","volume":"35","author":"Wei Jason","year":"2022","unstructured":"Jason Wei, Xuezhi Wang, Dale Schuurmans, Maarten Bosma, Fei Xia, Ed Chi, Quoc\u00a0V Le, Denny Zhou, 2022. Chain-of-thought prompting elicits reasoning in large language models. Advances in Neural Information Processing Systems 35 (2022), 24824\u201324837.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_3_2_51_1","volume-title":"CHI Conference on Human Factors in Computing Systems Extended Abstracts. 1\u201310","author":"Wu Tongshuang","unstructured":"Tongshuang Wu, Ellen Jiang, Aaron Donsbach, Jeff Gray, Alejandra Molina, Michael Terry, and Carrie\u00a0J Cai. Promptchainer: Chaining large language model prompts through visual programming. In CHI Conference on Human Factors in Computing Systems Extended Abstracts. 1\u201310."},{"key":"e_1_3_3_2_52_1","volume-title":"Proceedings of the 2022 CHI conference on human factors in computing systems. 1\u201322","author":"Wu Tongshuang","unstructured":"Tongshuang Wu, Michael Terry, and Carrie\u00a0Jun Cai. AI chains: Transparent and controllable human-AI interaction by chaining large language model prompts. In Proceedings of the 2022 CHI conference on human factors in computing systems. 1\u201322."},{"key":"e_1_3_3_2_53_1","volume-title":"Joint Proceedings of the ACM IUI Workshops, Vol.\u00a010","author":"Yang Daijin","unstructured":"Daijin Yang, Yanpeng Zhou, Zhiyuan Zhang, Toby Jia-Jun Li, and Ray LC. AI as an Active Writer: Interaction strategies with generated text in human-AI collaborative fiction writing. In Joint Proceedings of the ACM IUI Workshops, Vol.\u00a010."},{"key":"e_1_3_3_2_54_1","volume-title":"Mo Yu, and Ying Xu.","author":"Yao Bingsheng","year":"2021","unstructured":"Bingsheng Yao, Dakuo Wang, Tongshuang Wu, Zheng Zhang, Toby Jia-Jun Li, Mo Yu, and Ying Xu. 2021. It is AI\u2019s Turn to Ask Humans a Question: Question-Answer Pair Generation for Children\u2019s Story Books. arxiv:2109.03423"},{"key":"e_1_3_3_2_55_1","unstructured":"Shunyu Yao Dian Yu Jeffrey Zhao Izhak Shafran Thomas\u00a0L. Griffiths Yuan Cao and Karthik Narasimhan. 2023. Tree of Thoughts: Deliberate Problem Solving with Large Language Models. arxiv:2305.10601\u00a0[cs.CL]"},{"key":"e_1_3_3_2_56_1","unstructured":"Xiaozhe Yao. 2023. Open Compute Framework: Peer-to-Peer Task Queue for Foundation Model Inference Serving. AutoAI. https:\/\/github.com\/autoai-org\/OpenComputeFramework"},{"key":"e_1_3_3_2_57_1","volume-title":"Daphne Ippolito. Wordcraft: Story Writing With Large Language Models. In 27th International Conference on Intelligent User Interfaces","author":"Yuan Ann","unstructured":"Ann Yuan, Andy Coenen, Emily Reif, and Daphne Ippolito. Wordcraft: Story Writing With Large Language Models. In 27th International Conference on Intelligent User Interfaces (Helsinki, Finland) (IUI \u201922). 841\u2013852."},{"key":"e_1_3_3_2_58_1","volume-title":"Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems. 1\u201321","author":"Zamfirescu-Pereira JD","unstructured":"JD Zamfirescu-Pereira, Richmond\u00a0Y Wong, Bjoern Hartmann, and Qian Yang. Why Johnny can\u2019t prompt: How non-AI experts try (and fail) to design LLM prompts. In Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems. 1\u201321."},{"key":"e_1_3_3_2_59_1","volume-title":"Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processin","author":"Q.","year":"2021","unstructured":"Michael\u00a0J.Q. Zhang and Eunsol Choi. 2021. Situatedqa: Incorporating extra-linguistic contexts into QA. Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processin (2021)."},{"key":"e_1_3_3_2_60_1","volume-title":"Siren\u2019s Song in the AI Ocean: A Survey on Hallucination in Large Language Models. arXiv preprint arXiv:2309.01219","author":"Zhang Yue","year":"2023","unstructured":"Yue Zhang, Yafu Li, Leyang Cui, Deng Cai, Lemao Liu, Tingchen Fu, Xinting Huang, Enbo Zhao, Yu Zhang, Yulong Chen, Longyue Wang, Anh\u00a0Tuan Luu, Wei Bi, Freda Shi, and Shuming Shi. 2023. Siren\u2019s Song in the AI Ocean: A Survey on Hallucination in Large Language Models. arXiv preprint arXiv:2309.01219 (2023)."},{"key":"e_1_3_3_2_61_1","volume-title":"Conference on Fairness, Accountability, and Transparency Barcelona, Spain","author":"Zhang Yunfeng","year":"2020","unstructured":"Yunfeng Zhang, Q.\u00a0Vera Liao, and Rachel K.\u00a0E. Bellamy. Effect of confidence and explanation on accuracy and trust calibration in AI-assisted decision making. In FAT* \u201920: Conference on Fairness, Accountability, and Transparency Barcelona, Spain, January 27-30, 2020, Mireille Hildebrandt, Carlos Castillo, L.\u00a0Elisa Celis, Salvatore Ruggieri, Linnet Taylor, and Gabriela Zanfir-Fortuna (Eds.). 295\u2013305."},{"key":"e_1_3_3_2_62_1","volume-title":"Not Quality. In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 151\u2013161","author":"Zouhar Vil\u00e9m","unstructured":"Vil\u00e9m Zouhar, Michal Nov\u00e1k, Mat\u00fa\u0161 \u017dilinec, Ond\u0159ej Bojar, Mateo Obreg\u00f3n, Robin\u00a0L. Hill, Fr\u00e9d\u00e9ric Blain, Marina Fomicheva, Lucia Specia, and Lisa Yankovskaya. Backtranslation Feedback Improves User Confidence in MT, Not Quality. In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 151\u2013161."}],"event":{"name":"CHI '24: CHI Conference on Human Factors in Computing Systems","location":"Honolulu HI USA","acronym":"CHI '24","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction","SIGACCESS ACM Special Interest Group on Accessible Computing"]},"container-title":["Proceedings of the CHI Conference on Human Factors in Computing Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3613904.3641904","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3613904.3641904","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T23:57:28Z","timestamp":1750291048000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3613904.3641904"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,11]]},"references-count":62,"alternative-id":["10.1145\/3613904.3641904","10.1145\/3613904"],"URL":"https:\/\/doi.org\/10.1145\/3613904.3641904","relation":{},"subject":[],"published":{"date-parts":[[2024,5,11]]},"assertion":[{"value":"2024-05-11","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}