{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,4]],"date-time":"2026-03-04T03:36:51Z","timestamp":1772595411118,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":62,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,4,25]],"date-time":"2025-04-25T00:00:00Z","timestamp":1745539200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"University of Texas at Austin University Graduate Continuing Fellowship","award":[""],"award-info":[{"award-number":[""]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,4,26]]},"DOI":"10.1145\/3706599.3719821","type":"proceedings-article","created":{"date-parts":[[2025,4,23]],"date-time":"2025-04-23T20:20:42Z","timestamp":1745439642000},"page":"1-11","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":3,"title":["Can Large Language Models Grasp Abstract Visual Concepts in Videos? A Case Study on YouTube Shorts about Depression"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5398-1485","authenticated-orcid":false,"given":"Jiaying \"Lizzy\"","family":"Liu","sequence":"first","affiliation":[{"name":"School of Information, University of Texas at Austin, Austin, Texas, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-8021-429X","authenticated-orcid":false,"given":"Yiheng","family":"Su","sequence":"additional","affiliation":[{"name":"Artificial Intelligence and Human-Centered Computing (AI&amp;HCC) Lab, The University of Texas at Austin, Austin, Texas, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-4665-0776","authenticated-orcid":false,"given":"Praneel","family":"Seth","sequence":"additional","affiliation":[{"name":"Computer Science Department, University of Texas at Austin, Austin, Texas, USA"}]}],"member":"320","published-online":{"date-parts":[[2025,4,25]]},"reference":[{"key":"e_1_3_3_2_2_2","unstructured":"Dana Alsagheer Rabimba Karanjai Weidong Shi Nour Diallo Yang Lu Suha Beydoun and Qiaoning Zhang. 2024. Evaluating Irrationality in Large Language Models and Open Research Questions. (2024)."},{"key":"e_1_3_3_2_3_2","doi-asserted-by":"publisher","DOI":"10.1145\/3027063.3027137"},{"key":"e_1_3_3_2_4_2","doi-asserted-by":"publisher","DOI":"10.1145\/2998181.2998243"},{"key":"e_1_3_3_2_5_2","first-page":"9","volume-title":"Proceedings of the 1st Workshop on Computational Humor (CHum)","author":"Baluja Ashwin","year":"2025","unstructured":"Ashwin Baluja. 2025. Text Is Not All You Need: Multimodal Prompting Helps LLMs Understand Humor. In Proceedings of the 1st Workshop on Computational Humor (CHum), Christian\u00a0F. Hempelmann, Julia Rayz, Tiansi Dong, and Tristan Miller (Eds.). Association for Computational Linguistics, Online, 9\u201317. https:\/\/aclanthology.org\/2025.chum-1.2\/"},{"key":"e_1_3_3_2_6_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3581107"},{"key":"e_1_3_3_2_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3581107"},{"key":"e_1_3_3_2_8_2","doi-asserted-by":"publisher","DOI":"10.5555\/2390948.2391058"},{"key":"e_1_3_3_2_9_2","doi-asserted-by":"crossref","unstructured":"Virginia Braun and Victoria Clarke. 2006. Using thematic analysis in psychology. Qualitative research in psychology 3 2 (2006) 77\u2013101.","DOI":"10.1191\/1478088706qp063oa"},{"key":"e_1_3_3_2_10_2","doi-asserted-by":"publisher","unstructured":"Yupeng Chang Xu Wang Jindong Wang Yuan Wu Linyi Yang Kaijie Zhu Hao Chen Xiaoyuan Yi Cunxiang Wang Yidong Wang Wei Ye Yue Zhang Yi Chang Philip\u00a0S. Yu Qiang Yang and Xing Xie. 2024. A Survey on Evaluation of Large Language Models. ACM Trans. Intell. Syst. Technol. 15 3 Article 39 (mar 2024) 45\u00a0pages. 10.1145\/3641289","DOI":"10.1145\/3641289"},{"key":"e_1_3_3_2_11_2","unstructured":"Xiang Chen Chenxi Wang Yida Xue Ningyu Zhang Xiaoyan Yang Qiang Li Yue Shen Lei Liang Jinjie Gu and Huajun Chen. 2024. Unified Hallucination Detection for Multimodal Large Language Models. arxiv:https:\/\/arXiv.org\/abs\/2402.03190\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2402.03190"},{"key":"e_1_3_3_2_12_2","doi-asserted-by":"publisher","unstructured":"Robert Chew John Bollenbacher Michael Wenger Jessica Speer and Annice Kim. 2023. LLM-Assisted Content Analysis: Using Large Language Models to Support Deductive Coding. 10.48550\/arXiv.2306.14924 Issue: arXiv:https:\/\/arXiv.org\/abs\/2306.14924 arXiv:2306.14924 [cs stat].","DOI":"10.48550\/arXiv.2306.14924"},{"key":"e_1_3_3_2_13_2","unstructured":"Munmun\u00a0De Choudhury and Sushovan De. 2014. Mental Health Discourse on reddit: Self-Disclosure Social Support and Anonymity. (May 2014). https:\/\/www.scinapse.io\/papers\/2182854643"},{"key":"e_1_3_3_2_14_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.64"},{"key":"e_1_3_3_2_15_2","volume-title":"Content Analysis","author":"Drisko James\u00a0W.","year":"2016","unstructured":"James\u00a0W. Drisko and Tina Maschi. 2016. Content Analysis. Oxford University Press. Google-Books-ID: 07GYCgAAQBAJ."},{"key":"e_1_3_3_2_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300495"},{"key":"e_1_3_3_2_17_2","doi-asserted-by":"publisher","DOI":"10.1145\/3593013.3593989"},{"key":"e_1_3_3_2_18_2","doi-asserted-by":"publisher","DOI":"10.1145\/3584931.3607500"},{"key":"e_1_3_3_2_19_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642139"},{"key":"e_1_3_3_2_20_2","unstructured":"Zeyu Han Chao Gao Jinyang Liu Jeff Zhang and Sai\u00a0Qian Zhang. 2024. Parameter-efficient fine-tuning for large models: A comprehensive survey. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.14608 (2024)."},{"key":"e_1_3_3_2_21_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01282"},{"key":"e_1_3_3_2_22_2","doi-asserted-by":"publisher","unstructured":"Sungeun Hong Jongbin Ryu Woobin Im and Hyun\u00a0S. Yang. 2018. D3: Recognizing dynamic scenes with deep dual descriptor based on key frames and key segments. Neurocomputing 273 (2018) 611\u2013621. 10.1016\/j.neucom.2017.08.046","DOI":"10.1016\/j.neucom.2017.08.046"},{"key":"e_1_3_3_2_23_2","doi-asserted-by":"publisher","DOI":"10.1109\/BIBM58861.2023.10385590"},{"key":"e_1_3_3_2_24_2","first-page":"47166","volume-title":"Advances in Neural Information Processing Systems","volume":"37","author":"Hu Zhe","year":"2024","unstructured":"Zhe Hu, Tuo Liang, Jing Li, Yiren Lu, Yunlai Zhou, Yiran Qiao, Jing Ma, and Yu Yin. 2024. Cracking the Code of Juxtaposition: Can AI Models Understand the Humorous Contradictions. In Advances in Neural Information Processing Systems , A.\u00a0Globerson, L.\u00a0Mackey, D.\u00a0Belgrave, A.\u00a0Fan, U.\u00a0Paquet, J.\u00a0Tomczak, and C.\u00a0Zhang (Eds.), Vol.\u00a037. Curran Associates, Inc., 47166\u201347188. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2024\/file\/540a6eefb60428c8547a27253f9a2a59-Paper-Conference.pdf"},{"key":"e_1_3_3_2_25_2","doi-asserted-by":"publisher","unstructured":"Jina Huh Leslie\u00a0S. Liu Tina Neogi Kori Inkpen and Wanda Pratt. 2014. Health Vlogs as Social Support for Chronic Illness Management. ACM Trans. Comput.-Hum. Interact. 21 4 (Aug. 2014) 23:1\u201323:31. 10.1145\/2630067","DOI":"10.1145\/2630067"},{"key":"e_1_3_3_2_26_2","doi-asserted-by":"publisher","unstructured":"Margot Kelly-Hedrick Paul\u00a0H. Grunberg Felicia Brochu and Phyllis Zelkowitz. 2018. \"It\u2019s Totally Okay to Be Sad but Never Lose Hope\": Content Analysis of Infertility-Related Videos on YouTube in Relation to Viewer Preferences. Journal of Medical Internet Research 20 5 (May 2018) e10199. 10.2196\/10199 Number: 5.","DOI":"10.2196\/10199"},{"key":"e_1_3_3_2_27_2","first-page":"22199","volume-title":"Advances in Neural Information Processing Systems","volume":"35","author":"Kojima Takeshi","year":"2022","unstructured":"Takeshi Kojima, Shixiang\u00a0(Shane) Gu, Machel Reid, Yutaka Matsuo, and Yusuke Iwasawa. 2022. Large Language Models are Zero-Shot Reasoners. In Advances in Neural Information Processing Systems , S.\u00a0Koyejo, S.\u00a0Mohamed, A.\u00a0Agarwal, D.\u00a0Belgrave, K.\u00a0Cho, and A.\u00a0Oh (Eds.), Vol.\u00a035. Curran Associates, Inc., 22199\u201322213. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2022\/file\/8bb0d291acd4acf06ef112099c16f326-Paper-Conference.pdf"},{"key":"e_1_3_3_2_28_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-40700-5"},{"key":"e_1_3_3_2_29_2","doi-asserted-by":"crossref","unstructured":"E\u00a0Megan Lachmar Andrea\u00a0K Wittenborn Katherine\u00a0W Bogen and Heather\u00a0L McCauley. 2017. #MyDepressionLooksLike: Examining Public Discourse About Depression on Twitter. JMIR MENTAL HEALTH (2017) 11.","DOI":"10.2196\/mental.8141"},{"key":"e_1_3_3_2_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW59228.2023.00602"},{"key":"e_1_3_3_2_31_2","doi-asserted-by":"publisher","DOI":"10.1145\/3630106.3658975"},{"key":"e_1_3_3_2_32_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642428"},{"key":"e_1_3_3_2_33_2","doi-asserted-by":"publisher","unstructured":"Shuailin Li Shiwei Wu Tianjian Liu Han Zhang Qingyu Guo and Zhenhui Peng. 2024. Understanding the Features of Text-Image Posts and Their Received Social Support in Online Grief Support Communities. Proceedings of the International AAAI Conference on Web and Social Media 18 (May 2024) 917\u2013929. 10.1609\/icwsm.v18i1.31362","DOI":"10.1609\/icwsm.v18i1.31362"},{"key":"e_1_3_3_2_34_2","first-page":"25268","volume-title":"Advances in Neural Information Processing Systems","author":"Lin Jing","year":"2023","unstructured":"Jing Lin, Ailing Zeng, Shunlin Lu, Yuanhao Cai, Ruimao Zhang, Haoqian Wang, and Lei Zhang. 2023. Motion-X: A Large-scale 3D Expressive Whole-body Human Motion Dataset. In Advances in Neural Information Processing Systems , A.\u00a0Oh, T.\u00a0Naumann, A.\u00a0Globerson, K.\u00a0Saenko, M.\u00a0Hardt, and S.\u00a0Levine (Eds.), Vol.\u00a036. Curran Associates, Inc., 25268\u201325280. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2023\/file\/4f8e27f6036c1d8b4a66b5b3a947dd7b-Paper-Datasets_and_Benchmarks.pdf"},{"key":"e_1_3_3_2_35_2","unstructured":"Haotian Liu Chunyuan Li Yuheng Li and Yong\u00a0Jae Lee. 2024. Improved Baselines with Visual Instruction Tuning. arxiv:https:\/\/arXiv.org\/abs\/2310.03744\u00a0[cs.CV]"},{"key":"e_1_3_3_2_36_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02484"},{"key":"e_1_3_3_2_37_2","doi-asserted-by":"publisher","unstructured":"Jiaying Liu and Yan Zhang. 2024. Modeling Health Video Consumption Behaviors on Social Media: Activities Challenges and Characteristics. Proceedings of the ACM on Human-Computer Interaction 8 CSCW1 (April 2024) 208:1\u2013208:28. 10.1145\/3653699","DOI":"10.1145\/3653699"},{"key":"e_1_3_3_2_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/3678884.3681850"},{"key":"e_1_3_3_2_39_2","doi-asserted-by":"publisher","DOI":"10.1145\/2470654.2470663"},{"key":"e_1_3_3_2_40_2","doi-asserted-by":"publisher","unstructured":"Yuanxin Liu Shicheng Li Yi Liu Yuxiang Wang Shuhuai Ren Lei Li Sishuo Chen Xu Sun and Lu Hou. 2024. TempCompass: Do Video LLMs Really Understand Videos?10.48550\/arXiv.2403.00476 Issue: arXiv:https:\/\/arXiv.org\/abs\/2403.00476 arXiv:2403.00476 [cs].","DOI":"10.48550\/arXiv.2403.00476"},{"key":"e_1_3_3_2_41_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.318"},{"key":"e_1_3_3_2_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/3025453.3025932"},{"key":"e_1_3_3_2_43_2","doi-asserted-by":"crossref","unstructured":"Ryan McGrady Kevin Zheng Rebecca Curran Jason Baumgartner and Ethan Zuckerman. 2023. Dialing for Videos: A Random Sample of YouTube. Journal of Quantitative Description: Digital Media 3 (2023).","DOI":"10.51685\/jqd.2023.022"},{"key":"e_1_3_3_2_44_2","doi-asserted-by":"publisher","DOI":"10.4324\/9780203811030"},{"key":"e_1_3_3_2_45_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.759"},{"key":"e_1_3_3_2_46_2","unstructured":"OpenAI Josh Achiam Steven Adler Sandhini Agarwal Lama Ahmad Ilge Akkaya Florencia\u00a0Leoni Aleman Diogo Almeida Janko Altenschmidt Sam Altman Shyamal Anadkat Red Avila Igor Babuschkin Suchir Balaji Valerie Balcom Paul Baltescu Haiming Bao Mohammad Bavarian Jeff Belgum Irwan Bello Jake Berdine Gabriel Bernadett-Shapiro Christopher Berner Lenny Bogdonoff Oleg Boiko Madelaine Boyd Anna-Luisa Brakman Greg Brockman Tim Brooks Miles Brundage Kevin Button Trevor Cai Rosie Campbell Andrew Cann Brittany Carey Chelsea Carlson Rory Carmichael Brooke Chan Che Chang Fotis Chantzis Derek Chen Sully Chen Ruby Chen Jason Chen Mark Chen Ben Chess Chester Cho Casey Chu Hyung\u00a0Won Chung Dave Cummings Jeremiah Currier Yunxing Dai Cory Decareaux Thomas Degry Noah Deutsch Damien Deville Arka Dhar David Dohan Steve Dowling Sheila Dunning Adrien Ecoffet Atty Eleti Tyna Eloundou David Farhi Liam Fedus Niko Felix Sim\u00f3n\u00a0Posada Fishman Juston Forte Isabella Fulford Leo Gao Elie Georges Christian Gibson Vik Goel Tarun Gogineni Gabriel Goh Rapha Gontijo-Lopes Jonathan Gordon Morgan Grafstein Scott Gray Ryan Greene Joshua Gross Shixiang\u00a0Shane Gu Yufei Guo Chris Hallacy Jesse Han Jeff Harris Yuchen He Mike Heaton Johannes Heidecke Chris Hesse Alan Hickey Wade Hickey Peter Hoeschele Brandon Houghton Kenny Hsu Shengli Hu Xin Hu Joost Huizinga Shantanu Jain Shawn Jain Joanne Jang Angela Jiang Roger Jiang Haozhun Jin Denny Jin Shino Jomoto Billie Jonn Heewoo Jun Tomer Kaftan \u0141ukasz Kaiser Ali Kamali Ingmar Kanitscheider Nitish\u00a0Shirish Keskar Tabarak Khan Logan Kilpatrick Jong\u00a0Wook Kim Christina Kim Yongjik Kim Jan\u00a0Hendrik Kirchner Jamie Kiros Matt Knight Daniel Kokotajlo \u0141ukasz Kondraciuk Andrew Kondrich Aris Konstantinidis Kyle Kosic Gretchen Krueger Vishal Kuo Michael Lampe Ikai Lan Teddy Lee Jan Leike Jade Leung Daniel Levy Chak\u00a0Ming Li Rachel Lim Molly Lin Stephanie Lin Mateusz Litwin Theresa Lopez Ryan Lowe Patricia Lue Anna Makanju Kim Malfacini Sam Manning Todor Markov Yaniv Markovski Bianca Martin Katie Mayer Andrew Mayne Bob McGrew Scott\u00a0Mayer McKinney Christine McLeavey Paul McMillan Jake McNeil David Medina Aalok Mehta Jacob Menick Luke Metz Andrey Mishchenko Pamela Mishkin Vinnie Monaco Evan Morikawa Daniel Mossing Tong Mu Mira Murati Oleg Murk David M\u00e9ly Ashvin Nair Reiichiro Nakano Rajeev Nayak Arvind Neelakantan Richard Ngo Hyeonwoo Noh Long Ouyang Cullen O\u2019Keefe Jakub Pachocki Alex Paino Joe Palermo Ashley Pantuliano Giambattista Parascandolo Joel Parish Emy Parparita Alex Passos Mikhail Pavlov Andrew Peng Adam Perelman Filipe de Avila Belbute\u00a0Peres Michael Petrov Henrique\u00a0Ponde de Oliveira\u00a0Pinto Michael Pokorny Michelle Pokrass Vitchyr\u00a0H. Pong Tolly Powell Alethea Power Boris Power Elizabeth Proehl Raul Puri Alec Radford Jack Rae Aditya Ramesh Cameron Raymond Francis Real Kendra Rimbach Carl Ross Bob Rotsted Henri Roussez Nick Ryder Mario Saltarelli Ted Sanders Shibani Santurkar Girish Sastry Heather Schmidt David Schnurr John Schulman Daniel Selsam Kyla Sheppard Toki Sherbakov Jessica Shieh Sarah Shoker Pranav Shyam Szymon Sidor Eric Sigler Maddie Simens Jordan Sitkin Katarina Slama Ian Sohl Benjamin Sokolowsky Yang Song Natalie Staudacher Felipe\u00a0Petroski Such Natalie Summers Ilya Sutskever Jie Tang Nikolas Tezak Madeleine\u00a0B. Thompson Phil Tillet Amin Tootoonchian Elizabeth Tseng Preston Tuggle Nick Turley Jerry Tworek Juan Felipe\u00a0Cer\u00f3n Uribe Andrea Vallone Arun Vijayvergiya Chelsea Voss Carroll Wainwright Justin\u00a0Jay Wang Alvin Wang Ben Wang Jonathan Ward Jason Wei CJ Weinmann Akila Welihinda Peter Welinder Jiayi Weng Lilian Weng Matt Wiethoff Dave Willner Clemens Winter Samuel Wolrich Hannah Wong Lauren Workman Sherwin Wu Jeff Wu Michael Wu Kai Xiao Tao Xu Sarah Yoo Kevin Yu Qiming Yuan Wojciech Zaremba Rowan Zellers Chong Zhang Marvin Zhang Shengjia Zhao Tianhao Zheng Juntang Zhuang William Zhuk and Barret Zoph. 2024. GPT-4 Technical Report. arxiv:https:\/\/arXiv.org\/abs\/2303.08774\u00a0[cs.CL]"},{"key":"e_1_3_3_2_47_2","doi-asserted-by":"crossref","unstructured":"Cliodhna O\u2019Connor and Helene Joffe. 2020. Intercoder reliability in qualitative research: debates and practical guidelines. International journal of qualitative methods 19 (2020) 1609406919899220.","DOI":"10.1177\/1609406919899220"},{"key":"e_1_3_3_2_48_2","doi-asserted-by":"publisher","unstructured":"Sachin\u00a0R. Pendse Neha Kumar and Munmun De\u00a0Choudhury. 2023. Marginalization and the Construction of Mental Illness Narratives Online: Foregrounding Institutions in Technology-Mediated Care. Proceedings of the ACM on Human-Computer Interaction 7 CSCW2 (Oct. 2023) 346:1\u2013346:30. 10.1145\/3610195","DOI":"10.1145\/3610195"},{"key":"e_1_3_3_2_49_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3581559"},{"key":"e_1_3_3_2_50_2","doi-asserted-by":"crossref","unstructured":"Mirjam Seckler Klaus Opwis and Alexandre\u00a0N Tuch. 2015. Linking objective design factors with subjective aesthetics: An experimental study on how structure and color of websites affect the facets of users\u2019 visual aesthetic perception. Computers in Human Behavior 49 (2015) 375\u2013389.","DOI":"10.1016\/j.chb.2015.02.056"},{"key":"e_1_3_3_2_51_2","unstructured":"Hua Shen Tiffany Knearem Reshmi Ghosh Yu-Ju Yang Tanushree Mitra and Yun Huang. 2024. Valuecompass: A framework of fundamental values for human-ai alignment. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2409.09586 (2024)."},{"key":"e_1_3_3_2_52_2","unstructured":"Yunlong Tang Jing Bi Siting Xu Luchuan Song Susan Liang Teng Wang Daoan Zhang Jie An Jingyang Lin Rongyi Zhu et\u00a0al. 2023. Video understanding with large language models: A survey. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2312.17432 (2023)."},{"key":"e_1_3_3_2_53_2","unstructured":"Suramya Tomar. 2006. Converting video formats with FFmpeg. Linux journal 2006 146 (2006) 10."},{"key":"e_1_3_3_2_54_2","unstructured":"Jiaqi Wang Hanqi Jiang Yiheng Liu Chong Ma Xu Zhang Yi Pan Mengyuan Liu Peiran Gu Sichen Xia Wenjun Li et\u00a0al. 2024. A Comprehensive Review of Multimodal Large Language Models: Performance and Challenges Across Different Tasks. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2408.01319 (2024)."},{"key":"e_1_3_3_2_55_2","doi-asserted-by":"crossref","unstructured":"Zhou Wang Alan\u00a0C Bovik Hamid\u00a0R Sheikh and Eero\u00a0P Simoncelli. 2004. Image quality assessment: from error measurement to structural similarity. IEEE transactions on image processing 13 1 (2004).","DOI":"10.1109\/TIP.2003.819861"},{"key":"e_1_3_3_2_56_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3636302"},{"key":"e_1_3_3_2_57_2","doi-asserted-by":"publisher","DOI":"10.1145\/3581754.3584136"},{"key":"e_1_3_3_2_58_2","first-page":"11809","volume-title":"Advances in Neural Information Processing Systems","volume":"36","author":"Yao Shunyu","year":"2023","unstructured":"Shunyu Yao, Dian Yu, Jeffrey Zhao, Izhak Shafran, Tom Griffiths, Yuan Cao, and Karthik Narasimhan. 2023. Tree of Thoughts: Deliberate Problem Solving with Large Language Models. In Advances in Neural Information Processing Systems , A.\u00a0Oh, T.\u00a0Naumann, A.\u00a0Globerson, K.\u00a0Saenko, M.\u00a0Hardt, and S.\u00a0Levine (Eds.), Vol.\u00a036. Curran Associates, Inc., 11809\u201311822. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2023\/file\/271db9922b8d1f4dd7aaef84ed5ac703-Paper-Conference.pdf"},{"key":"e_1_3_3_2_59_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.506"},{"key":"e_1_3_3_2_60_2","doi-asserted-by":"publisher","unstructured":"Shukang Yin Chaoyou Fu Sirui Zhao Ke Li Xing Sun Tong Xu and Enhong Chen. 2024. A survey on multimodal large language models. National Science Review 11 12 (11 2024) nwae403. 10.1093\/nsr\/nwae403 arXiv:https:\/\/academic.oup.com\/nsr\/article-pdf\/11\/12\/nwae403\/61201557\/nwae403.pdf","DOI":"10.1093\/nsr\/nwae403"},{"key":"e_1_3_3_2_61_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-demo.49"},{"key":"e_1_3_3_2_62_2","doi-asserted-by":"publisher","unstructured":"He Zhang Chuhao Wu Jingyi Xie Yao Lyu Jie Cai and John\u00a0M. Carroll. 2023. Redefining Qualitative Analysis in the AI Era: Utilizing ChatGPT for Efficient Thematic Analysis. 10.48550\/arXiv.2309.10771 Issue: arXiv:https:\/\/arXiv.org\/abs\/2309.10771 arXiv:2309.10771 [cs].","DOI":"10.48550\/arXiv.2309.10771"},{"key":"e_1_3_3_2_63_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW63382.2024.00206"}],"event":{"name":"CHI EA '25: Extended Abstracts of the CHI Conference on Human Factors in Computing Systems","location":"Yokohama Japan","acronym":"CHI EA '25","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"]},"container-title":["Proceedings of the Extended Abstracts of the CHI Conference on Human Factors in Computing Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3706599.3719821","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3706599.3719821","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:34Z","timestamp":1750295914000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3706599.3719821"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,25]]},"references-count":62,"alternative-id":["10.1145\/3706599.3719821","10.1145\/3706599"],"URL":"https:\/\/doi.org\/10.1145\/3706599.3719821","relation":{},"subject":[],"published":{"date-parts":[[2025,4,25]]},"assertion":[{"value":"2025-04-25","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}