{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,4]],"date-time":"2026-02-04T18:48:28Z","timestamp":1770230908952,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":156,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,4,25]],"date-time":"2025-04-25T00:00:00Z","timestamp":1745539200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,4,26]]},"DOI":"10.1145\/3706598.3714069","type":"proceedings-article","created":{"date-parts":[[2025,4,24]],"date-time":"2025-04-24T03:30:09Z","timestamp":1745465409000},"page":"1-21","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Emerging Data Practices: Data Work in the Era of Large Language Models"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4230-3777","authenticated-orcid":false,"given":"Adriana","family":"Alvarado Garcia","sequence":"first","affiliation":[{"name":"Responsible Tech Research, IBM Research, Yorktown Heights, New York, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0365-8057","authenticated-orcid":false,"given":"Heloisa","family":"Candello","sequence":"additional","affiliation":[{"name":"IBM Research, Sao Paulo, Brazil"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1165-3619","authenticated-orcid":false,"given":"Karla","family":"Badillo-Urquiola","sequence":"additional","affiliation":[{"name":"Department of Computer Science and Engineering, University of Notre Dame, South Bend, Indiana, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8071-6716","authenticated-orcid":false,"given":"Marisol","family":"Wong-Villacres","sequence":"additional","affiliation":[{"name":"Facultad de Ingenier\u00eda en Electricidad y Computaci\u00f3n, Escuela Superior Polit\u00e9cnica del Litoral, Guayaquil, Ecuador"}]}],"member":"320","published-online":{"date-parts":[[2025,4,25]]},"reference":[{"key":"e_1_3_3_3_2_2","unstructured":"2024. https:\/\/partnershiponai.org\/modeldeployment\/#landing"},{"key":"e_1_3_3_3_3_2","unstructured":"Sara Abdali Richard Anarfi CJ Barberan and Jia He. 2024. Securing Large Language Models: Threats Vulnerabilities and Responsible Practices. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.12503 (2024)."},{"key":"e_1_3_3_3_4_2","doi-asserted-by":"crossref","unstructured":"Abubakar Abid Maheen Farooqi and James Zou. 2021. Large language models associate Muslims with violence. Nature Machine Intelligence 3 6 (2021) 461\u2013463.","DOI":"10.1038\/s42256-021-00359-2"},{"key":"e_1_3_3_3_5_2","doi-asserted-by":"crossref","unstructured":"Rene Abraham Johannes Schneider and Jan Vom\u00a0Brocke. 2019. Data governance: A conceptual framework structured review and research agenda. International journal of information management 49 (2019) 424\u2013438.","DOI":"10.1016\/j.ijinfomgt.2019.07.008"},{"key":"e_1_3_3_3_6_2","doi-asserted-by":"publisher","unstructured":"Jumana Almahmoud Robert DeLine and Steven\u00a0M. Drucker. 2021. How Teams Communicate about the Quality of ML Models: A Case Study at an International Technology Company. Proc. ACM Hum.-Comput. Interact. 5 GROUP Article 222 (July 2021) 24\u00a0pages. 10.1145\/3463934","DOI":"10.1145\/3463934"},{"key":"e_1_3_3_3_7_2","doi-asserted-by":"publisher","unstructured":"Anne Arzberger Stefan Buijsman Maria\u00a0Luce Lupetti Alessandro Bozzon and Jie Yang. 2024. Nothing Comes Without Its World \u2013 Practical Challenges of Aligning LLMs to Situated Human Values through RLHF. Proceedings of the AAAI\/ACM Conference on AI Ethics and Society 7 1 (Oct. 2024) 61\u201373. 10.1609\/aies.v7i1.31617","DOI":"10.1609\/aies.v7i1.31617"},{"key":"e_1_3_3_3_8_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.608"},{"key":"e_1_3_3_3_9_2","doi-asserted-by":"publisher","DOI":"10.1145\/3442188.3445922"},{"key":"e_1_3_3_3_10_2","unstructured":"Sarah Bird Miro Dud\u00edk Richard Edgar Brandon Horn Roman Lutz Vanessa Milan Mehrnoosh Sameki Hanna Wallach and Kathleen Walker. 2020. Fairlearn: A toolkit for assessing and improving fairness in AI. Microsoft Tech. Rep. MSR-TR-2020-32 (2020)."},{"key":"e_1_3_3_3_11_2","unstructured":"Tolga Bolukbasi Kai-Wei Chang James\u00a0Y Zou Venkatesh Saligrama and Adam\u00a0T Kalai. 2016. Man is to computer programmer as woman is to homemaker? debiasing word embeddings. Advances in neural information processing systems 29 (2016)."},{"key":"e_1_3_3_3_12_2","doi-asserted-by":"crossref","unstructured":"Zal\u00e1n Borsos Rapha\u00ebl Marinier Damien Vincent Eugene Kharitonov Olivier Pietquin Matt Sharifi Dominik Roblek Olivier Teboul David Grangier Marco Tagliasacchi et\u00a0al. 2023. Audiolm: a language modeling approach to audio generation. IEEE\/ACM transactions on audio speech and language processing 31 (2023) 2523\u20132533.","DOI":"10.1109\/TASLP.2023.3288409"},{"key":"e_1_3_3_3_13_2","volume-title":"Sorting things out: classification and its consequences","author":"Bowker Geoffrey\u00a0C.","year":"2008","unstructured":"Geoffrey\u00a0C. Bowker and Susan\u00a0Leigh. Star. 2008. Sorting things out: classification and its consequences. MIT Press."},{"key":"e_1_3_3_3_14_2","doi-asserted-by":"crossref","unstructured":"Virginia Braun and Victoria Clarke. 2006. Using thematic analysis in psychology. Qualitative Research in Psychology 3 2 (2006) 77\u2013101.","DOI":"10.1191\/1478088706qp063oa"},{"key":"e_1_3_3_3_15_2","unstructured":"Tom\u00a0B Brown. 2020. Language models are few-shot learners. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2005.14165 (2020)."},{"key":"e_1_3_3_3_16_2","unstructured":"Jeff Burke Ruofei Du Matthew\u00a0K Hong Jennifer Jacobs Philippe Laban Dingzeyu Li Nanyun Peng Karl\u00a0DD Willis Chien-Sheng Wu and Bolei Zhou. [n. d.]. Next Steps for Human-Centered Generative AI. ([n. d.])."},{"key":"e_1_3_3_3_17_2","doi-asserted-by":"crossref","unstructured":"Steve Campbell Melanie Greenwood Sarah Prior Toniele Shearer Kerrie Walkem Sarah Young Danielle Bywaters and Kim Walker. 2020. Purposive sampling: complex or simple? Research case examples. Journal of research in Nursing 25 8 (2020) 652\u2013661.","DOI":"10.1177\/1744987120927206"},{"key":"e_1_3_3_3_18_2","first-page":"5253","volume-title":"32nd USENIX Security Symposium (USENIX Security 23)","author":"Carlini Nicolas","year":"2023","unstructured":"Nicolas Carlini, Jamie Hayes, Milad Nasr, Matthew Jagielski, Vikash Sehwag, Florian Tramer, Borja Balle, Daphne Ippolito, and Eric Wallace. 2023. Extracting training data from diffusion models. In 32nd USENIX Security Symposium (USENIX Security 23). 5253\u20135270."},{"key":"e_1_3_3_3_19_2","doi-asserted-by":"publisher","unstructured":"Samuelle Carlson and Ben Anderson. 2007. What Are Data? The Many Kinds of Data and Their Implications for Data Re-Use. Journal of Computer-Mediated Communication 12 2 (01 2007) 635\u2013651. 10.1111\/j.1083-6101.2007.00342.x arXiv:https:\/\/academic.oup.com\/jcmc\/article-pdf\/12\/2\/635\/22317230\/jjcmcom0635.pdf","DOI":"10.1111\/j.1083-6101.2007.00342.x"},{"key":"e_1_3_3_3_20_2","unstructured":"Louis Castricato Nathan Lile Rafael Rafailov Jan-Philipp Fr\u00e4nken and Chelsea Finn. 2024. PERSONA: A Reproducible Testbed for Pluralistic Alignment. arxiv:https:\/\/arXiv.org\/abs\/2407.17387\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2407.17387"},{"key":"e_1_3_3_3_21_2","doi-asserted-by":"publisher","unstructured":"Srravya Chandhiramowuli Alex\u00a0S. Taylor Sara Heitlinger and Ding Wang. 2024. Making Data Work Count. Proc. ACM Hum.-Comput. Interact. 8 CSCW1 Article 90 (apr 2024) 26\u00a0pages. 10.1145\/3637367","DOI":"10.1145\/3637367"},{"key":"e_1_3_3_3_22_2","doi-asserted-by":"crossref","unstructured":"Irene\u00a0Y Chen Shalmali Joshi Marzyeh Ghassemi and Rajesh Ranganath. 2021. Probabilistic machine learning for healthcare. Annual review of biomedical data science 4 1 (2021) 393\u2013415.","DOI":"10.1146\/annurev-biodatasci-092820-033938"},{"key":"e_1_3_3_3_23_2","unstructured":"Mark Chen Jerry Tworek Heewoo Jun Qiming Yuan Henrique Ponde De\u00a0Oliveira Pinto Jared Kaplan Harri Edwards Yuri Burda Nicholas Joseph Greg Brockman et\u00a0al. 2021. Evaluating large language models trained on code. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2107.03374 (2021)."},{"key":"e_1_3_3_3_24_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-ijcnlp.32"},{"key":"e_1_3_3_3_25_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.870"},{"key":"e_1_3_3_3_26_2","unstructured":"Aakanksha Chowdhery Sharan Narang Jacob Devlin Maarten Bosma Gaurav Mishra Adam Roberts Paul Barham Hyung\u00a0Won Chung Charles Sutton Sebastian Gehrmann et\u00a0al. 2023. Palm: Scaling language modeling with pathways. Journal of Machine Learning Research 24 240 (2023) 1\u2013113."},{"key":"e_1_3_3_3_27_2","doi-asserted-by":"crossref","unstructured":"Carter Cousineau Rozita Dara and Ataharul Chowdhury. 2024. Trustworthy AI: AI developers\u2019 lens to implementation challenges and opportunities. Data and Information Management (2024) 100082.","DOI":"10.1016\/j.dim.2024.100082"},{"key":"e_1_3_3_3_28_2","unstructured":"D Coyle S Diepeveen J Wdowin L Kay and J Tennison. 2020. Informing the global data future: benchmarking data governance frameworks. Data & Policy Cambridge Core (2020)."},{"key":"e_1_3_3_3_29_2","doi-asserted-by":"crossref","unstructured":"Arghavan\u00a0Moradi Dakhel Vahid Majdinasab Amin Nikanjam Foutse Khomh Michel\u00a0C Desmarais and Zhen Ming\u00a0Jack Jiang. 2023. Github copilot ai pair programmer: Asset or liability? Journal of Systems and Software 203 (2023) 111734.","DOI":"10.1016\/j.jss.2023.111734"},{"key":"e_1_3_3_3_30_2","doi-asserted-by":"publisher","unstructured":"Andrew\u00a0Gary Darwin\u00a0Holmes. 2020. Researcher Positionality - A Consideration of Its Influence and Place in Qualitative Research - A New Researcher Guide. Shanlax International Journal of Education 8 4 (Sep. 2020) 1\u201310. 10.34293\/education.v8i4.3232","DOI":"10.34293\/education.v8i4.3232"},{"key":"e_1_3_3_3_31_2","unstructured":"Aline de Campos Jorge Melegati Nicolas Nascimento Rafael Chanin Afonso Sales and Igor Wiese. 2024. Some things never change: how far generative AI can really change software engineering practice. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2406.09725 (2024)."},{"key":"e_1_3_3_3_32_2","doi-asserted-by":"publisher","DOI":"10.1145\/3593013.3594037"},{"key":"e_1_3_3_3_33_2","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/11805.001.0001"},{"key":"e_1_3_3_3_34_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445188"},{"key":"e_1_3_3_3_35_2","doi-asserted-by":"publisher","DOI":"10.1145\/3025453.3025837"},{"key":"e_1_3_3_3_36_2","doi-asserted-by":"crossref","unstructured":"Luciano Floridi and Josh Cowls. 2022. A unified framework of five principles for AI in society. Machine learning and the city: Applications in architecture and urban design (2022) 535\u2013545.","DOI":"10.1002\/9781119815075.ch45"},{"key":"e_1_3_3_3_37_2","doi-asserted-by":"publisher","unstructured":"Iason Gabriel. 2020. Artificial Intelligence Values and Alignment. Minds Mach. 30 3 (sep 2020) 411\u2013437. 10.1007\/s11023-020-09539-2","DOI":"10.1007\/s11023-020-09539-2"},{"key":"e_1_3_3_3_38_2","doi-asserted-by":"publisher","DOI":"10.1145\/3531146.3533229"},{"key":"e_1_3_3_3_39_2","doi-asserted-by":"publisher","unstructured":"Timnit Gebru Jamie Morgenstern Briana Vecchione Jennifer\u00a0Wortman Vaughan Hanna Wallach Hal\u00a0Daum\u00e9 III and Kate Crawford. 2021. Datasheets for datasets. Commun. ACM 64 12 (nov 2021) 86\u201392. 10.1145\/3458723","DOI":"10.1145\/3458723"},{"key":"e_1_3_3_3_40_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3580782"},{"key":"e_1_3_3_3_41_2","doi-asserted-by":"publisher","DOI":"10.1145\/2463676.2463712"},{"key":"e_1_3_3_3_42_2","doi-asserted-by":"publisher","DOI":"10.1145\/3544548.3580999"},{"key":"e_1_3_3_3_43_2","doi-asserted-by":"publisher","DOI":"10.1145\/3630106.3659009"},{"key":"e_1_3_3_3_44_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642872"},{"key":"e_1_3_3_3_45_2","doi-asserted-by":"publisher","DOI":"10.1145\/3593013.3594067"},{"key":"e_1_3_3_3_46_2","doi-asserted-by":"crossref","unstructured":"Jeffrey\u00a0T Hancock Mor Naaman and Karen Levy. 2020. AI-mediated communication: Definition research agenda and ethical considerations. Journal of Computer-Mediated Communication 25 1 (2020) 89\u2013100.","DOI":"10.1093\/jcmc\/zmz022"},{"key":"e_1_3_3_3_47_2","doi-asserted-by":"publisher","DOI":"10.1115\/DETC2021-68103"},{"key":"e_1_3_3_3_48_2","unstructured":"Jonathan Ho Tim Salimans Alexey Gritsenko William Chan Mohammad Norouzi and David\u00a0J Fleet. 2022. Video diffusion models. Advances in Neural Information Processing Systems 35 (2022) 8633\u20138646."},{"key":"e_1_3_3_3_49_2","unstructured":"Ari Holtzman Jan Buys Li Du Maxwell Forbes and Yejin Choi. 2019. The curious case of neural text degeneration. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1904.09751 (2019)."},{"key":"e_1_3_3_3_50_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.806"},{"key":"e_1_3_3_3_51_2","doi-asserted-by":"crossref","unstructured":"Javier\u00a0Camacho Ib\u00e1\u00f1ez and M\u00f3nica\u00a0Villas Olmeda. 2022. Operationalising AI ethics: how are companies bridging the gap between practice and principles? An exploratory study. Ai & Society 37 4 (2022) 1663\u20131687.","DOI":"10.1007\/s00146-021-01267-0"},{"key":"e_1_3_3_3_52_2","doi-asserted-by":"publisher","unstructured":"Andrew Iliadis and Federica Russo. 2016. Critical data studies: An introduction. Big Data & Society 3 2 (2016) 2053951716674238. 10.1177\/2053951716674238 arXiv:10.1177\/2053951716674238","DOI":"10.1177\/2053951716674238"},{"key":"e_1_3_3_3_53_2","doi-asserted-by":"crossref","unstructured":"Marijn Janssen. 2025. Responsible governance of generative AI: conceptualizing GenAI as complex adaptive systems. Policy and Society (2025) puae040.","DOI":"10.1093\/polsoc\/puae040"},{"key":"e_1_3_3_3_54_2","doi-asserted-by":"publisher","unstructured":"Marijn Janssen Paul Brous Elsa Estevez Luis\u00a0S. Barbosa and Tomasz Janowski. 2020. Data governance: Organizing data for trustworthy Artificial Intelligence. Government Information Quarterly 37 3 (2020) 101493. 10.1016\/j.giq.2020.101493","DOI":"10.1016\/j.giq.2020.101493"},{"key":"e_1_3_3_3_55_2","doi-asserted-by":"publisher","DOI":"10.1145\/3531146.3534637"},{"key":"e_1_3_3_3_56_2","unstructured":"James Jordan Florimond Houssiau Giovanni Cherubin Samuel\u00a0N Cohen Lukasz Szpruch Mirko Bottarelli Carsten Maple and Adrian Weller. 2022. https:\/\/royalsociety.org\/-\/media\/policy\/projects\/privacy-enhancing-technologies\/Synthetic_Data_Survey-24.pdf"},{"key":"e_1_3_3_3_57_2","doi-asserted-by":"publisher","DOI":"10.1145\/3618260.3649777"},{"key":"e_1_3_3_3_58_2","first-page":"15696","volume-title":"International Conference on Machine Learning","author":"Kandpal Nikhil","year":"2023","unstructured":"Nikhil Kandpal, Haikang Deng, Adam Roberts, Eric Wallace, and Colin Raffel. 2023. Large language models struggle to learn long-tail knowledge. In International Conference on Machine Learning. PMLR, 15696\u201315707."},{"key":"e_1_3_3_3_59_2","doi-asserted-by":"publisher","DOI":"10.1145\/3580305.3599557"},{"key":"e_1_3_3_3_60_2","doi-asserted-by":"crossref","unstructured":"Julian\u00a0J Koplin. 2023. Dual-use implications of AI text generation. Ethics and Information Technology 25 2 (2023) 32.","DOI":"10.1007\/s10676-023-09703-z"},{"key":"e_1_3_3_3_61_2","unstructured":"Anurakt Kumar Divyanshu Kumar Jatan Loya Nitin\u00a0Aravind Birur Tanay Baswa Sahil Agarwal and Prashanth Harshangi. 2024. SAGE-RT: Synthetic Alignment data Generation for Safety Evaluation and Red Teaming. arxiv:https:\/\/arXiv.org\/abs\/2408.11851\u00a0[cs.AI] https:\/\/arxiv.org\/abs\/2408.11851"},{"key":"e_1_3_3_3_62_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3502030"},{"key":"e_1_3_3_3_63_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642428"},{"key":"e_1_3_3_3_64_2","doi-asserted-by":"crossref","unstructured":"Yujia Li David Choi Junyoung Chung Nate Kushman Julian Schrittwieser R\u00e9mi Leblond Tom Eccles James Keeling Felix Gimeno Agustin Dal\u00a0Lago et\u00a0al. 2022. Competition-level code generation with alphacode. Science 378 6624 (2022) 1092\u20131097.","DOI":"10.1126\/science.abq1158"},{"key":"e_1_3_3_3_65_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.naacl-main.15"},{"key":"e_1_3_3_3_66_2","doi-asserted-by":"publisher","DOI":"10.1145\/3498366.3505817"},{"key":"e_1_3_3_3_67_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.647"},{"key":"e_1_3_3_3_68_2","doi-asserted-by":"crossref","unstructured":"Q.\u00a0Vera Liao and Jennifer Wortman\u00a0Vaughan. 2024. AI Transparency in the Age of LLMs: A Human-Centered Research Roadmap. Harvard Data Science ReviewSpecial Issue 5 (may 31 2024). https:\/\/hdsr.mitpress.mit.edu\/pub\/aelql9qy.","DOI":"10.1162\/99608f92.8036d03b"},{"key":"e_1_3_3_3_69_2","unstructured":"Haohe Liu Zehua Chen Yi Yuan Xinhao Mei Xubo Liu Danilo Mandic Wenwu Wang and Mark\u00a0D Plumbley. 2023. Audioldm: Text-to-audio generation with latent diffusion models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2301.12503 (2023)."},{"key":"e_1_3_3_3_70_2","unstructured":"Ruibo Liu Jerry Wei Fangyu Liu Chenglei Si Yanzhe Zhang Jinmeng Rao Steven Zheng Daiyi Peng Diyi Yang Denny Zhou et\u00a0al. 2024. Best practices and lessons learned on synthetic data for language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2404.07503 (2024)."},{"key":"e_1_3_3_3_71_2","doi-asserted-by":"crossref","unstructured":"Yang Liu Jiahuan Cao Chongyu Liu Kai Ding and Lianwen Jin. 2024. Datasets for Large Language Models: A Comprehensive Survey. arxiv:https:\/\/arXiv.org\/abs\/2402.18041\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2402.18041","DOI":"10.21203\/rs.3.rs-3996137\/v1"},{"key":"e_1_3_3_3_72_2","first-page":"2638","volume-title":"Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024)","author":"Liu Yuxuan","year":"2024","unstructured":"Yuxuan Liu, Tianchi Yang, Shaohan Huang, Zihan Zhang, Haizhen Huang, Furu Wei, Weiwei Deng, Feng Sun, and Qi Zhang. 2024. Calibrating LLM-Based Evaluator. In Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024), Nicoletta Calzolari, Min-Yen Kan, Veronique Hoste, Alessandro Lenci, Sakriani Sakti, and Nianwen Xue (Eds.). ELRA and ICCL, Torino, Italia, 2638\u20132656. https:\/\/aclanthology.org\/2024.lrec-main.237"},{"key":"e_1_3_3_3_73_2","unstructured":"Shayne Longpre Stella Biderman Alon Albalak Hailey Schoelkopf Daniel McDuff Sayash Kapoor Kevin Klyman Kyle Lo Gabriel Ilharco Nay San Maribeth Rauh Aviya Skowron Bertie Vidgen Laura Weidinger Arvind Narayanan Victor Sanh David Adelani Percy Liang Rishi Bommasani Peter Henderson Sasha Luccioni Yacine Jernite and Luca Soldaini. 2024. The Responsible Foundation Model Development Cheatsheet: A Review of Tools and Resources. arxiv:https:\/\/arXiv.org\/abs\/2406.16746\u00a0[cs.LG] https:\/\/arxiv.org\/abs\/2406.16746"},{"key":"e_1_3_3_3_74_2","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/11543.001.0001"},{"key":"e_1_3_3_3_75_2","doi-asserted-by":"publisher","DOI":"10.1145\/3630106.3658988"},{"key":"e_1_3_3_3_76_2","volume-title":"Proceedings of the fourth international conference on computational creativity","volume":"147","author":"Maher Mary\u00a0Lou","year":"2013","unstructured":"Mary\u00a0Lou Maher, Katherine Brady, and Douglas\u00a0H Fisher. 2013. Computational models of surprise in evaluating creative design. In Proceedings of the fourth international conference on computational creativity , Vol.\u00a0147. Citeseer."},{"key":"e_1_3_3_3_77_2","unstructured":"Laura Manduchi Kushagra Pandey Robert Bamler Ryan Cotterell Sina D\u00e4ubener Sophie Fellenz Asja Fischer Thomas G\u00e4rtner Matthias Kirchler Marius Kloft et\u00a0al. 2024. On the challenges and opportunities in generative ai. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.00025 (2024)."},{"key":"e_1_3_3_3_78_2","doi-asserted-by":"crossref","unstructured":"Matti M\u00e4ntym\u00e4ki Matti Minkkinen Teemu Birkstedt and Mika Viljanen. 2022. Defining organizational AI governance. AI and Ethics 2 4 (2022) 603\u2013609.","DOI":"10.1007\/s43681-022-00143-x"},{"key":"e_1_3_3_3_79_2","unstructured":"Nestor Maslej Loredana Fattorini Raymond Perrault Vanessa Parli Anka Reuel Erik Brynjolfsson John Etchemendy Katrina Ligett Terah Lyons James Manyika Juan\u00a0Carlos Niebles Yoav Shoham Russell Wald and Jack Clark. 2024. The AI Index 2024 Annual Report."},{"key":"e_1_3_3_3_80_2","doi-asserted-by":"crossref","unstructured":"Nora McDonald Sarita Schoenebeck and Andrea Forte. 2019. Reliability and inter-rater reliability in qualitative research: Norms and guidelines for CSCW and HCI practice. Proceedings of the ACM on human-computer interaction 3 CSCW (2019) 1\u201323.","DOI":"10.1145\/3359174"},{"key":"e_1_3_3_3_81_2","doi-asserted-by":"crossref","unstructured":"Bertalan Mesk\u00f3 and Eric\u00a0J Topol. 2023. The imperative for regulatory oversight of large language models (or generative AI) in healthcare. NPJ digital medicine 6 1 (2023) 120.","DOI":"10.1038\/s41746-023-00873-0"},{"key":"e_1_3_3_3_82_2","doi-asserted-by":"publisher","unstructured":"Milagros Miceli Martin Schuessler and Tianling Yang. 2020. Between Subjectivity and Imposition: Power Dynamics in Data Annotation for Computer Vision. Proc. ACM Hum.-Comput. Interact. 4 CSCW2 Article 115 (oct 2020) 25\u00a0pages. 10.1145\/3415186","DOI":"10.1145\/3415186"},{"key":"e_1_3_3_3_83_2","doi-asserted-by":"publisher","unstructured":"Milagros Miceli Tianling Yang Adriana Alvarado\u00a0Garcia Julian Posada Sonja\u00a0Mei Wang Marc Pohl and Alex Hanna. 2022. Documenting Data Production Processes: A Participatory Approach for Data Work. Proc. ACM Hum.-Comput. Interact. 6 CSCW2 Article 510 (nov 2022) 34\u00a0pages. 10.1145\/3555623","DOI":"10.1145\/3555623"},{"key":"e_1_3_3_3_84_2","doi-asserted-by":"publisher","DOI":"10.1145\/3442188.3445880"},{"key":"e_1_3_3_3_85_2","doi-asserted-by":"crossref","unstructured":"Marina Micheli Marisa Ponti Max Craglia and Anna Berti\u00a0Suman. 2020. Emerging models of data governance in the age of datafication. Big Data & Society 7 2 (2020) 2053951720948087.","DOI":"10.1177\/2053951720948087"},{"key":"e_1_3_3_3_86_2","doi-asserted-by":"crossref","unstructured":"Naja\u00a0Holten M\u00f8ller Claus Bossen Kathleen\u00a0H Pine Trine\u00a0Rask Nielsen and Gina Neff. 2020. Who does the work of data? Interactions 27 3 (2020) 52\u201355.","DOI":"10.1145\/3386389"},{"key":"e_1_3_3_3_87_2","doi-asserted-by":"crossref","unstructured":"Jessica Morley Luciano Floridi Libby Kinsey and Anat Elhalal. 2020. From what to how: an initial review of publicly available AI ethics tools methods and research to translate principles into practices. Science and engineering ethics 26 4 (2020) 2141\u20132168.","DOI":"10.1007\/s11948-019-00165-5"},{"key":"e_1_3_3_3_88_2","doi-asserted-by":"publisher","DOI":"10.1145\/3406865.3418584"},{"key":"e_1_3_3_3_89_2","volume-title":"International Conference on Computational Creativity","author":"Muller Michael","year":"2023","unstructured":"Michael Muller, Heloisa Candello, and Justin Weisz. 2023. Interactional Co-Creativity of Human and AI in Analogy-Based Design. In International Conference on Computational Creativity."},{"key":"e_1_3_3_3_90_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3636294"},{"key":"e_1_3_3_3_91_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300356"},{"key":"e_1_3_3_3_92_2","doi-asserted-by":"publisher","DOI":"10.1145\/3290605.3300356"},{"key":"e_1_3_3_3_93_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3517644"},{"key":"e_1_3_3_3_94_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445402"},{"key":"e_1_3_3_3_95_2","doi-asserted-by":"crossref","unstructured":"AkshatKumar Nigam Robert Pollice Mario Krenn Gabriel dos Passos\u00a0Gomes and Alan Aspuru-Guzik. 2021. Beyond generative models: superfast traversal optimization novelty exploration and discovery (STONED) algorithm for molecules using SELFIES. Chemical science 12 20 (2021) 7079\u20137090.","DOI":"10.1039\/D1SC00231G"},{"key":"e_1_3_3_3_96_2","unstructured":"Uditi Ojha. 2022. Towards fairness AI: A data-centric approach. Ph.\u00a0D. Dissertation. Politecnico di Torino."},{"key":"e_1_3_3_3_97_2","unstructured":"Achiam\u00a0J OpenAI Steven Adler Sandhini Agarwal Lama Ahmad Ilge Akkaya Florencia\u00a0Leoni Aleman Diogo Almeida Janko Altenschmidt Sam Altman Shyamal Anadkat et\u00a0al. [n. d.]. GPT\u20134 Technical Report. 2024. URL: https:\/\/arxiv. org\/abs\/2303.08774 ([n. d.])."},{"key":"e_1_3_3_3_98_2","doi-asserted-by":"crossref","unstructured":"Samir Passi and Steven\u00a0J Jackson. 2018. Trust in data science: Collaboration translation and accountability in corporate data science projects. Proceedings of the ACM on human-computer interaction 2 CSCW (2018) 1\u201328.","DOI":"10.1145\/3274405"},{"key":"e_1_3_3_3_99_2","doi-asserted-by":"crossref","unstructured":"Pat Pataranutaporn Valdemar Danry Joanne Leong Parinya Punpongsanon Dan Novy Pattie Maes and Misha Sra. 2021. AI-generated characters for supporting personalized learning and well-being. Nature Machine Intelligence 3 12 (2021) 1013\u20131022.","DOI":"10.1038\/s42256-021-00417-9"},{"key":"e_1_3_3_3_100_2","volume-title":"Data stewardship: An actionable guide to effective data management and data governance","author":"Plotkin David","year":"2020","unstructured":"David Plotkin. 2020. Data stewardship: An actionable guide to effective data management and data governance. Academic press."},{"key":"e_1_3_3_3_101_2","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-7506-9718-7.50010-X"},{"key":"e_1_3_3_3_102_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3651007"},{"key":"e_1_3_3_3_103_2","unstructured":"Nazneen Rajani Nathan Lambert and Lewis Tunstall. 2023. Red-Teaming Large Language Models. https:\/\/huggingface.co\/blog\/red-teaming"},{"key":"e_1_3_3_3_104_2","doi-asserted-by":"publisher","unstructured":"Bogdana Rakova Jingying Yang Henriette Cramer and Rumman Chowdhury. 2021. Where Responsible AI meets Reality: Practitioner Perspectives on Enablers for Shifting Organizational Practices. Proc. ACM Hum.-Comput. Interact. 5 CSCW1 Article 7 (apr 2021) 23\u00a0pages. 10.1145\/3449081","DOI":"10.1145\/3449081"},{"key":"e_1_3_3_3_105_2","doi-asserted-by":"crossref","unstructured":"Suman Ravuri Karel Lenc Matthew Willson Dmitry Kangin Remi Lam Piotr Mirowski Megan Fitzsimons Maria Athanassiadou Sheleem Kashem Sam Madge et\u00a0al. 2021. Skilful precipitation nowcasting using deep generative models of radar. Nature 597 7878 (2021) 672\u2013677.","DOI":"10.1038\/s41586-021-03854-z"},{"key":"e_1_3_3_3_106_2","unstructured":"Anka Reuel and Trond\u00a0Arne Undheim. 2024. Generative AI Needs Adaptive Governance. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2406.04554 (2024)."},{"key":"e_1_3_3_3_107_2","doi-asserted-by":"publisher","DOI":"10.1145\/3600211.3604702"},{"key":"e_1_3_3_3_108_2","doi-asserted-by":"crossref","unstructured":"Annabel Rothschild Amanda Meng Carl DiSalvo Britney Johnson Ben\u00a0Rydal Shapiro and Betsy DiSalvo. 2022. Interrogating data work as a community of practice. Proceedings of the ACM on Human-Computer Interaction 6 CSCW2 (2022) 1\u201328.","DOI":"10.1145\/3555198"},{"key":"e_1_3_3_3_109_2","doi-asserted-by":"crossref","unstructured":"Hannah Ruschemeier. 2024. Generative AI and Data Protection. (2024).","DOI":"10.1017\/cfl.2024.2"},{"key":"e_1_3_3_3_110_2","volume-title":"Human compatible : artificial intelligence and the problem of control","author":"Russell Stuart J. (Stuart\u00a0Jonathan)","year":"2019","unstructured":"Stuart J. (Stuart\u00a0Jonathan) Russell. 2019. Human compatible : artificial intelligence and the problem of control. Allen Lane\/Penguin Books, London."},{"key":"e_1_3_3_3_111_2","doi-asserted-by":"crossref","unstructured":"Daniel Russo. 2024. Navigating the complexity of generative ai adoption in software engineering. ACM Transactions on Software Engineering and Methodology (2024).","DOI":"10.1145\/3652154"},{"key":"e_1_3_3_3_112_2","doi-asserted-by":"publisher","DOI":"10.1145\/3411764.3445518"},{"key":"e_1_3_3_3_113_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3636268"},{"key":"e_1_3_3_3_114_2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-67268-2_1"},{"key":"e_1_3_3_3_115_2","first-page":"28","volume-title":"EconPol Forum","author":"Savona Maria","year":"2024","unstructured":"Maria Savona. 2024. Data governance: Main challenges. In EconPol Forum , Vol.\u00a025. Munich: CESifo GmbH, 28\u201331."},{"key":"e_1_3_3_3_116_2","first-page":"0","volume-title":"Proceedings of the European conference on computer vision (ECCV) workshops","author":"Sbai Othman","year":"2018","unstructured":"Othman Sbai, Mohamed Elhoseiny, Antoine Bordes, Yann LeCun, and Camille Couprie. 2018. Design: Design inspiration from generative networks. In Proceedings of the European conference on computer vision (ECCV) workshops. 0\u20130."},{"key":"e_1_3_3_3_117_2","doi-asserted-by":"crossref","unstructured":"Morgan\u00a0Klaus Scheuerman Alex Hanna and Emily Denton. 2021. Do datasets have politics? Disciplinary values in computer vision dataset development. Proceedings of the ACM on Human-Computer Interaction 5 CSCW2 (2021) 1\u201337.","DOI":"10.1145\/3476058"},{"key":"e_1_3_3_3_118_2","doi-asserted-by":"publisher","unstructured":"Morgan\u00a0Klaus Scheuerman Alex Hanna and Emily Denton. 2021. Do Datasets Have Politics? Disciplinary Values in Computer Vision Dataset Development. Proc. ACM Hum.-Comput. Interact. 5 CSCW2 Article 317 (oct 2021) 37\u00a0pages. 10.1145\/3476058","DOI":"10.1145\/3476058"},{"key":"e_1_3_3_3_119_2","unstructured":"Johannes Schneider Rene Abraham and Christian Meske. 2024. Governance of generative artificial intelligence for companies. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2403.08802 (2024)."},{"key":"e_1_3_3_3_120_2","unstructured":"Uriel Singer Adam Polyak Thomas Hayes Xi Yin Jie An Songyang Zhang Qiyuan Hu Harry Yang Oron Ashual Oran Gafni et\u00a0al. 2022. Make-a-video: Text-to-video generation without text-video data. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2209.14792 (2022)."},{"key":"e_1_3_3_3_121_2","unstructured":"JoAnn Stonier Lauren Woodman Majed Alshammari Ren\u00e9e Cummings Nighat Dad Arti Garg Alberto\u00a0Giovanni Busetto Katherine Hsiao Maui Hudson Parminder\u00a0Jeet Singh et\u00a0al. 2023. Data Equity: Foundational Concepts for Generative AI. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2311.10741 (2023)."},{"key":"e_1_3_3_3_122_2","doi-asserted-by":"publisher","DOI":"10.1145\/3490099.3511119"},{"key":"e_1_3_3_3_123_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642160"},{"key":"e_1_3_3_3_124_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3641924"},{"key":"e_1_3_3_3_125_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.54"},{"key":"e_1_3_3_3_126_2","unstructured":"Xiangru Tang Qiao Jin Kunlun Zhu Tongxin Yuan Yichi Zhang Wangchunshu Zhou Meng Qu Yilun Zhao Jian Tang Zhuosheng Zhang et\u00a0al. 2024. Prioritizing safeguarding over autonomy: Risks of llm agents for science. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2402.04247 (2024)."},{"key":"e_1_3_3_3_127_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642902"},{"key":"e_1_3_3_3_128_2","unstructured":"TechRadar. 2023. Samsung Workers Made a Major Error by Using ChatGPT. Online article. https:\/\/www.techradar.com\/news\/samsung-workers-leaked-company-secrets-by-using-chatgpt Accessed: 2025-02-06."},{"key":"e_1_3_3_3_129_2","unstructured":"D Thakkar. 2024. Towards examining Human-AI collaboration across the AI pipeline. Ph.\u00a0D. Dissertation. City University of London."},{"key":"e_1_3_3_3_130_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3501868"},{"key":"e_1_3_3_3_131_2","doi-asserted-by":"crossref","unstructured":"Angharad\u00a0N Valdivia. 2018. Algorithms of oppression: how search engines reinforce racism by Safiya Umoja Noble. Feminist Formations 30 3 (2018) 217\u2013220.","DOI":"10.1353\/ff.2018.0050"},{"key":"e_1_3_3_3_132_2","doi-asserted-by":"crossref","unstructured":"Quentin Vanhaelen Yen-Chu Lin and Alex Zhavoronkov. 2020. The advent of generative chemistry. ACS Medicinal Chemistry Letters 11 8 (2020) 1496\u20131505.","DOI":"10.1021\/acsmedchemlett.0c00088"},{"key":"e_1_3_3_3_133_2","doi-asserted-by":"publisher","unstructured":"April\u00a0Yi Wang Dakuo Wang Jaimie Drozdal Michael Muller Soya Park Justin\u00a0D. Weisz Xuye Liu Lingfei Wu and Casey Dugan. 2022. Documentation Matters: Human-Centered AI System to Assist Data Science Code Documentation in Computational Notebooks. ACM Trans. Comput.-Hum. Interact. 29 2 Article 17 (jan 2022) 33\u00a0pages. 10.1145\/3489465","DOI":"10.1145\/3489465"},{"key":"e_1_3_3_3_134_2","doi-asserted-by":"publisher","DOI":"10.1145\/3491102.3502121"},{"key":"e_1_3_3_3_135_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.754"},{"key":"e_1_3_3_3_136_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-naacl.235"},{"key":"e_1_3_3_3_137_2","unstructured":"Jason Wei Yi Tay Rishi Bommasani Colin Raffel Barret Zoph Sebastian Borgeaud Dani Yogatama Maarten Bosma Denny Zhou Donald Metzler et\u00a0al. 2022. Emergent abilities of large language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2206.07682 (2022)."},{"key":"e_1_3_3_3_138_2","unstructured":"Laura Weidinger John Mellor Maribeth Rauh Conor Griffin Jonathan Uesato Po-Sen Huang Myra Cheng Mia Glaese Borja Balle Atoosa Kasirzadeh et\u00a0al. 2021. Ethical and social risks of harm from language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2112.04359 (2021)."},{"key":"e_1_3_3_3_139_2","unstructured":"Laura Weidinger Maribeth Rauh Nahema Marchal Arianna Manzini Lisa\u00a0Anne Hendricks Juan Mateos-Garcia Stevie Bergman Jackie Kay Conor Griffin Ben Bariach Iason Gabriel Verena Rieser and William Isaac. 2023. Sociotechnical Safety Evaluation of Generative AI Systems. arxiv:https:\/\/arXiv.org\/abs\/2310.11986\u00a0[cs.AI] https:\/\/arxiv.org\/abs\/2310.11986"},{"key":"e_1_3_3_3_140_2","doi-asserted-by":"publisher","DOI":"10.1145\/3531146.3533088"},{"key":"e_1_3_3_3_141_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642466"},{"key":"e_1_3_3_3_142_2","unstructured":"Justin\u00a0D. Weisz Michael Muller Jessica He and Stephanie Houde. 2023. Toward General Design Principles for Generative AI Applications. arxiv:https:\/\/arXiv.org\/abs\/2301.05578\u00a0[cs.HC] https:\/\/arxiv.org\/abs\/2301.05578"},{"key":"e_1_3_3_3_143_2","doi-asserted-by":"publisher","DOI":"10.1145\/3630106.3659002"},{"key":"e_1_3_3_3_144_2","doi-asserted-by":"publisher","unstructured":"David\u00a0Gray Widder and Dawn Nafus. 2023. Dislocated accountabilities in the \u201cAI supply chain\u201d: Modularity and developers\u2019 notions of responsibility. Big Data & Society 10 1 (2023) 20539517231177620. 10.1177\/20539517231177620 arXiv:10.1177\/20539517231177620","DOI":"10.1177\/20539517231177620"},{"key":"e_1_3_3_3_145_2","doi-asserted-by":"publisher","DOI":"10.1145\/3593013.3594072"},{"key":"e_1_3_3_3_146_2","doi-asserted-by":"crossref","unstructured":"Richmond\u00a0Y Wong Michael\u00a0A Madaio and Nick Merrill. 2023. Seeing like a toolkit: How toolkits envision the work of AI ethics. Proceedings of the ACM on Human-Computer Interaction 7 CSCW1 (2023) 1\u201327.","DOI":"10.1145\/3579621"},{"key":"e_1_3_3_3_147_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613904.3642700"},{"key":"e_1_3_3_3_148_2","doi-asserted-by":"publisher","DOI":"10.1145\/3613905.3636302"},{"key":"e_1_3_3_3_149_2","doi-asserted-by":"crossref","unstructured":"Khensani Xivuri and Hosanna Twinomurinzi. 2023. How AI developers can assure algorithmic fairness. Discover Artificial Intelligence 3 1 (2023) 27.","DOI":"10.1007\/s44163-023-00074-4"},{"key":"e_1_3_3_3_150_2","doi-asserted-by":"crossref","unstructured":"Ruihan Yang Prakhar Srivastava and Stephan Mandt. 2023. Diffusion probabilistic modeling for video generation. Entropy 25 10 (2023) 1469.","DOI":"10.3390\/e25101469"},{"key":"e_1_3_3_3_151_2","doi-asserted-by":"crossref","unstructured":"Amy\u00a0X Zhang Michael Muller and Dakuo Wang. 2020. How do data science workers collaborate? roles workflows and tools. Proceedings of the ACM on Human-Computer Interaction 4 CSCW1 (2020) 1\u201323.","DOI":"10.1145\/3392826"},{"key":"e_1_3_3_3_152_2","unstructured":"Dawen Zhang Boming Xia Yue Liu Xiwei Xu Thong Hoang Zhenchang Xing Mark Staples Qinghua Lu and Liming Zhu. 2023. Navigating privacy and copyright challenges across the data lifecycle of generative ai. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2311.18252 (2023)."},{"key":"e_1_3_3_3_153_2","unstructured":"Qiang Zhang Keyang Ding Tianwen Lyv Xinda Wang Qingyu Yin Yiwen Zhang Jing Yu Yuhao Wang Xiaotong Li Zhuoyi Xiang Kehua Feng Xiang Zhuang Zeyuan Wang Ming Qin Mengyao Zhang Jinlu Zhang Jiyu Cui Tao Huang Pengju Yan Renjun Xu Hongyang Chen Xiaolin Li Xiaohui Fan Huabin Xing and Huajun Chen. 2024. Scientific Large Language Models: A Survey on Biological and Chemical Domains. arxiv:https:\/\/arXiv.org\/abs\/2401.14656\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2401.14656"},{"key":"e_1_3_3_3_154_2","series-title":"Proceedings of Machine Learning Research","first-page":"60644","volume-title":"Proceedings of the 41st International Conference on Machine Learning","volume":"235","author":"Zhao Dora","year":"2024","unstructured":"Dora Zhao, Jerone Andrews, Orestis Papakyriakopoulos, and Alice Xiang. 2024. Position: Measure Dataset Diversity, Don\u2019t Just Claim It. In Proceedings of the 41st International Conference on Machine Learning(Proceedings of Machine Learning Research, Vol.\u00a0235), Ruslan Salakhutdinov, Zico Kolter, Katherine Heller, Adrian Weller, Nuria Oliver, Jonathan Scarlett, and Felix Berkenkamp (Eds.). PMLR, 60644\u201360673. https:\/\/proceedings.mlr.press\/v235\/zhao24a.html"},{"key":"e_1_3_3_3_155_2","unstructured":"Dora Zhao Morgan\u00a0Klaus Scheuerman Pooja Chitre Jerone\u00a0TA Andrews Georgia Panagiotidou Shawn Walker Kathleen\u00a0H Pine and Alice Xiang. 2024. A Taxonomy of Challenges to Curating Fair Datasets. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2406.06407 (2024)."},{"key":"e_1_3_3_3_156_2","unstructured":"Wayne\u00a0Xin Zhao Kun Zhou Junyi Li Tianyi Tang Xiaolei Wang Yupeng Hou Yingqian Min Beichen Zhang Junjie Zhang Zican Dong Yifan Du Chen Yang Yushuo Chen Zhipeng Chen Jinhao Jiang Ruiyang Ren Yifan Li Xinyu Tang Zikang Liu Peiyu Liu Jian-Yun Nie and Ji-Rong Wen. 2023. A Survey of Large Language Models. arxiv:https:\/\/arXiv.org\/abs\/2303.18223\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2303.18223"},{"key":"e_1_3_3_3_157_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i17.29946"}],"event":{"name":"CHI 2025: CHI Conference on Human Factors in Computing Systems","location":"Yokohama Japan","acronym":"CHI '25","sponsor":["SIGCHI ACM Special Interest Group on Computer-Human Interaction"]},"container-title":["Proceedings of the 2025 CHI Conference on Human Factors in Computing Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3706598.3714069","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3706598.3714069","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,4]],"date-time":"2025-07-04T05:16:31Z","timestamp":1751606191000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3706598.3714069"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,25]]},"references-count":156,"alternative-id":["10.1145\/3706598.3714069","10.1145\/3706598"],"URL":"https:\/\/doi.org\/10.1145\/3706598.3714069","relation":{},"subject":[],"published":{"date-parts":[[2025,4,25]]},"assertion":[{"value":"2025-04-25","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}