{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,3]],"date-time":"2026-03-03T17:01:33Z","timestamp":1772557293848,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":104,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,6,20]],"date-time":"2022-06-20T00:00:00Z","timestamp":1655683200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Alfred. P Sloan Foundation"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,6,21]]},"DOI":"10.1145\/3531146.3533086","type":"proceedings-article","created":{"date-parts":[[2022,6,20]],"date-time":"2022-06-20T14:27:10Z","timestamp":1655735230000},"page":"199-212","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":10,"title":["A Framework for Deprecating Datasets: Standardizing Documentation, Identification, and Communication"],"prefix":"10.1145","author":[{"given":"Alexandra Sasha","family":"Luccioni","sequence":"first","affiliation":[{"name":"Hugging Face, Canada"}]},{"given":"Frances","family":"Corry","sequence":"additional","affiliation":[{"name":"University of Southern California, USA"}]},{"given":"Hamsini","family":"Sridharan","sequence":"additional","affiliation":[{"name":"University of Southern California, USA"}]},{"given":"Mike","family":"Ananny","sequence":"additional","affiliation":[{"name":"University of Southern California, USA"}]},{"given":"Jason","family":"Schultz","sequence":"additional","affiliation":[{"name":"New York University, USA"}]},{"given":"Kate","family":"Crawford","sequence":"additional","affiliation":[{"name":"University of Southern California, USA and Microsoft Research, USA"}]}],"member":"320","published-online":{"date-parts":[[2022,6,20]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Authors Guild v. Google","year":"2007","unstructured":"[n.d.]. Authors Guild v. Google, Inc.804 F. 3d 202, 2d Cir. 2007([n. d.])."},{"key":"e_1_3_2_1_2_1","unstructured":"[n.d.]. AV Ex Rel. Vanderhye v. iParadigms LLC. 804 F. 3d 202 2d Cir. 2007([n. d.])."},{"key":"e_1_3_2_1_3_1","unstructured":"[n.d.]. Perfect 10 Inc. v. Amazon. com Inc.508 F. 3d 1146 9th Cir. 2007([n. d.])."},{"key":"e_1_3_2_1_4_1","volume-title":"Thornley v. Clearview AI","unstructured":"[n.d.]. Thornley v. Clearview AI, Inc.984 F. 20-3249, Court of Appeals, 7th Circuit ([n. d.])."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/UBMK.2019.8907181"},{"key":"e_1_3_2_1_6_1","volume-title":"Documentation Debt","author":"Bandy Jack","year":"2021","unstructured":"Jack Bandy and Nicholas Vincent. 2021. Addressing\u201d Documentation Debt\u201d in Machine Learning Research: A Retrospective Datasheet for BookCorpus. arXiv preprint arXiv:2105.05241(2021)."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11192-018-2802-y"},{"key":"e_1_3_2_1_8_1","volume-title":"9th Annual Conference of the Special Interest Group for Computing, Information and Society.","author":"Barocas Solon","year":"2017","unstructured":"Solon Barocas, Kate Crawford, Aaron Shapiro, and Hanna Wallach. 2017. The problem with bias: Allocative versus representational harms in machine learning. In 9th Annual Conference of the Special Interest Group for Computing, Information and Society."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.3390\/jimaging6060041"},{"key":"e_1_3_2_1_10_1","unstructured":"Thomas Baumhauer Pascal Sch\u00f6ttle and Matthias Zeppelzauer. 2020. Machine unlearning: Linear filtration for logit-based classifiers. arXiv preprint arXiv:2002.02730(2020)."},{"key":"e_1_3_2_1_11_1","unstructured":"Misha Benjamin Paul Gagnon Negar Rostamzadeh Chris Pal Yoshua Bengio and Alex Shee. 2019. Towards standardization of data licenses: The montreal data license. arXiv preprint arXiv:1903.12262(2019)."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/JCDL52503.2021.00077"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.pubrev.2020.101975"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/SP40001.2021.00019"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.5555\/380681"},{"key":"e_1_3_2_1_16_1","volume-title":"Microsoft Pulls Open Facial Recognition Dataset after Financial Times Investigation. The Verge","author":"Brandom Russel","year":"2019","unstructured":"Russel Brandom. 2019. Microsoft Pulls Open Facial Recognition Dataset after Financial Times Investigation. The Verge (2019)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00628"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1177\/2053951720983865"},{"key":"e_1_3_2_1_19_1","volume-title":"Conference on fairness, accountability and transparency. PMLR, 77\u201391","author":"Buolamwini Joy","year":"2018","unstructured":"Joy Buolamwini and Timnit Gebru. 2018. Gender shades: Intersectional accuracy disparities in commercial gender classification. In Conference on fairness, accountability and transparency. PMLR, 77\u201391."},{"key":"e_1_3_2_1_20_1","first-page":"283","article-title":"Algorithmic fair use","volume":"86","author":"Burk L","year":"2019","unstructured":"Dan\u00a0L Burk. 2019. Algorithmic fair use. The University of Chicago Law Review 86 (2019), 283.","journal-title":"The University of Chicago Law Review"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/SP.2015.35"},{"key":"e_1_3_2_1_22_1","unstructured":"Nicholas Carlini Florian Tramer Eric Wallace Matthew Jagielski Ariel Herbert-Voss Katherine Lee Adam Roberts Tom Brown Dawn Song Ulfar Erlingsson 2020. Extracting training data from large language models. arXiv preprint arXiv:2012.07805(2020)."},{"key":"e_1_3_2_1_23_1","volume-title":"Facebook will pay $550 million to settle class action lawsuit over privacy violations. TechCrunch","author":"Coldewey D.","year":"2020","unstructured":"D. Coldewey. 2020. Facebook will pay $550 million to settle class action lawsuit over privacy violations. TechCrunch (2020)."},{"key":"e_1_3_2_1_24_1","unstructured":"Federal\u00a0Trade Commission. 2021. FTC Finalizes Settlement with Photo App Developer Related to Misuse of Facial Recognition Technology.Federal Trade Commission(2021). Available at: https:\/\/www.ftc.gov\/news-events\/press-releases\/2021\/05\/ftc-finalizes-settlement-photo-app-developer-related-misuse."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-52581-1_18"},{"key":"e_1_3_2_1_26_1","volume-title":"Yahoo! Answers is shutting down and taking a record of my teenage self with it. Los Angeles Times","author":"Corry Frances","year":"2021","unstructured":"Frances Corry. 2021. Op-Ed: Yahoo! Answers is shutting down and taking a record of my teenage self with it. Los Angeles Times (2021). Available at: https:\/\/www.latimes.com\/opinion\/story\/2021-05-04\/yahoo-answers-shut-down-social-platforms."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","unstructured":"Frances Corry. 2021. Why does a platform die? Diagnosing platform death at Friendster\u2019s end.Internet Histories. (2021). Available at: https:\/\/doi.org\/10.1080\/24701475.2021.1985360.","DOI":"10.1080\/24701475.2021.1985360"},{"key":"e_1_3_2_1_28_1","volume-title":"More work for mother","author":"Ruth\u00a0Schwartz","unstructured":"Ruth\u00a0Schwartz Cowan 1983. More work for mother. Basic Books."},{"key":"e_1_3_2_1_29_1","volume-title":"Atlas of AI : Power, Politics, and the Planetary Costs of Artificial Intelligence","author":"Crawford Kate","unstructured":"Kate Crawford. 2021. Atlas of AI : Power, Politics, and the Planetary Costs of Artificial Intelligence. Yale University Press."},{"key":"e_1_3_2_1_30_1","unstructured":"Kate Crawford and Trevor Paglen. 2019. Excavating AI : The politics of training sets for machine learning. https:\/\/www.excavating.ai."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1177\/20539517211035955"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"crossref","unstructured":"Jesse Dodge Maarten Sap Ana Marasovi\u0107 William Agnew Gabriel Ilharco Dirk Groeneveld Margaret Mitchell and Matt Gardner. 2021. Documenting Large Webtext Corpora: A Case Study on the Colossal Clean Crawled Corpus. arXiv preprint arXiv:2104.08758(2021).","DOI":"10.18653\/v1\/2021.emnlp-main.98"},{"key":"e_1_3_2_1_34_1","unstructured":"Timnit Gebru Jamie Morgenstern Briana Vecchione Jennifer\u00a0Wortman Vaughan Hanna Wallach Hal Daum\u00e9\u00a0III and Kate Crawford. 2018. Datasheets for datasets. arXiv preprint arXiv:1803.09010(2018)."},{"key":"e_1_3_2_1_35_1","volume-title":"Raw data is an oxymoron","author":"Gitelman Lisa","unstructured":"Lisa Gitelman. 2013. Raw data is an oxymoron. MIT press."},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.24251\/HICSS.2019.258"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0044118"},{"key":"e_1_3_2_1_38_1","unstructured":"Mark Hahnel. 2012. All research outputs should be citable.Available at: https:\/\/figshare.com\/blog\/All+research+outputs+should+be+citable\/32."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"crossref","unstructured":"William\u00a0L Hamilton Jure Leskovec and Dan Jurafsky. 2016. Diachronic word embeddings reveal statistical laws of semantic change. arXiv preprint arXiv:1605.09096(2016).","DOI":"10.18653\/v1\/P16-1141"},{"key":"e_1_3_2_1_40_1","unstructured":"Karen Hao. 2021. Deleting unethical data sets isn\u2019t good enough.Available at https:\/\/www.technologyreview.com\/2021\/08\/13\/1031836\/ai-ethics-responsible-data-stewardship\/."},{"key":"e_1_3_2_1_41_1","unstructured":"Adam Harvey and Jules LaPlace. 2019. MegaPixels: Face Recognition Training Datasets. https:\/\/ahprojects.com\/megapixels."},{"key":"e_1_3_2_1_42_1","unstructured":"Adam Harvey and Jules LaPlace. 2021. Exposing AI. https:\/\/www.excavating.ai."},{"key":"e_1_3_2_1_43_1","volume-title":"How photos of your kids are powering surveillance technology. The New York Times","author":"Hill Kashmir","year":"2019","unstructured":"Kashmir Hill and Aaron Krolik. 2019. How photos of your kids are powering surveillance technology. The New York Times (2019)."},{"key":"e_1_3_2_1_44_1","volume-title":"Terms of inclusion: Data, discourse, violence","author":"Hoffmann Anna\u00a0Lauren","year":"2020","unstructured":"Anna\u00a0Lauren Hoffmann. 2020. Terms of inclusion: Data, discourse, violence. New Media & Society(2020), 1461444820958725."},{"key":"e_1_3_2_1_45_1","volume-title":"Art Manion, and Chris King","author":"Householder D","year":"2017","unstructured":"Allen\u00a0D Householder, Garret Wassermann, Art Manion, and Chris King. 2017. The CERT guide to coordinated vulnerability disclosure. Technical Report. Carnegie-Mellon Univ Pittsburgh Pa Pittsburgh United States."},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"crossref","unstructured":"Ben Hutchinson Vinodkumar Prabhakaran Emily Denton Kellie Webster Yu Zhong and Stephen Denuyl. 2020. Social biases in NLP models as barriers for persons with disabilities. arXiv preprint arXiv:2005.00813(2020).","DOI":"10.18653\/v1\/2020.acl-main.487"},{"key":"e_1_3_2_1_47_1","unstructured":"iSight. 2021. A Practical Guide to Data Privacy Laws by Country [2021]. Available at: https:\/\/www.i-sight.com\/resources\/a-practical-guide-to-data-privacy-laws-by-country\/."},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"crossref","unstructured":"Steven\u00a0J Jackson. 2017. Speed time infrastructure. The Sociology of Speed: Digital Organizational and Social Temporalities 169(2017).","DOI":"10.1093\/acprof:oso\/9780198782858.003.0012"},{"key":"e_1_3_2_1_49_1","volume-title":"Data Lives: How Data Are Made and Shape Our World","author":"Kitchin Rob","year":"2021","unstructured":"Rob Kitchin. 2021. Data Lives: How Data Are Made and Shape Our World. Policy Press."},{"key":"e_1_3_2_1_50_1","unstructured":"Bernard Koch Emily Denton Alex Hanna and Jacob\u00a0G Foster. 2021. Reduced Reused and Recycled: The Life of a Dataset in Machine Learning Research. NeurIPS 2021 Datasets and Benchmarks Track(2021)."},{"key":"e_1_3_2_1_51_1","unstructured":"Alex Krizhevsky Geoffrey Hinton 2009. Learning multiple layers of features from tiny images. (2009)."},{"key":"e_1_3_2_1_52_1","unstructured":"Andrey Kutuzov Lilja \u00d8vrelid Terrence Szymanski and Erik Velldal. 2018. Diachronic word embeddings and semantic shifts: a survey. arXiv preprint arXiv:1806.03537(2018)."},{"key":"e_1_3_2_1_53_1","unstructured":"Katherine Lee Daphne Ippolito Andrew Nystrom Chiyuan Zhang Douglas Eck Chris Callison-Burch and Nicholas Carlini. 2021. Deduplicating training data makes language models better. arXiv preprint arXiv:2107.06499(2021)."},{"key":"e_1_3_2_1_54_1","first-page":"579","article-title":"How copyright law can fix artificial intelligence\u2019s implicit bias problem","volume":"93","author":"Levendowski Amanda","year":"2018","unstructured":"Amanda Levendowski. 2018. How copyright law can fix artificial intelligence\u2019s implicit bias problem. Wash. L. Rev. 93(2018), 579.","journal-title":"Wash. L. Rev."},{"key":"e_1_3_2_1_55_1","volume-title":"Head Detection Method for Indoor Scene. In Theoretical Computer Science: 38th National Conference, NCTCS 2020","author":"Li Zhi","year":"2021","unstructured":"Zhi Li, Yong Li, and Xipeng Wang. 2021. Head Detection Method for Indoor Scene. In Theoretical Computer Science: 38th National Conference, NCTCS 2020, Nanning, China, November 13\u201315, 2020, Revised Selected Papers. Springer, 139\u2013146."},{"key":"e_1_3_2_1_56_1","doi-asserted-by":"publisher","DOI":"10.3390\/electronics10131565"},{"key":"e_1_3_2_1_57_1","doi-asserted-by":"crossref","unstructured":"Alexandra\u00a0Sasha Luccioni and Joseph\u00a0D Viviano. 2021. What\u2019s in the Box? An Analysis of Undesirable Content in the Common Crawl Corpus. arXiv preprint arXiv:2105.02732(2021).","DOI":"10.18653\/v1\/2021.acl-short.24"},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1145\/3313831.3376445"},{"key":"e_1_3_2_1_59_1","doi-asserted-by":"publisher","DOI":"10.1177\/0306312715602073"},{"key":"e_1_3_2_1_60_1","volume-title":"How Might AI Label You. The New York Times","author":"Metz Cade","year":"2019","unstructured":"Cade Metz. 2019. \u2019Nerd\u2019, \u2019Nonsmoker,\u2019 \u2019Wrongdoer\u2019 : How Might AI Label You. The New York Times (2019). Available at: https:\/\/www.nytimes.com\/2019\/09\/20\/arts\/design\/imagenet-trevor-paglen-ai-facial-recognition.html."},{"key":"e_1_3_2_1_61_1","volume-title":"European privacy activists launch international assault on Clearview AI \u2019s facial recognition service. Fortune","author":"Meyer D","year":"2021","unstructured":"D Meyer. 2021. European privacy activists launch international assault on Clearview AI \u2019s facial recognition service. Fortune (2021). Available at: https:\/\/fortune.com\/2021\/05\/27\/europe-clearview-ai-gdpr-complaints-privacy\/."},{"key":"e_1_3_2_1_62_1","volume-title":"MS-Celeb-1M: A Dataset and Benchmark for Large-Scale Face Recognition","year":"2019","unstructured":"Microsoft. 2019. MS-Celeb-1M: A Dataset and Benchmark for Large-Scale Face Recognition. Academic Torrents (2019). Available at: https:\/\/academictorrents.com\/details\/9e67eb7cc23c9417f39778a8e06cca5e26196a97."},{"key":"e_1_3_2_1_63_1","doi-asserted-by":"publisher","DOI":"10.1093\/ijl\/3.4.235"},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1145\/3287560.3287596"},{"key":"e_1_3_2_1_66_1","volume-title":"Microsoft quietly deletes largest public face recognition data set. Financial Times","author":"Murgia Madhumita","year":"2019","unstructured":"Madhumita Murgia. 2019. Microsoft quietly deletes largest public face recognition data set. Financial Times (2019). Available at: https:\/\/www.ft.com\/content\/7d3e0d6a-87a0-11e9-a028-86cea8523dc2."},{"key":"e_1_3_2_1_67_1","volume-title":"Who\u2019s using your face? The ugly truth about facial recognition. Financial Times","author":"Murgia Madhumita","year":"2019","unstructured":"Madhumita Murgia and Max Harlow. 2019. Who\u2019s using your face? The ugly truth about facial recognition. Financial Times (2019)."},{"key":"e_1_3_2_1_68_1","volume-title":"Pervasive label errors in test sets destabilize machine learning benchmarks. arXiv pre-print 2103.14749","author":"Northcutt G.","year":"2021","unstructured":"Curtis\u00a0G. Northcutt, Anish Athalye, and Jonas Mueller. 2021. Pervasive label errors in test sets destabilize machine learning benchmarks. arXiv pre-print 2103.14749 (2021), 1\u201324. https:\/\/arxiv.org\/abs\/2103.14749."},{"key":"e_1_3_2_1_69_1","unstructured":"Information\u00a0Commissioner\u2019s Office.2020. The Office of the Australian Information Commissioner and the UK\u2019s Information Commissioner\u2019s Office open joint investigation into Clearview AI Inc.Available at: https:\/\/ico.org.uk\/about-the-ico\/news-and-events\/news-and-blogs\/2020\/07\/oaic-and-ico-open-joint-investigation-into-clearview-ai-inc\/."},{"key":"e_1_3_2_1_70_1","unstructured":"L Pascu. 2020. California residents file class action against Clearview AI biometric data collection citing CCPA. Available at: https:\/\/www.biometricupdate.com\/202003\/california-residents-file-class-action-against-clearview-ai-biometric-data-collection-citing-ccpa."},{"key":"e_1_3_2_1_71_1","volume-title":"Digital object identifier (DOI\u00ae) system. Encyclopedia of library and information sciences 3","author":"Paskin Norman","year":"2010","unstructured":"Norman Paskin. 2010. Digital object identifier (DOI\u00ae) system. Encyclopedia of library and information sciences 3 (2010), 1586\u20131592."},{"key":"e_1_3_2_1_72_1","doi-asserted-by":"crossref","unstructured":"Amandalynne Paullada Inioluwa\u00a0Deborah Raji Emily\u00a0M Bender Emily Denton and Alex Hanna. 2020. Data and its (dis) contents: A survey of dataset development and use in machine learning research. arXiv preprint arXiv:2012.05345(2020).","DOI":"10.1016\/j.patter.2021.100336"},{"key":"e_1_3_2_1_73_1","volume-title":"But It\u2019s Not Dead.VICE","author":"Pearson J","year":"2019","unstructured":"J Pearson. 2019. Microsoft Deleted a Massive Facial Recognition Database, But It\u2019s Not Dead.VICE (2019). Available at: https:\/\/www.vice.com\/en\/article\/a3x4mp\/microsoft-deleted-a-facial-recognition-database-but-its-not-dead."},{"key":"e_1_3_2_1_74_1","unstructured":"Kenny Peng Arunesh Mathur and Arvind Narayanan. 2021. Mitigating dataset harms requires stewardship: Lessons from 1000 papers. arXiv preprint arXiv:2108.02922(2021)."},{"key":"e_1_3_2_1_75_1","unstructured":"Vinay\u00a0Uday Prabhu and Abeba Birhane. 2020. Large image datasets: A pyrrhic win for computer vision?arXiv preprint arXiv:2006.16923(2020)."},{"key":"e_1_3_2_1_76_1","doi-asserted-by":"publisher","DOI":"10.1177\/0306312710380301"},{"key":"e_1_3_2_1_77_1","unstructured":"Colin Raffel Noam Shazeer Adam Roberts Katherine Lee Sharan Narang Michael Matena Yanqi Zhou Wei Li and Peter\u00a0J Liu. 2019. Exploring the limits of transfer learning with a unified text-to-text transformer. arXiv preprint arXiv:1910.10683(2019)."},{"key":"e_1_3_2_1_78_1","doi-asserted-by":"publisher","DOI":"10.1145\/3375627.3375820"},{"key":"e_1_3_2_1_79_1","volume-title":"Resist Fund v","author":"Renderos Steven","unstructured":"Steven Renderos, Valeria\u00a0Thais Suarez\u00a0Rojas, Reyna Maldonado, Lisa Knox, and Mijente\u00a0Support Committee. [n.d.]. Resist Fund v. Clearview AI Inc."},{"key":"e_1_3_2_1_80_1","doi-asserted-by":"crossref","unstructured":"Microsoft Research. 2016. MS-Celeb-1M: Challenge of Recognizing One Million Celebrities in the Real World.(2016). Available at: https:\/\/www.microsoft.com\/en-us\/research\/project\/ms-celeb-1m-challenge-recognizing-one-million-celebrities-real-world\/.","DOI":"10.2352\/ISSN.2470-1173.2016.11.IMAWM-463"},{"key":"e_1_3_2_1_81_1","doi-asserted-by":"crossref","unstructured":"Microsoft Research. 2016. MS-Celeb-1M: Challenge of Recognizing One Million Celebrities in the Real World. (2016). Available at: https:\/\/www.msceleb.org\/.","DOI":"10.2352\/ISSN.2470-1173.2016.11.IMAWM-463"},{"key":"e_1_3_2_1_82_1","unstructured":"C. Rizzi. 2021. Google Microsoft Amazon FaceFirst Hit with Biometric Privacy Class Actions Centered on IBM\u2019s \u2018Diversity in Faces\u2019 Dataset.Available at: https:\/\/www.classaction.org\/news\/google-microsoft-amazon-facefirst-hit-with-biometric-privacy-class-actions-centered-on-ibms-diversity-in-faces-dataset."},{"key":"e_1_3_2_1_83_1","volume-title":"Towards tracking semantic change by visual analytics","author":"Rohrdantz Christian","unstructured":"Christian Rohrdantz, Annette Hautli, Thomas Mayer, Miriam Butt, Daniel Keim, and Frans Plank. 2011. Towards tracking semantic change by visual analytics. In Association for Computational Linguistics. 305\u2013310."},{"key":"e_1_3_2_1_84_1","volume-title":"Leading online database to remove 600,000 images after art project reveals its racist bias. The Art Newspaper","author":"Ruiz Christina","year":"2019","unstructured":"Christina Ruiz. 2019. Leading online database to remove 600,000 images after art project reveals its racist bias. The Art Newspaper (2019), 23."},{"key":"e_1_3_2_1_85_1","doi-asserted-by":"publisher","DOI":"10.1353\/tech.2018.0004"},{"key":"e_1_3_2_1_86_1","volume-title":"International Conference on Machine Learning. PMLR, 8326\u20138335","author":"Sablayrolles Alexandre","year":"2020","unstructured":"Alexandre Sablayrolles, Matthijs Douze, Cordelia Schmid, and Herv\u00e9 J\u00e9gou. 2020. Radioactive data: tracing through training. In International Conference on Machine Learning. PMLR, 8326\u20138335."},{"key":"e_1_3_2_1_87_1","volume-title":"Data Cascades in High-Stakes AI. In proceedings of the 2021 CHI Conference on Human Factors in Computing Systems. 1\u201315","author":"Sambasivan Nithya","year":"2021","unstructured":"Nithya Sambasivan, Shivani Kapania, Hannah Highfill, Diana Akrong, Praveen Paritosh, and Lora\u00a0M Aroyo. 2021. \u201cEveryone wants to do the model work, not the data work\u201d: Data Cascades in High-Stakes AI. In proceedings of the 2021 CHI Conference on Human Factors in Computing Systems. 1\u201315."},{"key":"e_1_3_2_1_88_1","unstructured":"Christian Sandvig Kevin Hamilton Karrie Karahalios and Cedric Langbort. 2014. Auditing algorithms: Research methods for detecting discrimination on internet platforms. Data and discrimination: converting critical concerns into productive inquiry 22(2014) 4349\u20134357."},{"key":"e_1_3_2_1_89_1","volume-title":"Faces","author":"Satisky Jake","year":"2019","unstructured":"Jake Satisky. 2019. A Duke Study Recorded Thousands of Students\u2019 Faces; Now They\u2019re Being Used All over the World. The Chronicle (2019)."},{"key":"e_1_3_2_1_90_1","doi-asserted-by":"publisher","DOI":"10.1145\/3476058"},{"key":"e_1_3_2_1_91_1","volume-title":"International Data Privacy Law 21","author":"Schwartz P","year":"2019","unstructured":"P Schwartz and K Peifer. 2019. Structuring International Data Privacy Law. International Data Privacy Law 21 (2019)."},{"key":"e_1_3_2_1_92_1","unstructured":"Shreya Shankar Yoni Halpern Eric Breck James Atwood Jimbo Wilson and D Sculley. 2017. No classification without representation: Assessing geodiversity issues in open data sets for the developing world. arXiv preprint arXiv:1711.08536(2017)."},{"key":"e_1_3_2_1_93_1","unstructured":"David\u00a0Marco Sommer Liwei Song Sameer Wagh and Prateek Mittal. 2020. Towards probabilistic verification of machine unlearning. arXiv preprint arXiv:2003.04247(2020)."},{"key":"e_1_3_2_1_94_1","volume-title":"Data is the new what? Popular metaphors & professional ethics in emerging data culture. SocArXiv","author":"Stark Luke","year":"2019","unstructured":"Luke Stark and Anna\u00a0Lauren Hoffmann. 2019. Data is the new what? Popular metaphors & professional ethics in emerging data culture. SocArXiv (2019)."},{"key":"e_1_3_2_1_95_1","volume-title":"Letter: Video analysis research at Duke.The Chronicle.","author":"Tomasi Carlo","year":"2019","unstructured":"Carlo Tomasi. 2019. Letter: Video analysis research at Duke.The Chronicle. (2019). Available at: https:\/\/www.dukechronicle.com\/article\/2019\/06\/duke-university-video-analysis-research-at-duke-carlo-tomasi."},{"key":"e_1_3_2_1_96_1","unstructured":"A. Torralba R. Fergus and B. Freeman. 2020. 80 Million Tiny Images (Dataset Removal Notice).(2020). Available at: http:\/\/groups.csail.mit.edu\/vision\/TinyImages\/."},{"key":"e_1_3_2_1_97_1","unstructured":"GRAIL University\u00a0of Washington. 2015. MegaFace and MF2: Million-Scale Face Recognition. Available at: http:\/\/megaface.cs.washington.edu\/."},{"key":"e_1_3_2_1_98_1","doi-asserted-by":"publisher","DOI":"10.9785\/cri-2021-220402"},{"key":"e_1_3_2_1_99_1","volume-title":"Transgender YouTubers had their videos grabbed to train facial recognition software. The Verge","author":"Vincent James","year":"2017","unstructured":"James Vincent. 2017. Transgender YouTubers had their videos grabbed to train facial recognition software. The Verge (2017). Available at: https:\/\/www.theverge.com\/2017\/8\/22\/16180080\/transgender-youtubers-ai-facial-recognition-dataset."},{"key":"e_1_3_2_1_100_1","unstructured":"Lee Vinsel and Andrew\u00a0L Russell. 2020. The innovation delusion: How our obsession with the new has disrupted the work that matters most. Currency."},{"key":"e_1_3_2_1_101_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2956775"},{"key":"e_1_3_2_1_102_1","doi-asserted-by":"publisher","DOI":"10.1145\/3351095.3375709"},{"key":"e_1_3_2_1_103_1","unstructured":"Kaiyu Yang Jacqueline Yau Li Fei-Fei Jia Deng and Olga Russakovsky. 2021. A Study of Face Obfuscation in ImageNet. arXiv preprint arXiv:2103.06191v2(2021)."},{"key":"e_1_3_2_1_104_1","doi-asserted-by":"publisher","DOI":"10.1145\/3372297.3417880"},{"key":"e_1_3_2_1_105_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.7000"}],"event":{"name":"FAccT '22: 2022 ACM Conference on Fairness, Accountability, and Transparency","location":"Seoul Republic of Korea","acronym":"FAccT '22","sponsor":["ACM Association for Computing Machinery"]},"container-title":["2022 ACM Conference on Fairness Accountability and Transparency"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3531146.3533086","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3531146.3533086","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T19:02:10Z","timestamp":1750186930000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3531146.3533086"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,6,20]]},"references-count":104,"alternative-id":["10.1145\/3531146.3533086","10.1145\/3531146"],"URL":"https:\/\/doi.org\/10.1145\/3531146.3533086","relation":{},"subject":[],"published":{"date-parts":[[2022,6,20]]},"assertion":[{"value":"2022-06-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}