{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,30]],"date-time":"2026-06-30T06:32:28Z","timestamp":1782801148313,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":84,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,6,12]],"date-time":"2023-06-12T00:00:00Z","timestamp":1686528000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-sa\/4.0\/"}],"funder":[{"name":"NIST","award":["60NANB20D212T"],"award-info":[{"award-number":["60NANB20D212T"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,6,12]]},"DOI":"10.1145\/3593013.3594072","type":"proceedings-article","created":{"date-parts":[[2023,6,12]],"date-time":"2023-06-12T14:40:46Z","timestamp":1686580846000},"page":"1174-1185","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":32,"title":["Contrastive Language-Vision AI Models Pretrained on Web-Scraped Multimodal Data Exhibit Sexual Objectification Bias"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7133-695X","authenticated-orcid":false,"given":"Robert","family":"Wolfe","sequence":"first","affiliation":[{"name":"Information School, University of Washington, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-0136-6465","authenticated-orcid":false,"given":"Yiwei","family":"Yang","sequence":"additional","affiliation":[{"name":"Information School, University of Washington, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8588-8472","authenticated-orcid":false,"given":"Bill","family":"Howe","sequence":"additional","affiliation":[{"name":"Information School, University of Washington, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7154-8629","authenticated-orcid":false,"given":"Aylin","family":"Caliskan","sequence":"additional","affiliation":[{"name":"Information School, University of Washington, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2023,6,12]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Jong Wook Kim, and Miles Brundage","author":"Agarwal Sandhini","year":"2021","unstructured":"Sandhini Agarwal, Gretchen Krueger, Jack Clark, Alec Radford, Jong Wook Kim, and Miles Brundage. 2021. Evaluating CLIP: Towards Characterization of Broader Capabilities and Downstream Implications. arXiv preprint arXiv:2108.02818 (2021)."},{"key":"e_1_3_2_1_2_1","volume-title":"CM3: A Causal Masked Multimodal Model of the Internet. arXiv preprint arXiv:2201.07520","author":"Aghajanyan Armen","year":"2022","unstructured":"Armen Aghajanyan, Bernie Huang, Candace Ross, Vladimir Karpukhin, Hu Xu, Naman Goyal, Dmytro Okhonko, Mandar Joshi, Gargi Ghosh, Mike Lewis, 2022. CM3: A Causal Masked Multimodal Model of the Internet. arXiv preprint arXiv:2201.07520 (2022)."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10339-019-00927-w"},{"key":"e_1_3_2_1_4_1","volume-title":"Face-ism: Five studies of sex differences in facial prominence.Journal of Personality and social Psychology 45, 4","author":"Archer Dane","year":"1983","unstructured":"Dane Archer, Bonita Iritani, Debra D Kimes, and Michael Barrios. 1983. Face-ism: Five studies of sex differences in facial prominence.Journal of Personality and social Psychology 45, 4 (1983), 725."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1080\/15205436.2010.513468"},{"key":"e_1_3_2_1_6_1","volume-title":"Easily accessible text-to-image generation amplifies demographic stereotypes at large scale. arXiv preprint arXiv:2211.03759","author":"Bianchi Federico","year":"2022","unstructured":"Federico Bianchi, Pratyusha Kalluri, Esin Durmus, Faisal Ladhak, Myra Cheng, Debora Nozza, Tatsunori Hashimoto, Dan Jurafsky, James Zou, and Aylin Caliskan. 2022. Easily accessible text-to-image generation amplifies demographic stereotypes at large scale. arXiv preprint arXiv:2211.03759 (2022)."},{"key":"e_1_3_2_1_7_1","volume-title":"Vinay Uday Prabhu, and Emmanuel Kahembwe","author":"Birhane Abeba","year":"2021","unstructured":"Abeba Birhane, Vinay Uday Prabhu, and Emmanuel Kahembwe. 2021. Multimodal datasets: misogyny, pornography, and malignant stereotypes. arXiv preprint arXiv:2110.01963 (2021)."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV51458.2022.00158"},{"key":"e_1_3_2_1_9_1","volume-title":"Conference on fairness, accountability and transparency. PMLR, 77\u201391","author":"Buolamwini Joy","year":"2018","unstructured":"Joy Buolamwini and Timnit Gebru. 2018. Gender shades: Intersectional accuracy disparities in commercial gender classification. In Conference on fairness, accountability and transparency. PMLR, 77\u201391."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3514094.3534162"},{"key":"e_1_3_2_1_11_1","volume-title":"Semantics derived automatically from language corpora contain human-like biases. Science 356, 6334","author":"Caliskan Aylin","year":"2017","unstructured":"Aylin Caliskan, Joanna J Bryson, and Arvind Narayanan. 2017. Semantics derived automatically from language corpora contain human-like biases. Science 356, 6334 (2017), 183\u2013186."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"crossref","unstructured":"Rachel M Calogero. 2012. Objectification theory self-objectification and body image. (2012).","DOI":"10.1016\/B978-0-12-384925-0.00091-2"},{"key":"e_1_3_2_1_13_1","volume-title":"International Conference on Machine Learning. PMLR, 1691\u20131703","author":"Chen Mark","year":"2020","unstructured":"Mark Chen, Alec Radford, Rewon Child, Jeffrey Wu, Heewoo Jun, David Luan, and Ilya Sutskever. 2020. Generative pretraining from pixels. In International Conference on Machine Learning. PMLR, 1691\u20131703."},{"key":"e_1_3_2_1_14_1","volume-title":"Charles Sutton","author":"Chowdhery Aakanksha","year":"2022","unstructured":"Aakanksha Chowdhery, Sharan Narang, Jacob Devlin, Maarten Bosma, Gaurav Mishra, Adam Roberts, Paul Barham, Hyung Won Chung, Charles Sutton, Sebastian Gehrmann, 2022. Palm: Scaling language modeling with pathways. arXiv preprint arXiv:2204.02311 (2022)."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0102172"},{"key":"e_1_3_2_1_16_1","volume-title":"Statistical power analysis. Current directions in psychological science 1, 3","author":"Cohen Jacob","year":"1992","unstructured":"Jacob Cohen. 1992. Statistical power analysis. Current directions in psychological science 1, 3 (1992), 98\u2013101."},{"key":"e_1_3_2_1_17_1","volume-title":"VQGAN-CLIP: Open Domain Image Generation and Editing with Natural Language Guidance. arXiv preprint arXiv:2204.08583","author":"Crowson Katherine","year":"2022","unstructured":"Katherine Crowson, Stella Biderman, Daniel Kornis, Dashiell Stander, Eric Hallahan, Louis Castricato, and Edward Raff. 2022. VQGAN-CLIP: Open Domain Image Generation and Editing with Natural Language Guidance. arXiv preprint arXiv:2204.08583 (2022)."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.bodyim.2020.02.016"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"e_1_3_2_1_20_1","volume-title":"International Conference on Learning Representations.","author":"Dosovitskiy Alexey","year":"2020","unstructured":"Alexey Dosovitskiy, Lucas Beyer, Alexander Kolesnikov, Dirk Weissenborn, Xiaohua Zhai, Thomas Unterthiner, Mostafa Dehghani, Matthias Minderer, Georg Heigold, Sylvain Gelly, 2020. An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale. In International Conference on Learning Representations."},{"key":"e_1_3_2_1_21_1","volume-title":"Gender stereotypes and attitudes toward women and men. Personality and social psychology bulletin 15, 4","author":"Eagly Alice H","year":"1989","unstructured":"Alice H Eagly and Antonio Mladinic. 1989. Gender stereotypes and attitudes toward women and men. Personality and social psychology bulletin 15, 4 (1989), 543\u2013558."},{"key":"e_1_3_2_1_22_1","volume-title":"Are people prejudiced against women? Some answers from research on attitudes, gender stereotypes, and judgments of competence. European review of social psychology 5, 1","author":"Eagly Alice H","year":"1994","unstructured":"Alice H Eagly and Antonio Mladinic. 1994. Are people prejudiced against women? Some answers from research on attitudes, gender stereotypes, and judgments of competence. European review of social psychology 5, 1 (1994), 1\u201335."},{"key":"e_1_3_2_1_23_1","unstructured":"Lensa Image Editor. [n. d.]. In https:\/\/prisma-ai.com\/lensa."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01268"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1111\/j.1460-2466.2007.00354.x"},{"key":"e_1_3_2_1_26_1","volume-title":"Objectification theory: Toward understanding women\u2019s lived experiences and mental health risks. Psychology of women quarterly 21, 2","author":"Fredrickson Barbara L","year":"1997","unstructured":"Barbara L Fredrickson and Tomi-Ann Roberts. 1997. Objectification theory: Toward understanding women\u2019s lived experiences and mental health risks. Psychology of women quarterly 21, 2 (1997), 173\u2013206."},{"key":"e_1_3_2_1_27_1","volume-title":"The happiness effect: How social media is driving a generation to appear perfect at any cost","author":"Freitas Donna","unstructured":"Donna Freitas. 2017. The happiness effect: How social media is driving a generation to appear perfect at any cost. Oxford University Press."},{"key":"e_1_3_2_1_28_1","volume-title":"Devise: A deep visual-semantic embedding model.","author":"Frome Andrea","year":"2013","unstructured":"Andrea Frome, Greg Corrado, Jonathon Shlens, Samy Bengio, Jeffrey Dean, Marc\u2019Aurelio Ranzato, and Tomas Mikolov. 2013. Devise: A deep visual-semantic embedding model. (2013)."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3458723"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1002\/ejsp.1890"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.23915\/distill.00030"},{"key":"e_1_3_2_1_32_1","volume-title":"Open-vocabulary Object Detection via Vision and Language Knowledge Distillation. arXiv preprint arXiv:2104.13921 2","author":"Gu Xiuye","year":"2021","unstructured":"Xiuye Gu, Tsung-Yi Lin, Weicheng Kuo, and Yin Cui. 2021. Open-vocabulary Object Detection via Vision and Language Knowledge Distillation. arXiv preprint arXiv:2104.13921 2 (2021)."},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3461702.3462536"},{"key":"e_1_3_2_1_34_1","volume-title":"Ethics of Data and Analytics","author":"Harwell Drew","unstructured":"Drew Harwell. 2019. A face-scanning algorithm increasingly decides whether you deserve the job. In Ethics of Data and Analytics. Auerbach Publications, 206\u2013211."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jesp.2010.12.020"},{"key":"e_1_3_2_1_37_1","unstructured":"Melissa Heikkil\u00e4a. 2022. The viral AI avatar app Lensa undressed me\u2014without my consent. The viral AI avatar app Lensa undressed me\u2014without my consent"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.3301573"},{"key":"e_1_3_2_1_39_1","volume-title":"Women rising: The unseen barriers. Harvard business review 91, 9","author":"Ibarra Herminia","year":"2013","unstructured":"Herminia Ibarra, Robin Ely, and Deborah Kolb. 2013. Women rising: The unseen barriers. Harvard business review 91, 9 (2013), 60\u201366."},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","unstructured":"Gabriel Ilharco Mitchell Wortsman Ross Wightman Cade Gordon Nicholas Carlini Rohan Taori Achal Dave Vaishaal Shankar Hongseok Namkoong John Miller Hannaneh Hajishirzi Ali Farhadi and Ludwig Schmidt. 2021. OpenCLIP. https:\/\/doi.org\/10.5281\/zenodo.5143773 If you use this software please cite it as below..","DOI":"10.5281\/zenodo.5143773"},{"key":"e_1_3_2_1_41_1","volume-title":"Scaling Up Visual and Vision-Language Representation Learning With Noisy Text Supervision. arXiv e-prints","author":"Jia Chao","year":"2021","unstructured":"Chao Jia, Yinfei Yang, Ye Xia, Yi-Ting Chen, Zarana Parekh, Hieu Pham, Quoc V Le, Yunhsuan Sung, Zhen Li, and Tom Duerig. 2021. Scaling Up Visual and Vision-Language Representation Learning With Noisy Text Supervision. arXiv e-prints (2021), arXiv\u20132102."},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00453"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3461702.3462609"},{"key":"e_1_3_2_1_44_1","unstructured":"Gant Laborde. [n. d.]. Deep NN for NSFW Detection. https:\/\/github.com\/GantMan\/nsfw_model"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.703"},{"key":"e_1_3_2_1_46_1","volume-title":"Proceedings of the IEEE International Conference on Computer Vision. 4183\u20134192","author":"Li Ang","unstructured":"Ang Li, Allan Jabri, Armand Joulin, and Laurens van der Maaten. 2017. Learning visual n-grams from web data. In Proceedings of the IEEE International Conference on Computer Vision. 4183\u20134192."},{"key":"e_1_3_2_1_47_1","volume-title":"BLIP: Bootstrapping Language-Image Pre-training for Unified Vision-Language Understanding and Generation. arXiv preprint arXiv:2201.12086","author":"Li Junnan","year":"2022","unstructured":"Junnan Li, Dongxu Li, Caiming Xiong, and Steven Hoi. 2022. BLIP: Bootstrapping Language-Image Pre-training for Unified Vision-Language Understanding and Generation. arXiv preprint arXiv:2201.12086 (2022)."},{"key":"e_1_3_2_1_48_1","volume-title":"Incorporating priors with feature attribution on text classification. arXiv preprint arXiv:1906.08286","author":"Liu Frederick","year":"2019","unstructured":"Frederick Liu and Besim Avci. 2019. Incorporating priors with feature attribution on text classification. arXiv preprint arXiv:1906.08286 (2019)."},{"key":"e_1_3_2_1_49_1","volume-title":"An implicit gender sex-science association in the general population and STEM faculty. The Journal of General Psychology","author":"Marini Maddalena","year":"2020","unstructured":"Maddalena Marini and Mahzarin R Banaji. 2020. An implicit gender sex-science association in the general population and STEM faculty. The Journal of General Psychology (2020), 1\u201328."},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1063"},{"key":"e_1_3_2_1_51_1","unstructured":"Merriam-Webster. [n. d.]. In https:\/\/www.merriam-webster.com\/dictionary\/."},{"key":"e_1_3_2_1_52_1","volume-title":"Clipcap: Clip prefix for image captioning. arXiv preprint arXiv:2111.09734","author":"Mokady Ron","year":"2021","unstructured":"Ron Mokady, Amir Hertz, and Amit H Bermano. 2021. Clipcap: Clip prefix for image captioning. arXiv preprint arXiv:2111.09734 (2021)."},{"key":"e_1_3_2_1_53_1","volume-title":"When a Stereotype Dumbfounds: Probing the Nature of the Surgeon= Male Belief. Current Research in Ecological and Social Psychology","author":"Morehouse Kirsten N","year":"2022","unstructured":"Kirsten N Morehouse, Benedek Kurdi, Ece Hakim, and Mahzarin R Banaji. 2022. When a Stereotype Dumbfounds: Probing the Nature of the Surgeon= Male Belief. Current Research in Ecological and Social Psychology (2022), 100044."},{"key":"e_1_3_2_1_54_1","volume-title":"SLIP: Self-supervision meets Language-Image Pre-training. arXiv preprint arXiv:2112.12750","author":"Mu Norman","year":"2021","unstructured":"Norman Mu, Alexander Kirillov, David Wagner, and Saining Xie. 2021. SLIP: Self-supervision meets Language-Image Pre-training. arXiv preprint arXiv:2112.12750 (2021)."},{"key":"e_1_3_2_1_55_1","volume-title":"Stereoset: Measuring stereotypical bias in pretrained language models. arXiv preprint arXiv:2004.09456","author":"Nadeem Moin","year":"2020","unstructured":"Moin Nadeem, Anna Bethke, and Siva Reddy. 2020. Stereoset: Measuring stereotypical bias in pretrained language models. arXiv preprint arXiv:2004.09456 (2020)."},{"key":"e_1_3_2_1_56_1","volume-title":"Glide: Towards photorealistic image generation and editing with text-guided diffusion models. arXiv preprint arXiv:2112.10741","author":"Nichol Alex","year":"2021","unstructured":"Alex Nichol, Prafulla Dhariwal, Aditya Ramesh, Pranav Shyam, Pamela Mishkin, Bob McGrew, Ilya Sutskever, and Mark Chen. 2021. Glide: Towards photorealistic image generation and editing with text-guided diffusion models. arXiv preprint arXiv:2112.10741 (2021)."},{"key":"e_1_3_2_1_57_1","volume-title":"Understanding the Representation and Representativeness of Age in AI Data Sets. arXiv preprint arXiv:2103.09058","author":"Park Joon Sung","year":"2021","unstructured":"Joon Sung Park, Michael S Bernstein, Robin N Brewer, Ece Kamar, and Meredith Ringel Morris. 2021. Understanding the Representation and Representativeness of Age in AI Data Sets. arXiv preprint arXiv:2103.09058 (2021)."},{"key":"e_1_3_2_1_58_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patter.2021.100336"},{"key":"e_1_3_2_1_59_1","volume-title":"Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, 2021. Learning transferable visual models from natural language supervision. arXiv preprint arXiv:2103.00020 (2021)."},{"key":"e_1_3_2_1_60_1","volume-title":"Language models are unsupervised multitask learners. OpenAI blog 1, 8","author":"Radford Alec","year":"2019","unstructured":"Alec Radford, Jeffrey Wu, Rewon Child, David Luan, Dario Amodei, Ilya Sutskever, 2019. Language models are unsupervised multitask learners. OpenAI blog 1, 8 (2019), 9."},{"key":"e_1_3_2_1_61_1","volume-title":"Hierarchical Text-Conditional Image Generation with CLIP Latents. arXiv preprint arXiv:2204.06125","author":"Ramesh Aditya","year":"2022","unstructured":"Aditya Ramesh, Prafulla Dhariwal, Alex Nichol, Casey Chu, and Mark Chen. 2022. Hierarchical Text-Conditional Image Generation with CLIP Latents. arXiv preprint arXiv:2204.06125 (2022)."},{"key":"e_1_3_2_1_62_1","volume-title":"Zero-shot text-to-image generation. arXiv preprint arXiv:2102.12092","author":"Ramesh Aditya","year":"2021","unstructured":"Aditya Ramesh, Mikhail Pavlov, Gabriel Goh, Scott Gray, Chelsea Voss, Alec Radford, Mark Chen, and Ilya Sutskever. 2021. Zero-shot text-to-image generation. arXiv preprint arXiv:2102.12092 (2021)."},{"key":"e_1_3_2_1_63_1","volume-title":"AAS\/Division for Planetary Sciences Meeting Abstracts# 47","volume":"47","author":"Richey Christina","year":"2015","unstructured":"Christina Richey. 2015. The CSWA survey on workplace climate and anti-harassment policies. In AAS\/Division for Planetary Sciences Meeting Abstracts# 47, Vol. 47. 406\u201301."},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01042"},{"key":"e_1_3_2_1_65_1","volume-title":"The Sexual OBjectification and EMotion database: A free stimulus set and norming data of sexually objectified and non-objectified female targets expressing multiple emotions. Behavior Research Methods","author":"Ruzzante Daniela","year":"2021","unstructured":"Daniela Ruzzante, Bianca Monachesi, Noemi Orabona, and Jeroen Vaes. 2021. The Sexual OBjectification and EMotion database: A free stimulus set and norming data of sexually objectified and non-objectified female targets expressing multiple emotions. Behavior Research Methods (2021), 1\u201315."},{"key":"e_1_3_2_1_66_1","volume-title":"Large-scale classification of fine-art paintings: Learning the right metric on the right feature. arXiv preprint arXiv:1505.00855","author":"Saleh Babak","year":"2015","unstructured":"Babak Saleh and Ahmed Elgammal. 2015. Large-scale classification of fine-art paintings: Learning the right metric on the right feature. arXiv preprint arXiv:1505.00855 (2015)."},{"key":"e_1_3_2_1_67_1","volume-title":"Laion-400m: Open dataset of clip-filtered 400 million image-text pairs. arXiv preprint arXiv:2111.02114","author":"Schuhmann Christoph","year":"2021","unstructured":"Christoph Schuhmann, Richard Vencu, Romain Beaumont, Robert Kaczmarczyk, Clayton Mullis, Aarush Katta, Theo Coombes, Jenia Jitsev, and Aran Komatsuzaki. 2021. Laion-400m: Open dataset of clip-filtered 400 million image-text pairs. arXiv preprint arXiv:2111.02114 (2021)."},{"key":"e_1_3_2_1_68_1","volume-title":"Grad-CAM: Why did you say that?arXiv preprint arXiv:1611.07450","author":"Selvaraju Ramprasaath R","year":"2016","unstructured":"Ramprasaath R Selvaraju, Abhishek Das, Ramakrishna Vedantam, Michael Cogswell, Devi Parikh, and Dhruv Batra. 2016. Grad-CAM: Why did you say that?arXiv preprint arXiv:1611.07450 (2016)."},{"key":"e_1_3_2_1_69_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1238"},{"key":"e_1_3_2_1_70_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1339"},{"key":"e_1_3_2_1_71_1","volume-title":"Grading video interviews with fairness considerations. arXiv preprint arXiv:2007.05461","author":"Singhania Abhishek","year":"2020","unstructured":"Abhishek Singhania, Abhishek Unnam, and Varun Aggarwal. 2020. Grading video interviews with fairness considerations. arXiv preprint arXiv:2007.05461 (2020)."},{"key":"e_1_3_2_1_72_1","unstructured":"Richard Socher Milind Ganjoo Christopher D Manning and Andrew Ng. 2013. Zero-Shot Learning Through Cross-Modal Transfer. In Advances in Neural Information Processing Systems. 935\u2013943."},{"key":"e_1_3_2_1_73_1","doi-asserted-by":"publisher","DOI":"10.1145\/3442188.3445932"},{"key":"e_1_3_2_1_74_1","doi-asserted-by":"publisher","DOI":"10.1111\/0022-4537.00200"},{"key":"e_1_3_2_1_75_1","volume-title":"Contrastive Representation Distillation. In International Conference on Learning Representations.","author":"Tian Yonglong","year":"2019","unstructured":"Yonglong Tian, Dilip Krishnan, and Phillip Isola. 2019. Contrastive Representation Distillation. In International Conference on Learning Representations."},{"key":"e_1_3_2_1_76_1","doi-asserted-by":"publisher","DOI":"10.1093\/jpepsy\/jsv021"},{"key":"e_1_3_2_1_77_1","unstructured":"Saurabh Tiwary. 2021. Turing Bletchley: A Universal Image Language Representation model by Microsoft. https:\/\/www.microsoft.com\/en-us\/research\/blog\/turing-bletchley-a-universal-image-language-representation-model-by-microsoft\/"},{"key":"e_1_3_2_1_78_1","unstructured":"the-eye.eu. [n. d.]. Antarctic Captioner training corpus. https:\/\/the-eye.eu\/public\/AI\/models\/antarctic-captions\/postcache.txt."},{"key":"e_1_3_2_1_79_1","doi-asserted-by":"publisher","DOI":"10.1080\/23268743.2020.1741434"},{"key":"e_1_3_2_1_80_1","volume-title":"Are Gender-Neutral Queries Really Gender-Neutral? Mitigating Gender Bias in Image Search. arXiv preprint arXiv:2109.05433","author":"Wang Jialu","year":"2021","unstructured":"Jialu Wang, Yang Liu, and Xin Eric Wang. 2021. Are Gender-Neutral Queries Really Gender-Neutral? Mitigating Gender Bias in Image Search. arXiv preprint arXiv:2109.05433 (2021)."},{"key":"e_1_3_2_1_81_1","doi-asserted-by":"publisher","DOI":"10.1080\/00224499.2016.1142496"},{"key":"e_1_3_2_1_82_1","doi-asserted-by":"publisher","DOI":"10.1145\/3514094.3534136"},{"key":"e_1_3_2_1_83_1","doi-asserted-by":"publisher","DOI":"10.1145\/3278721.3278779"},{"key":"e_1_3_2_1_84_1","volume-title":"Contrastive learning of medical visual representations from paired images and text. arXiv preprint arXiv:2010.00747","author":"Zhang Yuhao","year":"2020","unstructured":"Yuhao Zhang, Hang Jiang, Yasuhide Miura, Christopher D Manning, and Curtis P Langlotz. 2020. Contrastive learning of medical visual representations from paired images and text. arXiv preprint arXiv:2010.00747 (2020)."}],"event":{"name":"FAccT '23: the 2023 ACM Conference on Fairness, Accountability, and Transparency","location":"Chicago IL USA","acronym":"FAccT '23"},"container-title":["2023 ACM Conference on Fairness Accountability and Transparency"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3593013.3594072","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3593013.3594072","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3593013.3594072","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:37:18Z","timestamp":1750178238000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3593013.3594072"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,12]]},"references-count":84,"alternative-id":["10.1145\/3593013.3594072","10.1145\/3593013"],"URL":"https:\/\/doi.org\/10.1145\/3593013.3594072","relation":{},"subject":[],"published":{"date-parts":[[2023,6,12]]},"assertion":[{"value":"2023-06-12","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}