{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T23:12:30Z","timestamp":1776121950251,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":80,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,6,20]],"date-time":"2022-06-20T00:00:00Z","timestamp":1655683200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["2039656"],"award-info":[{"award-number":["2039656"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100006112","name":"Microsoft Research","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006112","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100004318","name":"Microsoft","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100004318","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,6,21]]},"DOI":"10.1145\/3531146.3533099","type":"proceedings-article","created":{"date-parts":[[2022,6,20]],"date-time":"2022-06-20T14:27:10Z","timestamp":1655735230000},"page":"324-335","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":28,"title":["Measuring Representational Harms in Image Captioning"],"prefix":"10.1145","author":[{"given":"Angelina","family":"Wang","sequence":"first","affiliation":[{"name":"Princeton University, USA"}]},{"given":"Solon","family":"Barocas","sequence":"additional","affiliation":[{"name":"Microsoft Research, USA"}]},{"given":"Kristen","family":"Laird","sequence":"additional","affiliation":[{"name":"Microsoft, USA"}]},{"given":"Hanna","family":"Wallach","sequence":"additional","affiliation":[{"name":"Microsoft Research, USA"}]}],"member":"320","published-online":{"date-parts":[[2022,6,20]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611975673.90"},{"key":"e_1_3_2_1_2_1","volume-title":"Workshop on Bias Estimation in Face Analytics at ECCV 2018","author":"Alvi Mohsan","year":"2018","unstructured":"Mohsan Alvi, Andrew Zisserman, and Christoffer Nellaker. 2018. Turning a Blind Eye: Explicit Removal of Biases and Variation from Deep Neural Network Embeddings. Workshop on Bias Estimation in Face Analytics at ECCV 2018 (2018)."},{"key":"e_1_3_2_1_3_1","volume-title":"SPICE: Semantic Propositional Image Caption Evaluation. European Conference on Computer Vision (ECCV)","author":"Anderson Peter","year":"2016","unstructured":"Peter Anderson, Basura Fernando, Mark Johnson, and Stephen Gould. 2016. SPICE: Semantic Propositional Image Caption Evaluation. European Conference on Computer Vision (ECCV) (2016)."},{"key":"e_1_3_2_1_4_1","volume-title":"Bottom-Up and Top-Down Attention for Image Captioning and Visual Question Answering. IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","author":"Anderson Peter","year":"2018","unstructured":"Peter Anderson, Xiaodong He, Chris Buehler, Damien Teney, Mark Johnson, Stephen Gould, and Lei Zhang. 2018. Bottom-Up and Top-Down Attention for Image Captioning and Visual Question Answering. IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2018)."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00583"},{"key":"e_1_3_2_1_6_1","volume-title":"Muhammad Farooq\u00a0Khan Niazi, and Shafiq Hussain","author":"Ayesha Hareem","year":"2021","unstructured":"Hareem Ayesha, Sajid Iqbal, Mehreen Tariq, Muhammad Abrar, Muhammad Sanaullah, Ishaq Abbas, Amjad Rehman, Muhammad Farooq\u00a0Khan Niazi, and Shafiq Hussain. 2021. Automatic medical image interpretation: State of the art and future directions. Pattern Recognition (2021)."},{"key":"e_1_3_2_1_7_1","volume-title":"Proceedings of the acl workshop on intrinsic and extrinsic evaluation measures for machine translation and\/or summarization, 65\u201372","author":"Banerjee Satanjeev","year":"2005","unstructured":"Satanjeev Banerjee and Alon Lavie. 2005. METEOR: An automatic metric for MT evaluation with improved correlation with human judgments. Proceedings of the acl workshop on intrinsic and extrinsic evaluation measures for machine translation and\/or summarization, 65\u201372."},{"key":"e_1_3_2_1_8_1","volume-title":"Stereotype. ACM Conference on Computer-Supported Cooperative Work And Social Computing (CSCW)","author":"Barlas Pinar","year":"2020","unstructured":"Pinar Barlas, Kyriakos Kyriakou, Olivia Guest, Styliani Kleanthous, and Jahna Otterbacher. 2020. To \u201cSee\u201d is to Stereotype. ACM Conference on Computer-Supported Cooperative Work And Social Computing (CSCW) (2020)."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1609\/icwsm.v13i01.3255"},{"key":"e_1_3_2_1_10_1","volume-title":"Neither: The Dehumanization Potential of Automated Image Tagging. AAAI\/ACM Conference on Artificial Intelligence, Ethics, and Society (AIES)","author":"Barlas Pinar","year":"2021","unstructured":"Pinar Barlas, Kyriakos Kyriakou, Styliani Kleanthous, and Jahna Otterbacher. 2021. Person, Human, Neither: The Dehumanization Potential of Automated Image Tagging. AAAI\/ACM Conference on Artificial Intelligence, Ethics, and Society (AIES) (2021)."},{"key":"e_1_3_2_1_11_1","volume-title":"Proceedings of SIGCIS","author":"Barocas Solon","year":"2017","unstructured":"Solon Barocas, Kate Crawford, Aaron Shapiro, and Hanna Wallach. 2017. The Problem With Bias: Allocative Versus Representational Harms in Machine Learning. In Proceedings of SIGCIS. Philadelphia, PA."},{"key":"e_1_3_2_1_12_1","volume-title":"Experiencing Dehumanization: Cognitive and Emotional Effects of Everyday Dehumanization. Basic and Applied Social Psychology(2011).","author":"Bastian Brock","year":"2011","unstructured":"Brock Bastian and Nick Haslam. 2011. Experiencing Dehumanization: Cognitive and Emotional Effects of Everyday Dehumanization. Basic and Applied Social Psychology(2011)."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3442188.3445922"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248100"},{"key":"e_1_3_2_1_15_1","volume":"201","author":"Camiel\u00a0","unstructured":"Camiel\u00a0J. Beukeboom. 2014. Mechanisms of linguistic bias: How words reflect and maintain stereotypic expectancies. Social cognition and communication(2014).","journal-title":"J. Beukeboom."},{"key":"e_1_3_2_1_16_1","volume-title":"Exposing and Correcting the Gender Bias in Image Captioning Datasets and Models. arXiv:1912.00578","author":"Bhargava Shruti","year":"2019","unstructured":"Shruti Bhargava and David Forsyth. 2019. Exposing and Correcting the Gender Bias in Image Captioning Datasets and Models. arXiv:1912.00578 (2019)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.5555\/1717171"},{"key":"e_1_3_2_1_18_1","volume-title":"Multimodal datasets: misogyny, pornography, and malignant stereotypes. arXiv:2110.01963","author":"Birhane Abeba","year":"2021","unstructured":"Abeba Birhane, Vinay\u00a0Uday Prabhu, and Emmanuel Kahembwe. 2021. Multimodal datasets: misogyny, pornography, and malignant stereotypes. arXiv:2110.01963 (2021)."},{"key":"e_1_3_2_1_19_1","volume-title":"NLPAssociation for Computational Linguistics (ACL)","author":"Blodgett Su\u00a0Lin","year":"2020","unstructured":"Su\u00a0Lin Blodgett, Solon Barocas, Hal\u00a0Daume III, and Hanna Wallach. 2020. Language (Technology) is Power: A Critical Survey of \u201cBias\u201d in NLP. Association for Computational Linguistics (ACL) (2020)."},{"key":"e_1_3_2_1_20_1","volume-title":"Gender Shades: Intersectional Accuracy Disparities in Commercial Gender Classification. Conference on Fairness, Accountability and Transparency (FAccT)","author":"Buolamwini Joy","year":"2018","unstructured":"Joy Buolamwini and Timnit Gebru. 2018. Gender Shades: Intersectional Accuracy Disparities in Commercial Gender Classification. Conference on Fairness, Accountability and Transparency (FAccT) (2018)."},{"key":"e_1_3_2_1_21_1","unstructured":"Xinlei Chen Hao Fang Tsung-Yi Lin Ramakrishna Vedantam Saurabh Gupta Piotr Doll\u00e1r and C.\u00a0Lawrence Zitnick. 2015. Microsoft coco captions: Data collection and evaluation server. arXiv preprint arXiv:1504.00325(2015)."},{"key":"e_1_3_2_1_22_1","volume-title":"Ethnicity and Race: Making Identities in a Changing World","author":"Cornell Stephen","year":"2006","unstructured":"Stephen Cornell and Douglas Hartmann. 2006. Ethnicity and Race: Making Identities in a Changing World. SAGE Publications (2006)."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00608"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.323"},{"key":"e_1_3_2_1_25_1","volume-title":"Case: Hithon v. Tyson Foods","author":"NAACP\u00a0Legal Defense and Inc. Educational\u00a0Fund.","year":"2010","unstructured":"NAACP\u00a0Legal Defense and Inc. Educational\u00a0Fund. 2010. Case: Hithon v. Tyson Foods, Inc.(2010)."},{"key":"e_1_3_2_1_26_1","unstructured":"Terrance DeVries Ishan Misra Changhan Wang and Laurens van\u00a0der Maaten. 2019. Does Object Recognition Work for Everyone?Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)(2019)."},{"key":"e_1_3_2_1_27_1","volume-title":"Documenting Large Webtext Corpora: A Case Study on the Colossal Clean Crawled Corpus. Conference on Empirical Methods in Natural Language Processing (EMNLP)","author":"Dodge Jesse","year":"2021","unstructured":"Jesse Dodge, Maarten Sap, Ana Marasovi\u0107, William Agnew, Gabriel Ilharco, Dirk Groeneveld, Margaret Mitchell, and Matt Gardner. 2021. Documenting Large Webtext Corpora: A Case Study on the Colossal Clean Crawled Corpus. Conference on Empirical Methods in Natural Language Processing (EMNLP) (2021)."},{"key":"e_1_3_2_1_28_1","volume-title":"Google Photos labeled black people \u2019gorillas\u2019. USA Today","author":"Guynn Jessica","year":"2015","unstructured":"Jessica Guynn. 2015. Google Photos labeled black people \u2019gorillas\u2019. USA Today (2015)."},{"key":"e_1_3_2_1_29_1","unstructured":"Xiaotian Han Jianwei Yang Houdong Hu Lei Zhang Jianfeng Gao and Pengchuan Zhang. 2021. Image Scene Graph Generation (SGG) Benchmark. arxiv:2107.12604\u00a0[cs.CV]"},{"key":"e_1_3_2_1_30_1","volume-title":"Dehumanization: A new perspective. Social and Personality Psychology Compass(2007).","author":"Haslam Nick","year":"2007","unstructured":"Nick Haslam, Stephen Loughnan, Catherine Reynolds, and Samuel Wilson. 2007. Dehumanization: A new perspective. Social and Personality Psychology Compass(2007)."},{"key":"e_1_3_2_1_31_1","volume-title":"The art of Alt Text. UX Collective","author":"Heinrich Alexa","year":"2020","unstructured":"Alexa Heinrich. 2020. The art of Alt Text. UX Collective (2020)."},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01219-9_47"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","unstructured":"Matthew Honnibal Ines Montani Sofie Van\u00a0Landeghem and Adriane Boyd. 2020. spaCy: Industrial-strength Natural Language Processing in Python. https:\/\/doi.org\/10.5281\/zenodo.1212303","DOI":"10.5281\/zenodo.1212303"},{"key":"e_1_3_2_1_34_1","unstructured":"Sethurathienam Iyer Shubham Chaturvedi and Tirtharaj Dash. 2018. Image Captioning-Based Image Search Engine: An Alternative to Retrieval by Metadata. Soft Computing for Problem Solving(2018)."},{"key":"e_1_3_2_1_35_1","volume-title":"Measurement and Fairness. Conference on Fairness, Accountability and Transparency (FAccT)","author":"Z.","year":"2021","unstructured":"Abigail\u00a0Z. Jacobs and Hanna Wallach. 2021. Measurement and Fairness. Conference on Fairness, Accountability and Transparency (FAccT) (2021)."},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1145\/3351095.3372829"},{"key":"e_1_3_2_1_37_1","volume-title":"Representational Harms in Image Tagging. Beyond Fair Computer Vision Workshop at CVPR 2021","author":"Katzman Jared","year":"2021","unstructured":"Jared Katzman, Solon Barocas, Su\u00a0Lin Blodgett, Kristen Laird, Morgan\u00a0Klaus Scheuerman, and Hanna Wallach. 2021. Representational Harms in Image Tagging. Beyond Fair Computer Vision Workshop at CVPR 2021 (2021). https:\/\/drive.google.com\/file\/d\/1oJp8CqNpYEsOlO8cwv4cTnHGbOjWxEZ-\/view"},{"key":"e_1_3_2_1_38_1","volume-title":"Visual Genome: Connecting Language and Vision Using Crowdsourced Dense Image Annotations. https:\/\/arxiv.org\/abs\/1602.07332","author":"Krishna Ranjay","year":"2016","unstructured":"Ranjay Krishna, Yuke Zhu, Oliver Groth, Justin Johnson, Kenji Hata, Joshua Kravitz, Stephanie Chen, Yannis Kalantidis, Li-Jia Li, David\u00a0A Shamma, Michael Bernstein, and Li Fei-Fei. 2016. Visual Genome: Connecting Language and Vision Using Crowdsourced Dense Image Annotations. https:\/\/arxiv.org\/abs\/1602.07332"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1609\/icwsm.v13i01.3232"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.7551\/mitpress\/7287.003.0018"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"crossref","unstructured":"Harriet\u00a0E. Lerner. 1976. Girls ladies or women? The unconscious dynamics of language choice. Comprehensive Psychiatry(1976).","DOI":"10.1016\/0010-440X(76)90003-1"},{"key":"e_1_3_2_1_42_1","volume-title":"Oscar: Object-Semantics Aligned Pre-training for Vision-Language Tasks. European Conference on Computer Vision (ECCV)","author":"Li Xiujun","year":"2020","unstructured":"Xiujun Li, Xi Yin, Chunyuan Li, Pengchuan Zhang, Xiaowei Hu, Lei Zhang, Lijuan Wang, Houdong Hu, Li Dong, Furu Wei, Yejin Choi, and Jianfeng Gao. 2020. Oscar: Object-Semantics Aligned Pre-training for Vision-Language Tasks. European Conference on Computer Vision (ECCV) (2020)."},{"key":"e_1_3_2_1_43_1","volume-title":"ROUGE: A package for automatic evaluation of summaries. Text summarization branches out(2004), 74\u201381.","author":"Lin Chin-Yew","year":"2004","unstructured":"Chin-Yew Lin. 2004. ROUGE: A package for automatic evaluation of summaries. Text summarization branches out(2004), 74\u201381."},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"e_1_3_2_1_45_1","volume-title":"Attention Correctness in Neural Image Captioning. AAAI Conference on Artificial Intelligence (AAAI-17)","author":"Liu Chenxi","year":"2017","unstructured":"Chenxi Liu, Junhua Mao, Fei Sha, and Alan Yuille. 2017. Attention Correctness in Neural Image Captioning. AAAI Conference on Artificial Intelligence (AAAI-17) (2017)."},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.345"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00728"},{"key":"e_1_3_2_1_48_1","volume-title":"Hate speech detection: Challenges and solutions. PLOS ONE","author":"MacAvaney Sean","year":"2019","unstructured":"Sean MacAvaney, Hao-Ren Yao, Eugene Yang, Katina Russell, Nazli Goharian, and Ophir Frieder. 2019. Hate speech detection: Challenges and solutions. PLOS ONE (2019)."},{"key":"e_1_3_2_1_49_1","volume-title":"Designing Tools for High-Quality Alt Text Authoring. International ACM SIGACCESS Conference on Computers and Accessibility (ASSETS)","author":"Mack Kelly","year":"2021","unstructured":"Kelly Mack, Edward Cutrell, Bongshin Lee, and Meredith\u00a0Ringel Morris. 2021. Designing Tools for High-Quality Alt Text Authoring. International ACM SIGACCESS Conference on Computers and Accessibility (ASSETS) (2021)."},{"key":"e_1_3_2_1_50_1","volume-title":"Understanding Blind People\u2019s Experiences with Computer-Generated Captions of Social Media Images. ACM Conference on Human Factors in Computing Systems (CHI)","author":"MacLeod Haley","year":"2017","unstructured":"Haley MacLeod, Cynthia\u00a0L. Bennett, Meredith\u00a0Ringel Morris, and Edward Cutrell. 2017. Understanding Blind People\u2019s Experiences with Computer-Generated Captions of Social Media Images. ACM Conference on Human Factors in Computing Systems (CHI) (2017)."},{"key":"e_1_3_2_1_51_1","volume-title":"Group (Un)Fairness in Natural Language Image Descriptions. The Seventh AAAI Conference on Human Computation and Crowdsourcing (HCOMP-19)","author":"Otterbacher Jahna","year":"2019","unstructured":"Jahna Otterbacher, P\u0131nar Barlas, Styliani Kleanthous, and Kyriakos Kyriakou. 2019. How Do We Talk about Other People? Group (Un)Fairness in Natural Language Image Descriptions. The Seventh AAAI Conference on Human Computation and Crowdsourcing (HCOMP-19) (2019)."},{"key":"e_1_3_2_1_52_1","volume-title":"BLEU: a method for automatic evaluation of machine translation","author":"Papineni Kishore","year":"2002","unstructured":"Kishore Papineni, Salim Roukos, Todd Ward, and Wei-Jing Zhu. 2002. BLEU: a method for automatic evaluation of machine translation. Association for Computational Linguistics (ACL) (2002)."},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.5244\/C.29.52"},{"key":"e_1_3_2_1_54_1","doi-asserted-by":"publisher","DOI":"10.1609\/hcomp.v5i1.13301"},{"key":"e_1_3_2_1_55_1","volume-title":"The Risk of Racial Bias in Hate Speech Detection. Annual Meeting of the Association for Computational Linguistics","author":"Sap Maarten","year":"2019","unstructured":"Maarten Sap, Dallas Card, Saadia Gabriel, Yejin Choi, and Noah\u00a0A. Smith. 2019. The Risk of Racial Bias in Hate Speech Detection. Annual Meeting of the Association for Computational Linguistics (2019)."},{"key":"e_1_3_2_1_56_1","volume-title":"Revisiting Gendered Web Forms: An Evaluation of Gender Inputs with (Non-)Binary People. ACM Conference on Human Factors in Computing Systems (CHI)","author":"Scheuerman Morgan\u00a0Klaus","year":"2021","unstructured":"Morgan\u00a0Klaus Scheuerman, Aaron Jiang, Katta Spiel, and Jed\u00a0R. Brubaker. 2021. Revisiting Gendered Web Forms: An Evaluation of Gender Inputs with (Non-)Binary People. ACM Conference on Human Factors in Computing Systems (CHI) (2021)."},{"key":"e_1_3_2_1_57_1","volume-title":"Identity: Constructing Race and Gender in Image Databases for Facial Analysis. ACM Conference on Human Factors in Computing Systems (CHI)","author":"Scheuerman Morgan\u00a0Klaus","year":"2020","unstructured":"Morgan\u00a0Klaus Scheuerman, Kandrea Wade, Caitlin Lustig, and Jed\u00a0R. Brubaker. 2020. How We\u2019ve Taught Algorithms to See Identity: Constructing Race and Gender in Image Databases for Facial Analysis. ACM Conference on Human Factors in Computing Systems (CHI) (2020)."},{"key":"e_1_3_2_1_58_1","unstructured":"Christoph Schuhmann. 2021. LAION-400-Million Open Dataset. (2021). https:\/\/laion.ai\/laion-400-open-dataset\/"},{"key":"e_1_3_2_1_59_1","volume-title":"Semin and Klaus Fiedler","author":"R.","year":"1988","unstructured":"Gun\u00a0R. Semin and Klaus Fiedler. 1988. The cognitive functions of linguistic categories in describing persons: Social cognition and language.Journal of Personality and Social Psychology (1988)."},{"key":"e_1_3_2_1_60_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1238"},{"key":"e_1_3_2_1_61_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.445"},{"key":"e_1_3_2_1_62_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-short.36"},{"key":"e_1_3_2_1_63_1","volume-title":"What People with Vision Impairments Want in Image Descriptions. ACM Conference on Human Factors in Computing Systems (CHI)","author":"Stangl Abigale","year":"2020","unstructured":"Abigale Stangl, Meredith\u00a0Ringel Morris, and Danna Gurari. 2020. \u201cPerson, Shoes, Tree. Is the Person Naked?\u201d What People with Vision Impairments Want in Image Descriptions. ACM Conference on Human Factors in Computing Systems (CHI) (2020)."},{"key":"e_1_3_2_1_64_1","doi-asserted-by":"publisher","DOI":"10.1145\/3441852.3471233"},{"key":"e_1_3_2_1_65_1","volume-title":"Conference on Neural Information Processing Systems (NeurIPS)","author":"Tang Kaihua","year":"2020","unstructured":"Kaihua Tang, Jianqiang Huang, and Hanwang Zhang. 2020. Long-Tailed Classification by Keeping the Good and Removing the Bad Momentum Causal Effect. Conference on Neural Information Processing Systems (NeurIPS) (2020)."},{"key":"e_1_3_2_1_66_1","volume-title":"Mitigating Gender Bias in Captioning Systems. arXiv:2006.08315","author":"Tang Ruixiang","year":"2020","unstructured":"Ruixiang Tang, Mengnan Du, Yuening Li, Zirui Liu, and Xia Hu. 2020. Mitigating Gender Bias in Captioning Systems. arXiv:2006.08315 (2020)."},{"key":"e_1_3_2_1_67_1","unstructured":"Princeton University. 2010. About WordNet. Princeton University(2010)."},{"key":"e_1_3_2_1_68_1","volume-title":"Proceedings of the Workshop on Multimodal Corpora (MMC)","author":"van Miltenburg Emiel","year":"2016","unstructured":"Emiel van Miltenburg. 2016. Stereotyping and Bias in the Flickr30K Dataset. Proceedings of the Workshop on Multimodal Corpora (MMC) (2016)."},{"key":"e_1_3_2_1_69_1","volume-title":"Measuring the Diversity of Automatic Image Descriptions. International Conference on Computational Linguistics","author":"van Miltenburg Emiel","year":"2018","unstructured":"Emiel van Miltenburg, Desmond Elliott, and Piek Vossen. 2018. Measuring the Diversity of Automatic Image Descriptions. International Conference on Computational Linguistics (2018)."},{"key":"e_1_3_2_1_70_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W18-6550"},{"key":"e_1_3_2_1_71_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299087"},{"key":"e_1_3_2_1_72_1","volume-title":"Show and Tell: A Neural Image Caption Generator. IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","author":"Vinyals Oriol","year":"2015","unstructured":"Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. 2015. Show and Tell: A Neural Image Caption Generator. IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2015)."},{"key":"e_1_3_2_1_73_1","volume-title":"REVISE: A Tool for Measuring and Mitigating Bias in Visual Datasets. European Conference on Computer Vision (ECCV)","author":"Wang Angelina","year":"2020","unstructured":"Angelina Wang, Arvind Narayanan, and Olga Russakovsky. 2020. REVISE: A Tool for Measuring and Mitigating Bias in Visual Datasets. European Conference on Computer Vision (ECCV) (2020)."},{"key":"e_1_3_2_1_74_1","volume-title":"Balanced Datasets Are Not Enough: Estimating and Mitigating Gender Bias in Deep Image Representations. International Conference on Computer Vision (ICCV)","author":"Wang Tianlu","year":"2019","unstructured":"Tianlu Wang, Jieyu Zhao, Mark Yatskar, Kai-Wei Chang, and Vicente Ordonez. 2019. Balanced Datasets Are Not Enough: Estimating and Mitigating Gender Bias in Deep Image Representations. International Conference on Computer Vision (ICCV) (2019)."},{"key":"e_1_3_2_1_75_1","volume-title":"Predictive Inequity in Object Detection. arXiv:1902.11097","author":"Wilson Benjamin","year":"2019","unstructured":"Benjamin Wilson, Judy Hoffman, and Jamie Morgenstern. 2019. Predictive Inequity in Object Detection. arXiv:1902.11097 (2019)."},{"key":"e_1_3_2_1_76_1","doi-asserted-by":"publisher","DOI":"10.1145\/2998181.2998364"},{"key":"e_1_3_2_1_77_1","doi-asserted-by":"publisher","DOI":"10.1145\/3351095.3375709"},{"key":"e_1_3_2_1_78_1","volume-title":"Image Captioning with Semantic Attention. IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","author":"You Quanzeng","year":"2016","unstructured":"Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. 2016. Image Captioning with Semantic Attention. IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2016)."},{"key":"e_1_3_2_1_79_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00553"},{"key":"e_1_3_2_1_80_1","volume-title":"Understanding and Evaluating Racial Biases in Image Captioning. International Conference on Computer Vision (ICCV)","author":"Zhao Dora","year":"2021","unstructured":"Dora Zhao, Angelina Wang, and Olga Russakovsky. 2021. Understanding and Evaluating Racial Biases in Image Captioning. International Conference on Computer Vision (ICCV) (2021)."}],"event":{"name":"FAccT '22: 2022 ACM Conference on Fairness, Accountability, and Transparency","location":"Seoul Republic of Korea","acronym":"FAccT '22","sponsor":["ACM Association for Computing Machinery"]},"container-title":["2022 ACM Conference on Fairness Accountability and Transparency"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3531146.3533099","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3531146.3533099","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3531146.3533099","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T19:02:10Z","timestamp":1750186930000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3531146.3533099"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,6,20]]},"references-count":80,"alternative-id":["10.1145\/3531146.3533099","10.1145\/3531146"],"URL":"https:\/\/doi.org\/10.1145\/3531146.3533099","relation":{},"subject":[],"published":{"date-parts":[[2022,6,20]]},"assertion":[{"value":"2022-06-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}