{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,27]],"date-time":"2026-06-27T22:28:00Z","timestamp":1782599280170,"version":"3.54.5"},"publisher-location":"New York, NY, USA","reference-count":20,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,7,21]],"date-time":"2021-07-21T00:00:00Z","timestamp":1626825600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,7,21]]},"DOI":"10.1145\/3461702.3462530","type":"proceedings-article","created":{"date-parts":[[2021,7,31]],"date-time":"2021-07-31T01:21:38Z","timestamp":1627694498000},"page":"24-34","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":23,"title":["Gender Bias and Under-Representation in Natural Language Processing Across Human Languages"],"prefix":"10.1145","author":[{"given":"Yan","family":"Chen","sequence":"first","affiliation":[{"name":"Clarkson University, Potsdam, NY, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Christopher","family":"Mahoney","sequence":"additional","affiliation":[{"name":"Clarkson University, Potsdam, NY, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Isabella","family":"Grasso","sequence":"additional","affiliation":[{"name":"Clarkson University, Potsdam, NY, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Esma","family":"Wali","sequence":"additional","affiliation":[{"name":"Clarkson University, Potsdam , NY, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Abigail","family":"Matthews","sequence":"additional","affiliation":[{"name":"University of Wisconsin, Madison, WI, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Thomas","family":"Middleton","sequence":"additional","affiliation":[{"name":"Clarkson University, Potsdam, NY, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mariama","family":"Njie","sequence":"additional","affiliation":[{"name":"Iona College, New York, NY, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jeanna","family":"Matthews","sequence":"additional","affiliation":[{"name":"Clarkson University, Potsdam, NY, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2021,7,30]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Quantifying Gender Bias in Different Corpora. In Companion Proceedings of the Web Conference 2020","author":"Babaeianjelodar Marzieh","year":"2020","unstructured":"Marzieh Babaeianjelodar , Stephen Lorenz , Josh Gordon , Jeanna Matthews , and Evan Freitag . 2020 . Quantifying Gender Bias in Different Corpora. In Companion Proceedings of the Web Conference 2020 ( Taipei, Taiwan) (WWW '20). Association for Computing Machinery, New York, NY, USA, 752--759. https:\/\/doi.org\/10. 1145\/3366424.3383559 Marzieh Babaeianjelodar, Stephen Lorenz, Josh Gordon, Jeanna Matthews, and Evan Freitag. 2020. Quantifying Gender Bias in Different Corpora. In Companion Proceedings of the Web Conference 2020 (Taipei, Taiwan) (WWW '20). Association for Computing Machinery, New York, NY, USA, 752--759. https:\/\/doi.org\/10. 1145\/3366424.3383559"},{"key":"e_1_3_2_1_2_1","unstructured":"D. Banerjee. 2020. Natural Language Processing (NLP) Simplified: A Step-bystep Guide. https:\/\/datascience.foundation\/sciencewhitepaper\/natural-languageprocessing- nlp-simplified-a-step-by-step-guide.  D. Banerjee. 2020. Natural Language Processing (NLP) Simplified: A Step-bystep Guide. https:\/\/datascience.foundation\/sciencewhitepaper\/natural-languageprocessing- nlp-simplified-a-step-by-step-guide."},{"key":"e_1_3_2_1_3_1","unstructured":"BERT. 2020. BERT Pretrained models on Github. https:\/\/github.com\/googleresearch\/ bert#bert.  BERT. 2020. BERT Pretrained models on Github. https:\/\/github.com\/googleresearch\/ bert#bert."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.5555\/3157382.3157584"},{"key":"e_1_3_2_1_5_1","volume-title":"Proceedings of the 1st Conference on Fairness, Accountability and Transparency","author":"Gebru Buolamwini","unstructured":"J; Buolamwini and T. Gebru . 2018. Gender Shades: Intersectional Accuracy Disparities in Commercial Gender Classification . In Proceedings of the 1st Conference on Fairness, Accountability and Transparency ( New York, USA) (FAccT'18). 77--91. J; Buolamwini and T. Gebru. 2018. Gender Shades: Intersectional Accuracy Disparities in Commercial Gender Classification. In Proceedings of the 1st Conference on Fairness, Accountability and Transparency (New York, USA) (FAccT'18). 77--91."},{"key":"e_1_3_2_1_6_1","volume-title":"BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. arXiv:1810.04805 [cs.CL]","author":"Devlin Jacob","year":"2019","unstructured":"Jacob Devlin , Ming-Wei Chang , Kenton Lee , and Kristina Toutanova . 2019 . BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. arXiv:1810.04805 [cs.CL] Jacob Devlin, Ming-Wei Chang, Kenton Lee, and Kristina Toutanova. 2019. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. arXiv:1810.04805 [cs.CL]"},{"key":"e_1_3_2_1_7_1","volume":"201","author":"M.","unstructured":"M. J. Garbade. 201 8. A Simple Introduction To Natural Language Processing. https:\/\/becominghuman.ai\/a-simple-introduction-to-natural-languageprocessing- ea66a1747b32. M. J. Garbade. 2018. A Simple Introduction To Natural Language Processing. https:\/\/becominghuman.ai\/a-simple-introduction-to-natural-languageprocessing- ea66a1747b32.","journal-title":"J. Garbade."},{"key":"e_1_3_2_1_8_1","unstructured":"D. Karani. 2018. Introduction to Word Embedding and Word2Vec. https:\/\/towardsdatascience.com\/introduction-to-word-embedding-andword2vec- 652d0c2060fa.  D. Karani. 2018. Introduction to Word Embedding and Word2Vec. https:\/\/towardsdatascience.com\/introduction-to-word-embedding-andword2vec- 652d0c2060fa."},{"key":"e_1_3_2_1_9_1","unstructured":"Tomas Mikolov Kai Chen Greg Corrado and Jeffrey Dean. 2013. Efficient Estimation of Word Representations in Vector Space. arXiv:1301.3781 [cs.CL]  Tomas Mikolov Kai Chen Greg Corrado and Jeffrey Dean. 2013. Efficient Estimation of Word Representations in Vector Space. arXiv:1301.3781 [cs.CL]"},{"key":"e_1_3_2_1_10_1","unstructured":"NLTK. 2005. Natural Language Toolkit. http:\/\/www.nltk.org\/.  NLTK. 2005. Natural Language Toolkit. http:\/\/www.nltk.org\/."},{"key":"e_1_3_2_1_11_1","unstructured":"R. Siegel. 2019. Search result not found: China bans Wikipedia in all languages. https:\/\/www.washingtonpost.com\/business\/2019\/05\/15\/china-banswikipedia- all-languages\/.  R. Siegel. 2019. Search result not found: China bans Wikipedia in all languages. https:\/\/www.washingtonpost.com\/business\/2019\/05\/15\/china-banswikipedia- all-languages\/."},{"key":"e_1_3_2_1_12_1","unstructured":"Q. G. Su. 2019. Which Parts of the World Speaks Mandarin Chinese? https: \/\/www.thoughtco.com\/where-is-mandarin-spoken-2278443.  Q. G. Su. 2019. Which Parts of the World Speaks Mandarin Chinese? https: \/\/www.thoughtco.com\/where-is-mandarin-spoken-2278443."},{"key":"e_1_3_2_1_13_1","volume-title":"Participatory ML Workshop,Thirty-seventh International Conference on Machine Learning (ICML 2020)","author":"Wali Esma","year":"2020","unstructured":"Esma Wali , Yan Chen , Christopher Mahoney , Thomas Middleton , Marzieh Babaeianjelodar , Mariama Njie , and Jeanna Neefe Matthews . 2020 . Is Machine Learning Speaking my Language? A Critical Look at the NLP-Pipeline Across 8 Human Languages . In Participatory ML Workshop,Thirty-seventh International Conference on Machine Learning (ICML 2020) , July 17 2020. Esma Wali, Yan Chen, Christopher Mahoney, Thomas Middleton, Marzieh Babaeianjelodar, Mariama Njie, and Jeanna Neefe Matthews. 2020. Is Machine Learning Speaking my Language? A Critical Look at the NLP-Pipeline Across 8 Human Languages. In Participatory ML Workshop,Thirty-seventh International Conference on Machine Learning (ICML 2020), July 17 2020."},{"key":"e_1_3_2_1_14_1","unstructured":"Wikipedia. 2020. German language. https:\/\/en.wikipedia.org\/wiki\/German_ language.  Wikipedia. 2020. German language. https:\/\/en.wikipedia.org\/wiki\/German_ language."},{"key":"e_1_3_2_1_15_1","unstructured":"Wikipedia. 2020. List of languages by total number of speakers. https:\/\/en. wikipedia.org\/wiki\/List_of_languages_by_total_number_of_speakers.  Wikipedia. 2020. List of languages by total number of speakers. https:\/\/en. wikipedia.org\/wiki\/List_of_languages_by_total_number_of_speakers."},{"key":"e_1_3_2_1_16_1","unstructured":"Wikipedia. 2020. List of Wikipedias. https:\/\/en.wikipedia.org\/wiki\/List_of_ Wikipedias.  Wikipedia. 2020. List of Wikipedias. https:\/\/en.wikipedia.org\/wiki\/List_of_ Wikipedias."},{"key":"e_1_3_2_1_17_1","unstructured":"Wikipedia. 2020. Wolof Wikipedia. https:\/\/en.wikipedia.org\/wiki\/Wolof_ Wikipedia.  Wikipedia. 2020. Wolof Wikipedia. https:\/\/en.wikipedia.org\/wiki\/Wolof_ Wikipedia."},{"key":"e_1_3_2_1_18_1","unstructured":"Nangia N. Bowma S. Williams A. 2020. MultiNLI The Multi-Genre NLI Corpus. https:\/\/cims.nyu.edu\/~sbowman\/multinli.  Nangia N. Bowma S. Williams A. 2020. MultiNLI The Multi-Genre NLI Corpus. https:\/\/cims.nyu.edu\/~sbowman\/multinli."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"crossref","unstructured":"Ikuya Yamada Akari Asai Jin Sakuma Hiroyuki Shindo Hideaki Takeda Yoshiyasu Takefuji and Yuji Matsumoto. 2020. Wikipedia2Vec: An Efficient Toolkit for Learning and Visualizing the Embeddings of Words and Entities from Wikipedia. arXiv:1812.06280 [cs.CL]  Ikuya Yamada Akari Asai Jin Sakuma Hiroyuki Shindo Hideaki Takeda Yoshiyasu Takefuji and Yuji Matsumoto. 2020. Wikipedia2Vec: An Efficient Toolkit for Learning and Visualizing the Embeddings of Words and Entities from Wikipedia. arXiv:1812.06280 [cs.CL]","DOI":"10.18653\/v1\/2020.emnlp-demos.4"},{"key":"e_1_3_2_1_20_1","unstructured":"V. Yordanov. 2018. Introduction To Natural Language Processing For Text. Medium. https:\/\/towardsdatascience.com\/introduction-to-naturallanguage- processing-for-text-df845750fb63.  V. Yordanov. 2018. Introduction To Natural Language Processing For Text. Medium. https:\/\/towardsdatascience.com\/introduction-to-naturallanguage- processing-for-text-df845750fb63."}],"event":{"name":"AIES '21: AAAI\/ACM Conference on AI, Ethics, and Society","location":"Virtual Event USA","acronym":"AIES '21","sponsor":["SIGAI ACM Special Interest Group on Artificial Intelligence","AAAI"]},"container-title":["Proceedings of the 2021 AAAI\/ACM Conference on AI, Ethics, and Society"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3461702.3462530","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3461702.3462530","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:49:06Z","timestamp":1750193346000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3461702.3462530"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,7,21]]},"references-count":20,"alternative-id":["10.1145\/3461702.3462530","10.1145\/3461702"],"URL":"https:\/\/doi.org\/10.1145\/3461702.3462530","relation":{},"subject":[],"published":{"date-parts":[[2021,7,21]]},"assertion":[{"value":"2021-07-30","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}