{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,5]],"date-time":"2025-11-05T11:29:39Z","timestamp":1762342179501,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":49,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,21]],"date-time":"2023-10-21T00:00:00Z","timestamp":1697846400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,21]]},"DOI":"10.1145\/3583780.3614792","type":"proceedings-article","created":{"date-parts":[[2023,10,21]],"date-time":"2023-10-21T07:45:42Z","timestamp":1697874342000},"page":"1400-1410","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["Bias Invariant Approaches for Improving Word Embedding Fairness"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5709-3015","authenticated-orcid":false,"given":"Siyu","family":"Liao","sequence":"first","affiliation":[{"name":"Amazon.com, Seattle, WA, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2420-2438","authenticated-orcid":false,"given":"Rongting","family":"Zhang","sequence":"additional","affiliation":[{"name":"Amazon.com, Seattle, WA, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7669-645X","authenticated-orcid":false,"given":"Barbara","family":"Poblete","sequence":"additional","affiliation":[{"name":"University of Chile &amp; Amazon.com, Santiago, Chile"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1682-0081","authenticated-orcid":false,"given":"Vanessa","family":"Murdock","sequence":"additional","affiliation":[{"name":"Amazon.com, Seattle, WA, USA"}]}],"member":"320","published-online":{"date-parts":[[2023,10,21]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/2976749.2978318"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2020\/60"},{"key":"e_1_3_2_1_3_1","volume-title":"7th International Conference on Learning Representations, ICLR 2019","author":"Bai Yu","year":"2019","unstructured":"Yu Bai, Yu-Xiang Wang, and Edo Liberty. 2019. ProxQuant: Quantized Neural Networks via Proximal Operators. In 7th International Conference on Learning Representations, ICLR 2019, New Orleans, LA, USA, May 6--9, 2019. OpenReview.net. https:\/\/openreview.net\/forum?id=HyzMyhCcK7"},{"key":"e_1_3_2_1_4_1","volume-title":"International Conference on Machine Learning. PMLR, 394--403","author":"Balle Borja","year":"2018","unstructured":"Borja Balle and Yu-Xiang Wang. 2018. Improving the Gaussian mechanism for differential privacy: Analytical calibration and optimal denoising. In International Conference on Machine Learning. PMLR, 394--403."},{"key":"e_1_3_2_1_5_1","volume-title":"A neural probabilistic language model. The journal of machine learning research","author":"Bengio Yoshua","year":"2003","unstructured":"Yoshua Bengio, R\u00e9jean Ducharme, Pascal Vincent, and Christian Janvin. 2003. A neural probabilistic language model. The journal of machine learning research, Vol. 3 (2003), 1137--1155."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-25385-0_12"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.485"},{"key":"e_1_3_2_1_8_1","volume-title":"Man is to computer programmer as woman is to homemaker? debiasing word embeddings. Advances in neural information processing systems","author":"Bolukbasi Tolga","year":"2016","unstructured":"Tolga Bolukbasi, Kai-Wei Chang, James Y Zou, Venkatesh Saligrama, and Adam T Kalai. 2016. Man is to computer programmer as woman is to homemaker? debiasing word embeddings. Advances in neural information processing systems, Vol. 29 (2016), 4349--4357."},{"key":"e_1_3_2_1_9_1","volume-title":"Science","volume":"356","author":"Caliskan Aylin","year":"2017","unstructured":"Aylin Caliskan, Joanna J Bryson, and Arvind Narayanan. 2017. Semantics derived automatically from language corpora contain human-like biases. Science, Vol. 356, 6334 (2017), 183--186."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W16-2501"},{"key":"e_1_3_2_1_11_1","volume-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies","volume":"1","author":"Devlin Jacob","year":"2019","unstructured":"Jacob Devlin, Ming-Wei Chang, Kenton Lee, and Kristina Toutanova. 2019. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers). Association for Computational Linguistics, Minneapolis, Minnesota, 4171--4186. https:\/\/doi.org\/10.18653\/v1\/N19--1423"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1128"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/1645953.1646160"},{"key":"e_1_3_2_1_14_1","first-page":"3","article-title":"The algorithmic foundations of differential privacy","volume":"9","author":"Dwork Cynthia","year":"2014","unstructured":"Cynthia Dwork, Aaron Roth, et al. 2014. The algorithmic foundations of differential privacy. Found. Trends Theor. Comput. Sci., Vol. 9, 3--4 (2014), 211--407.","journal-title":"Found. Trends Theor. Comput. Sci."},{"key":"e_1_3_2_1_15_1","volume-title":"Noiseless Privacy: Definition, Guarantees, and Applications","author":"Farokhi Farhad","year":"2021","unstructured":"Farhad Farokhi. 2021. Noiseless Privacy: Definition, Guarantees, and Applications. IEEE Transactions on Big Data (2021)."},{"key":"e_1_3_2_1_16_1","volume-title":"A synopsis of linguistic theory","author":"Firth John R","year":"1930","unstructured":"John R Firth. 1957. A synopsis of linguistic theory, 1930--1955. Studies in linguistic analysis (1957)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1720347115"},{"key":"e_1_3_2_1_18_1","volume-title":"Proceedings of NAACL-HLT.","author":"Gonen Hila","year":"2019","unstructured":"Hila Gonen and Yoav Goldberg. 2019. Lipstick on a Pig: Debiasing Methods Cover up Systematic Gender Biases in Word Embeddings But do not Remove Them. In Proceedings of NAACL-HLT."},{"key":"e_1_3_2_1_19_1","volume-title":"Proceedings of the International Conference on Language Resources and Evaluation (LREC","author":"Grave Edouard","year":"2018","unstructured":"Edouard Grave, Piotr Bojanowski, Prakhar Gupta, Armand Joulin, and Tomas Mikolov. 2018. Learning Word Vectors for 157 Languages. In Proceedings of the International Conference on Language Resources and Evaluation (LREC 2018)."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1037\/0022-3514.74.6.1464"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3052973.3052992"},{"key":"e_1_3_2_1_22_1","volume-title":"Proceedings of the 28th International Conference on Computational Linguistics: System Demonstrations. International Committee on Computational Linguistics (ICCL), Barcelona, Spain (Online), 34--40","author":"Hollenstein Nora","year":"1865","unstructured":"Nora Hollenstein, Adrian van der Lek, and Ce Zhang. 2020. CogniVal in Action: An Interface for Customizable Cognitive Word Embedding Evaluation. In Proceedings of the 28th International Conference on Computational Linguistics: System Demonstrations. International Committee on Computational Linguistics (ICCL), Barcelona, Spain (Online), 34--40. https:\/\/doi.org\/10.18653\/v1\/2020.coling-demos.7"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3336191.3371779"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00327"},{"key":"e_1_3_2_1_25_1","volume-title":"Word2bits-quantized word vectors. arXiv preprint arXiv:1803.05651","author":"Lam Maximilian","year":"2018","unstructured":"Maximilian Lam. 2018. Word2bits-quantized word vectors. arXiv preprint arXiv:1803.05651 (2018)."},{"key":"e_1_3_2_1_26_1","volume-title":"Neural word embedding as implicit matrix factorization. Advances in neural information processing systems","author":"Levy Omer","year":"2014","unstructured":"Omer Levy and Yoav Goldberg. 2014. Neural word embedding as implicit matrix factorization. Advances in neural information processing systems, Vol. 27 (2014), 2177--2185."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2021.07.045"},{"key":"e_1_3_2_1_28_1","volume-title":"Shared-private bilingual word embeddings for neural machine translation. arXiv preprint arXiv:1906.03100","author":"Liu Xuebo","year":"2019","unstructured":"Xuebo Liu, Derek F Wong, Yang Liu, Lidia S Chao, Tong Xiao, and Jingbo Zhu. 2019. Shared-private bilingual word embeddings for neural machine translation. arXiv preprint arXiv:1906.03100 (2019)."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1062"},{"key":"e_1_3_2_1_30_1","volume-title":"Building a large annotated corpus of English: The Penn Treebank. Using Large Corpora","author":"Marcinkiewicz Mary Ann","year":"1994","unstructured":"Mary Ann Marcinkiewicz. 1994. Building a large annotated corpus of English: The Penn Treebank. Using Large Corpora (1994), 273."},{"key":"e_1_3_2_1_31_1","volume-title":"Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781","author":"Mikolov Tomas","year":"2013","unstructured":"Tomas Mikolov, Kai Chen, Greg Corrado, and Jeffrey Dean. 2013a. Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781 (2013)."},{"key":"e_1_3_2_1_32_1","unstructured":"Tomas Mikolov Ilya Sutskever Kai Chen Greg S Corrado and Jeff Dean. 2013b. Distributed representations of words and phrases and their compositionality. In Advances in neural information processing systems. 3111--3119."},{"key":"e_1_3_2_1_33_1","volume-title":"MS MARCO: A human generated machine reading comprehension dataset. choice","author":"Nguyen Tri","year":"2016","unstructured":"Tri Nguyen, Mir Rosenberg, Xia Song, Jianfeng Gao, Saurabh Tiwary, Rangan Majumder, and Li Deng. 2016. MS MARCO: A human generated machine reading comprehension dataset. choice, Vol. 2640 (2016), 660."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3269206.3269277"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P16-2068"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/361219.361220"},{"key":"e_1_3_2_1_38_1","volume-title":"Introduction to the CoNLL-2000 shared task: Chunking. arXiv preprint cs\/0009008","author":"Sang Erik F","year":"2000","unstructured":"Erik F Sang and Sabine Buchholz. 2000. Introduction to the CoNLL-2000 shared task: Chunking. arXiv preprint cs\/0009008 (2000)."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.3115\/1119176.1119195"},{"key":"e_1_3_2_1_40_1","volume-title":"Measuring word significance using distributed representations of words. arXiv preprint arXiv:1508.02297","author":"Schakel Adriaan MJ","year":"2015","unstructured":"Adriaan MJ Schakel and Benjamin J Wilson. 2015. Measuring word significance using distributed representations of words. arXiv preprint arXiv:1508.02297 (2015)."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1511656113"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.gebnlp-1.15"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"crossref","unstructured":"Robyn Speer Joshua Chin and Catherine Havasi. 2017. ConceptNet 5.5: An Open Multilingual Graph of General Knowledge. 4444--4451. http:\/\/aaai.org\/ocs\/index.php\/AAAI\/AAAI17\/paper\/view\/14972","DOI":"10.1609\/aaai.v31i1.11164"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2018.09.001"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1162"},{"key":"e_1_3_2_1_46_1","article-title":"Visualizing data using t-SNE","volume":"9","author":"der Maaten Laurens Van","year":"2008","unstructured":"Laurens Van der Maaten and Geoffrey Hinton. 2008. Visualizing data using t-SNE. Journal of machine learning research, Vol. 9, 11 (2008).","journal-title":"Journal of machine learning research"},{"key":"e_1_3_2_1_47_1","volume-title":"Controlled experiments for word embeddings. arXiv preprint arXiv:1510.02675","author":"Wilson Benjamin J","year":"2015","unstructured":"Benjamin J Wilson and Adriaan MJ Schakel. 2015. Controlled experiments for word embeddings. arXiv preprint arXiv:1510.02675 (2015)."},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i05.6485"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-2003"}],"event":{"name":"CIKM '23: The 32nd ACM International Conference on Information and Knowledge Management","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Birmingham United Kingdom","acronym":"CIKM '23"},"container-title":["Proceedings of the 32nd ACM International Conference on Information and Knowledge Management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3583780.3614792","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3583780.3614792","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T16:36:56Z","timestamp":1750178216000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3583780.3614792"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,21]]},"references-count":49,"alternative-id":["10.1145\/3583780.3614792","10.1145\/3583780"],"URL":"https:\/\/doi.org\/10.1145\/3583780.3614792","relation":{},"subject":[],"published":{"date-parts":[[2023,10,21]]},"assertion":[{"value":"2023-10-21","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}