{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,5]],"date-time":"2026-06-05T01:24:09Z","timestamp":1780622649722,"version":"3.54.1"},"reference-count":46,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T00:00:00Z","timestamp":1764201600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T00:00:00Z","timestamp":1764201600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"name":"National Research Foundation of South Africa","award":["137755"],"award-info":[{"award-number":["137755"]}]},{"name":"National Research Foundation of South Africa","award":["137755"],"award-info":[{"award-number":["137755"]}]},{"DOI":"10.13039\/501100001711","name":"Swiss National Science Foundation","doi-asserted-by":"crossref","award":["10001AL_205032"],"award-info":[{"award-number":["10001AL_205032"]}],"id":[{"id":"10.13039\/501100001711","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001711","name":"Swiss National Science Foundation","doi-asserted-by":"crossref","award":["10001AL_205032"],"award-info":[{"award-number":["10001AL_205032"]}],"id":[{"id":"10.13039\/501100001711","id-type":"DOI","asserted-by":"crossref"}]},{"name":"University of Johannesburg, Johannesburg, South Africa"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["EPJ Data Sci."],"DOI":"10.1140\/epjds\/s13688-025-00594-2","type":"journal-article","created":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T08:46:36Z","timestamp":1764233196000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["The news in black and white: word embeddings quantify racism in South African news"],"prefix":"10.1140","volume":"14","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8633-8103","authenticated-orcid":false,"given":"Nnaemeka","family":"Ohamadike","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2926-5953","authenticated-orcid":false,"given":"Kevin","family":"Durrheim","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5270-3619","authenticated-orcid":false,"given":"Mpho","family":"Primus","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,11,27]]},"reference":[{"issue":"2","key":"594_CR1","first-page":"7","volume":"10","author":"V Alhadeff","year":"2018","unstructured":"Alhadeff V (2018) Journalism during South Africa\u2019s apartheid regime. Cosmop Civ Soc, Interdiscip J 10(2):7\u201311","journal-title":"Cosmop Civ Soc, Interdiscip J"},{"issue":"4","key":"594_CR2","doi-asserted-by":"publisher","first-page":"1484","DOI":"10.1177\/00491241221122603","volume":"51","author":"A Arseniev-Koehler","year":"2022","unstructured":"Arseniev-Koehler A, Foster JG (2022) Machine learning as a model for cultural learning: teaching an algorithm what it means to be fat. Sociol Methods Res 51(4):1484\u20131539","journal-title":"Sociol Methods Res"},{"key":"594_CR3","unstructured":"Berger G (2000) Submission for HRC investigation into racism and the media. Unpublished Paper, submitted to the Human Rights Commission"},{"issue":"1\u20132","key":"594_CR4","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1080\/02560240185310081","volume":"15","author":"G Berger","year":"2001","unstructured":"Berger G (2001) Problematising race for journalists: critical reflections on the South African human rights commission inquiry into media racism. Crit Arts 15(1\u20132):69\u201396","journal-title":"Crit Arts"},{"key":"594_CR5","series-title":"Lecture notes on data engineering and communications technologies","volume-title":"Innovative data communication technologies and application","author":"SS Birunda","year":"2021","unstructured":"Birunda SS, Devi RK (2021) A review on word embedding techniques for text classification. In: Raj JS, Iliyasu AM, Bestak R, Baig ZA (eds) Innovative data communication technologies and application. Lecture notes on data engineering and communications technologies, vol\u00a059. Springer, Singapore"},{"key":"594_CR6","unstructured":"Bolukbasi T, Chang KW, Zou JY, Saligrama V, Kalai AT (2016) Man is to computer programmer as woman is to homemaker? Debiasing word embeddings. Adv. Neural Inf. Process. Syst. 29"},{"key":"594_CR7","volume-title":"Human rights commission, interim report into racism in the media","author":"C Braude","year":"1999","unstructured":"Braude C (1999) Cultural bloodstains: towards understanding the legacy of apartheid and the perpetuation of racial stereotypes in the contemporary South African media. In: Human rights commission, interim report into racism in the media. South African Human Rights Commission, Johannesburg"},{"issue":"6334","key":"594_CR8","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1126\/science.aal4230","volume":"356","author":"A Caliskan","year":"2017","unstructured":"Caliskan A, Bryson JJ, Narayanan A (2017) Semantics derived automatically from language corpora contain human-like biases. Science 356(6334):183\u2013186","journal-title":"Science"},{"key":"594_CR9","first-page":"594","volume-title":"Handbook of language analysis in psychology","author":"TE Charlesworth","year":"2022","unstructured":"Charlesworth TE, Banaji MR (2022) Word embeddings reveal social group attitudes and stereotypes in large language corpora. In: Handbook of language analysis in psychology, pp 594\u2013608"},{"key":"594_CR10","unstructured":"ChatGPT (2024a) Personal Communication on Race Stereotypes. OpenAI. https:\/\/chatgpt.com\/share\/2d6e3a17-e726-497e-b654-0a4ae9e308e0. Retrieved 19 May 2024"},{"key":"594_CR11","unstructured":"ChatGPT (2024b) Personal Communication on Black and White South African Names. OpenAI. https:\/\/chatgpt.com\/share\/de3c1ef8-678a-4e89-ae33-fbf24ad28cb9. Retrieved 19 May 2024"},{"key":"594_CR12","unstructured":"Devlin J, Chang MW, Lee K, Toutanova K (2018) Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805"},{"key":"594_CR13","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1163\/156914907X207757","volume":"6","author":"L Dris-A\u00eft-Hamadouche","year":"2007","unstructured":"Dris-A\u00eft-Hamadouche L, Zoubir Y (2007) The Maghreb: social, political, and economic developments. Perspect Glob Dev Technol 6:261\u2013290. https:\/\/doi.org\/10.1163\/156914907X207757","journal-title":"Perspect Glob Dev Technol"},{"issue":"1\u20132","key":"594_CR14","doi-asserted-by":"publisher","first-page":"167","DOI":"10.1080\/02560040585310111","volume":"19","author":"K Durrheim","year":"2005","unstructured":"Durrheim K, Quayle M, Whitehead K, Kriel A (2005) Denying racism: discursive strategies used by the South African media. Crit Arts 19(1\u20132):167\u2013186","journal-title":"Crit Arts"},{"key":"594_CR15","doi-asserted-by":"publisher","first-page":"617","DOI":"10.1111\/bjso.12560","volume":"62","author":"K Durrheim","year":"2023","unstructured":"Durrheim K, Schuld M, Mafunda M, Mazibuko S (2023) Using word embeddings to investigate cultural biases. Br J Soc Psychol 62:617\u2013629. https:\/\/doi.org\/10.1111\/bjso.12560","journal-title":"Br J Soc Psychol"},{"key":"594_CR16","doi-asserted-by":"publisher","first-page":"E3635","DOI":"10.1073\/pnas.1720347115","volume":"115","author":"N Garg","year":"2018","unstructured":"Garg N, Schiebinger L, Jurafsky D, Zou J (2018) Word embeddings quantify 100 years of gender and ethnic stereotypes. Proc Natl Acad Sci USA 115:E3635\u2013E3644. https:\/\/doi.org\/10.1073\/pnas.1720347115","journal-title":"Proc Natl Acad Sci USA"},{"issue":"396","key":"594_CR17","doi-asserted-by":"publisher","first-page":"373","DOI":"10.1093\/afraf\/99.396.373","volume":"99","author":"D Glaser","year":"2000","unstructured":"Glaser D (2000) The media inquiry reports of the South African human rights commission: a critique. Afr Aff 99(396):373\u2013393","journal-title":"Afr Aff"},{"issue":"2","key":"594_CR18","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1080\/23743670.2022.2096090","volume":"43","author":"P Govenden","year":"2022","unstructured":"Govenden P (2022) Does black economic empowerment ownership matter? A decolonial analysis of \u201cblack visibility\u201d in South Africa\u2019s print media content, 1994\u20132014. Afr Journal Stud 43(2):1\u201320. https:\/\/doi.org\/10.1080\/23743670.2022.2096090","journal-title":"Afr Journal Stud"},{"key":"594_CR19","unstructured":"Green M (2012) Media representations of gratuitous violence in South Africa. Doctoral dissertation"},{"issue":"6","key":"594_CR20","doi-asserted-by":"publisher","first-page":"1464","DOI":"10.1037\/0022-3514.74.6.1464","volume":"74","author":"AG Greenwald","year":"1998","unstructured":"Greenwald AG, McGhee DE, Schwartz JL (1998) Measuring individual differences in implicit cognition: the implicit association test. J Pers Soc Psychol 74(6):1464","journal-title":"J Pers Soc Psychol"},{"key":"594_CR21","volume-title":"Interim report of the inquiry into racism in the media","author":"Human Rights Commission (HRC)","year":"1999","unstructured":"Human Rights Commission (HRC) (1999) Interim report of the inquiry into racism in the media. South African Human Rights Commission, Johannesburg"},{"key":"594_CR22","unstructured":"Jacobson M (2020) Social equity considerations: an imperative in a time of a pandemic. Governing. https:\/\/www.governing.com\/community\/Social-Equity-Considerations-An-Imperative-in-a-Time-of-Pandemic.html"},{"key":"594_CR23","unstructured":"Kolbe HR (2005). The South African print media: from apartheid to transformation"},{"issue":"5","key":"594_CR24","doi-asserted-by":"publisher","first-page":"905","DOI":"10.1177\/0003122419877135","volume":"84","author":"AC Kozlowski","year":"2019","unstructured":"Kozlowski AC, Taddy M, Evans JA (2019) The geometry of culture: analyzing the meanings of class through word embeddings. Am Sociol Rev 84(5):905\u2013949","journal-title":"Am Sociol Rev"},{"issue":"5","key":"594_CR25","doi-asserted-by":"publisher","first-page":"569","DOI":"10.1037\/amp0000364","volume":"74","author":"B Kurdi","year":"2019","unstructured":"Kurdi B, Seitchik AE, Axt JR, Carroll TJ, Karapetyan A, Kaushik N, Banaji MR (2019) Relationship between the implicit association test and intergroup behavior: a meta-analysis. Am Psychol 74(5):569","journal-title":"Am Psychol"},{"key":"594_CR26","doi-asserted-by":"publisher","unstructured":"Mafunda MC, Schuld M, Durrheim K, Mazibuko S (2022) A word embedding trained on South African news data. Afr. J. Inf. Commun. 30. https:\/\/doi.org\/10.23962\/ajic.i30.13906","DOI":"10.23962\/ajic.i30.13906"},{"key":"594_CR27","unstructured":"Majavu A (2015) Merging the Black press with mainstream newspapers in post-apartheid South Africa: a phenomenological study of journalists at Sowetan newspaper between 2009 and 2012. Doctoral dissertation, Auckland University of Technology"},{"key":"594_CR28","unstructured":"Media Development and Diversity Agency (MDDA) (2024) About us. https:\/\/www.mdda.org.za\/overview.html. Accessed 10 Jun 2024"},{"key":"594_CR29","volume-title":"Human rights commission, interim report into racism in the media","author":"Media Monitoring Project","year":"1999","unstructured":"Media Monitoring Project (1999) The news in black and white: an investigation into racial stereotyping in the media. In: Human rights commission, interim report into racism in the media. South African Human Rights Commission, Johannesburg"},{"key":"594_CR30","unstructured":"Media Monitoring Project (2006) Revealing Race: an analysis of the coverage of race and xenophobia in the South African print media. https:\/\/www.mediamonitoringafrica.org\/images\/uploads\/Final_report_v5_Print_final.pdf. Accessed 06 Jun 2024"},{"issue":"1\u20132","key":"594_CR31","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1080\/02560240185310071","volume":"15","author":"C Merrett","year":"2001","unstructured":"Merrett C (2001) A tale of two paradoxes: media censorship in South Africa, pre-liberation and post-apartheid. Crit Arts 15(1\u20132):50\u201368","journal-title":"Crit Arts"},{"key":"594_CR32","unstructured":"Mikolov T, Sutskever I, Chen K, Corrado G, Dean J (2013) Efficient Estimation of Word Representations in Vector Space. arXiv:1301.3781"},{"key":"594_CR33","first-page":"45","volume":"130","author":"N Nattrass","year":"2016","unstructured":"Nattrass N, Seekings J (2016) \u201cTwo nations\u201d? Race and economic inequality in South Africa today. Daedalus 130:45\u201370","journal-title":"Daedalus"},{"key":"594_CR34","unstructured":"Oxfam (2021) COVID-19 in South Africa: the intersections of race and inequality. https:\/\/www.oxfam.org.za\/covid-19-in-sa\/. Accessed 24 Nov 2024"},{"key":"594_CR35","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162","volume-title":"Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP); Doha, Qatar","author":"J Pennington","year":"2014","unstructured":"Pennington J, Socher R, Manning C (2014) Glove: global vectors for word representation. In: Moschitti A, Pang B (eds) Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP); Doha, Qatar Association for computational linguistics, Stroudsburg. https:\/\/doi.org\/10.3115\/v1\/D14-1162"},{"issue":"397","key":"594_CR36","doi-asserted-by":"publisher","first-page":"525","DOI":"10.1093\/afraf\/99.397.525","volume":"99","author":"NB Pityana","year":"2000","unstructured":"Pityana NB (2000) South Africa\u2019s inquiry into racism in the media: the role of national institutions in the promotion and protection of human rights. Afr Aff 99(397):525\u2013532","journal-title":"Afr Aff"},{"key":"594_CR37","doi-asserted-by":"publisher","first-page":"154","DOI":"10.1007\/978-1-349-21074-9_6","volume-title":"Political violence and the struggle in South Africa","author":"D Posel","year":"1990","unstructured":"Posel D (1990) Symbolizing violence: state and media discourse in TV coverage of township protest, 1985\u20137. In: Political violence and the struggle in South Africa. Palgrave Macmillan UK, London, pp\u00a0154\u2013171"},{"issue":"1","key":"594_CR38","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1007\/s10579-022-09620-5","volume":"57","author":"Z Rahimi","year":"2023","unstructured":"Rahimi Z, Homayounpour MM (2023) The impact of preprocessing on word embedding quality: a comparative study. Lang Resour Eval 57(1):257\u2013291","journal-title":"Lang Resour Eval"},{"issue":"3","key":"594_CR39","first-page":"364","volume":"42","author":"KJ Roberto","year":"2020","unstructured":"Roberto KJ, Johnson AF, Rauhaus BM (2020) Stigmatization and prejudice during the COVID-19 pandemic. Adm Theory Prax 42(3):364\u2013378","journal-title":"Adm Theory Prax"},{"key":"594_CR40","doi-asserted-by":"crossref","unstructured":"Schuld M, Durrheim K, Mafunda M (2023) Speaker landscapes: Machine learning opens a window on the everyday language of opinion. Commun. Methods Meas.: 1\u201317","DOI":"10.31219\/osf.io\/smhn5"},{"key":"594_CR41","unstructured":"Shuyo N (2014). langdetect: Language detection library ported from Google\u2019s language-detection"},{"issue":"4","key":"594_CR42","doi-asserted-by":"publisher","first-page":"476","DOI":"10.1177\/008124631204200403","volume":"42","author":"K Talbot","year":"2012","unstructured":"Talbot K, Durrheim K (2012) The Princeton trilogy revisited: how have racial stereotypes changed in South Africa? S Afr J Psychol 42(4):476\u2013491","journal-title":"S Afr J Psychol"},{"key":"594_CR43","volume-title":"Report of the truth and reconciliation commission: volume four, Chapter Six","author":"Truth and Reconciliation Commission of South Africa (TRC)","year":"1998","unstructured":"Truth and Reconciliation Commission of South Africa (TRC) (1998) Report of the truth and reconciliation commission: volume four, Chapter Six. [Online]. Institutional Hearing. https:\/\/www.justice.gov.za\/trc\/report\/finalreport\/Volume%204.pdf. Accessed 06 Jun 2024"},{"key":"594_CR44","doi-asserted-by":"publisher","unstructured":"Wasserman H (2007) Is Our Media (Still) Racist? Global Media J.: Afr. Ed. 1(1). https:\/\/doi.org\/10.5789\/1-1-53","DOI":"10.5789\/1-1-53"},{"issue":"3","key":"594_CR45","doi-asserted-by":"publisher","first-page":"451","DOI":"10.1007\/s11616-020-00594-4","volume":"65","author":"H Wasserman","year":"2020","unstructured":"Wasserman H (2020) The state of South African media: a space to contest democracy. Publizistik 65(3):451\u2013465","journal-title":"Publizistik"},{"key":"594_CR46","unstructured":"World Bank (2021) Middle East and North Africa. https:\/\/www.worldbank.org\/en\/region\/mena\/overview. Accessed 18 Dec 2023"}],"container-title":["EPJ Data Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1140\/epjds\/s13688-025-00594-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1140\/epjds\/s13688-025-00594-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1140\/epjds\/s13688-025-00594-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,27]],"date-time":"2025-11-27T08:46:42Z","timestamp":1764233202000},"score":1,"resource":{"primary":{"URL":"https:\/\/epjdatascience.springeropen.com\/articles\/10.1140\/epjds\/s13688-025-00594-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,27]]},"references-count":46,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["594"],"URL":"https:\/\/doi.org\/10.1140\/epjds\/s13688-025-00594-2","relation":{},"ISSN":["2193-1127"],"issn-type":[{"value":"2193-1127","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,11,27]]},"assertion":[{"value":"13 February 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 October 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 November 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"This study was conducted in strict accordance with ethical guidelines (University of Johannesburg ethical clearance code: 2025SCiiS089). All human participants provided informed consent prior to their involvement, having been fully briefed on the study\u2019s purpose and procedures. Confidentiality and anonymity were guaranteed and maintained throughout the research process.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"83"}}