{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T09:56:58Z","timestamp":1773482218447,"version":"3.50.1"},"reference-count":189,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,11,25]],"date-time":"2025-11-25T00:00:00Z","timestamp":1764028800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,11,25]],"date-time":"2025-11-25T00:00:00Z","timestamp":1764028800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Deutsche Gesellschaft fur Internationale Zusammenarbeit (GIZ) GmbH"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1007\/s41060-025-00954-1","type":"journal-article","created":{"date-parts":[[2025,11,25]],"date-time":"2025-11-25T13:51:41Z","timestamp":1764078701000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A systematic review of accent classification techniques and datasets for inclusive speech recognition"],"prefix":"10.1007","volume":"21","author":[{"given":"Amina","family":"Salifu","sequence":"first","affiliation":[]},{"given":"Henry Nunoo","family":"Mensah","sequence":"additional","affiliation":[]},{"given":"Eric Tutu","family":"Tchao","sequence":"additional","affiliation":[]},{"given":"Ali Musah","family":"Ibrahim","sequence":"additional","affiliation":[]},{"given":"Francisca Adoma","family":"Acheampong","sequence":"additional","affiliation":[]},{"given":"Jerry John","family":"Kponyo","sequence":"additional","affiliation":[]},{"given":"Andrew Selasi","family":"Agbemenu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,11,25]]},"reference":[{"key":"954_CR1","doi-asserted-by":"crossref","unstructured":"Sharma, A., Bhargava, M., Khanna, A.V.: Native and non-native English speech classification: a premise to accent conversion. In: 2021 Fourth International Conference on Electrical, Computer and Communication Technologies (ICECCT), pp. 1\u20137. IEEE (2021)","DOI":"10.1109\/ICECCT52121.2021.9616718"},{"key":"954_CR2","doi-asserted-by":"crossref","unstructured":"Hughes, A., Trudgill, P., Watt, D.: English Accents and Dialects: An Introduction to Social and Regional Varieties of English in the British Isles. Routledge, London (2013)","DOI":"10.4324\/9780203784440"},{"key":"954_CR3","first-page":"1607","volume":"4","author":"J Jenkins","year":"2014","unstructured":"Jenkins, J., Leung, C.: English as a lingua franca. Companion Lang. Assess. 4, 1607\u20131616 (2014)","journal-title":"Companion Lang. Assess."},{"key":"954_CR4","unstructured":"Orr, R., Quen\u00e9, H.: D-Lucea: Curation of the UCU accent project data (2017). https:\/\/api.semanticscholar.org\/CorpusID:64947589"},{"key":"954_CR5","doi-asserted-by":"crossref","unstructured":"Shahriar, S., Lund, B.D., Mannuru, N.R., Arshad, M.A., Hayawi, K., Bevara, R.V.K., Mannuru, A., Batool, L.: Putting GPT-4o to the sword: A comprehensive evaluation of language, vision, speech, and multimodal proficiency. arXiv:2407.09519 (2024)","DOI":"10.20944\/preprints202406.1635.v1"},{"issue":"6","key":"954_CR6","doi-asserted-by":"publisher","first-page":"3848","DOI":"10.1121\/10.0026235","volume":"155","author":"S Ghorbani","year":"2023","unstructured":"Ghorbani, S., Hansen, J.H.L.: Advanced accent\/dialect identification and accentedness assessment with multi-embedding models and automatic speech recognition. J. Acoust. Soc. Am. 155(6), 3848\u20133860 (2023)","journal-title":"J. Acoust. Soc. Am."},{"key":"954_CR7","unstructured":"Zuluaga, J.P., Ahmed, S., Visockas, D., Subakan, C.: Commonaccent: exploring large acoustic pretrained models for accent classification based on common voice. arXiv:2305.18283 (2023)"},{"key":"954_CR8","doi-asserted-by":"crossref","unstructured":"Na, H.-J., Park, J.-S.: Accented speech recognition based on end-to-end domain adversarial training of neural networks. Appl. Sci. (2021)","DOI":"10.3390\/app11188412"},{"key":"954_CR9","doi-asserted-by":"crossref","unstructured":"Mikhailava, V., Lesnichaia, M., Bogach, N., Lezhenin, I., Blake, J., , Pyshkin, E.: Language accent detection with CNN using sparse data from a crowd-sourced speech archive. Mathematics (2022)","DOI":"10.3390\/math10162913"},{"key":"954_CR10","unstructured":"Li, Q.: Fine-tuning Cantonese based on wav2vec 2.0 XLRs model that pretrained on mandarin Chinese to improve ASR performance (2024)"},{"key":"954_CR11","doi-asserted-by":"publisher","first-page":"242","DOI":"10.4236\/ojml.2018.86021","volume":"08","author":"NA Algharabali","year":"2018","unstructured":"Algharabali, N.A., Taqi, H.: Performing speaking \u201cungrammatical\u2019\u2019 American English: A Kuwaiti linguistic phenomenon. Open J. Mod. Linguist. 08, 242\u2013261 (2018)","journal-title":"Open J. Mod. Linguist."},{"key":"954_CR12","doi-asserted-by":"crossref","unstructured":"Cheng, Z., She, Y., Fu, J., Xu, W.: Familiarity determines whether accent affects attitudes and behaviors of the listener. Behav. Sci. 14 (2024)","DOI":"10.3390\/bs14060430"},{"key":"954_CR13","doi-asserted-by":"crossref","unstructured":"Caffarra, S., Michell, E., Martin, C.D.: The impact of foreign accent on irony interpretation. PLoS ONE 13 (2018)","DOI":"10.1371\/journal.pone.0200939"},{"key":"954_CR14","doi-asserted-by":"crossref","unstructured":"Grant, L.H., Shahwan, A., Maoz, I., Keysar, B.: The influence of accent on the evaluation of trust-building efforts during conflict. PLOS ONE 19 (2024)","DOI":"10.1371\/journal.pone.0311373"},{"key":"954_CR15","doi-asserted-by":"crossref","unstructured":"Cowan, B.R., Doyle, P.R., Edwards, J., Garaialde, D., Hayes-Brady, A., Branigan, H.P., Cabral, J.P., Clark, L.M.H.: What\u2019s in an accent?: the impact of accented synthetic speech on lexical choice in human-machine dialogue. In: Proceedings of the 1st International Conference on Conversational User Interfaces (2019)","DOI":"10.1145\/3342775.3342786"},{"issue":"5","key":"954_CR16","doi-asserted-by":"publisher","first-page":"2473","DOI":"10.1121\/1.4744783","volume":"109","author":"CL Rogers","year":"2001","unstructured":"Rogers, C.L., Dalby, J.M., Nishi, K.: Effects of noise and proficiency level on intelligibility of Chinese-accented English. J. Acoust. Soc. Am. 109(5), 2473\u20132473 (2001)","journal-title":"J. Acoust. Soc. Am."},{"issue":"3","key":"954_CR17","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1177\/002383099503800305","volume":"38","author":"MJ Munro","year":"1995","unstructured":"Munro, M.J., Derwing, T.M.: Processing time, accent, and comprehensibility in the perception of native and foreign-accented speech. Lang. Speech 38(3), 289\u2013306 (1995)","journal-title":"Lang. Speech"},{"issue":"1","key":"954_CR18","doi-asserted-by":"publisher","first-page":"8337","DOI":"10.1038\/s41598-022-12260-y","volume":"12","author":"M Orken","year":"2022","unstructured":"Orken, M., Dina, O., Keylan, A., Tolganay, T., Mohamed, O.: A study of transformer-based end-to-end speech recognition system for Kazakh language. Sci. Rep. 12(1), 8337 (2022)","journal-title":"Sci. Rep."},{"key":"954_CR19","doi-asserted-by":"publisher","first-page":"32176","DOI":"10.1109\/ACCESS.2023.3259901","volume":"11","author":"YA Wubet","year":"2023","unstructured":"Wubet, Y.A., Balram, D., Lian, K.-Y.: Intra-native accent shared features for improving neural network-based accent classification and accent similarity evaluation. IEEE Access 11, 32176\u201332186 (2023). https:\/\/doi.org\/10.1109\/ACCESS.2023.3259901","journal-title":"IEEE Access"},{"key":"954_CR20","doi-asserted-by":"crossref","unstructured":"Ito, Y.: Japanese EFL learners\u2019 perceptions of different accents in spoken English. Aust. J. Appl. Linguist. (2019)","DOI":"10.29140\/ajal.v2n2.160"},{"key":"954_CR21","unstructured":"Shriberg, E., Ferrer, L., Kajarekar, S.S., Scheffer, N., Stolcke, A., Akbacak, M.: Detecting nonnative speech using speaker recognition approaches. In: Odyssey, p. 26 (2008)"},{"issue":"2","key":"954_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2661637","volume":"14","author":"H-P Shen","year":"2015","unstructured":"Shen, H.-P., Wu, C.-H., Tsai, P.-S.: Model generation of accented speech using model transformation and verification for bilingual speech recognition. ACM Trans. Asian Low-Resource Lang. Inf. Process. (TALLIP) 14(2), 1\u201324 (2015)","journal-title":"ACM Trans. Asian Low-Resource Lang. Inf. Process. (TALLIP)"},{"key":"954_CR23","doi-asserted-by":"crossref","unstructured":"Najafian, M., Safavi, S., Weber, P., Russell, M.J.: Identification of british english regional accents using fusion of i-vector and multi-accent phonotactic systems. In: Odyssey, pp. 132\u2013139 (2016)","DOI":"10.21437\/Odyssey.2016-19"},{"key":"954_CR24","doi-asserted-by":"publisher","first-page":"120","DOI":"10.1016\/j.neucom.2017.01.116","volume":"277","author":"M Rizwan","year":"2018","unstructured":"Rizwan, M., Anderson, D.V.: A weighted accent classification using multiple words. Neurocomputing 277, 120\u2013128 (2018)","journal-title":"Neurocomputing"},{"key":"954_CR25","doi-asserted-by":"crossref","unstructured":"Krishna, G.R., Krishnan, R., Mittal, V.K.: A system for automatic regional accent classification. In: 2020 IEEE 17th India Council International Conference (INDICON), pp. 1\u20135. IEEE (2020)","DOI":"10.1109\/INDICON49873.2020.9342577"},{"key":"954_CR26","doi-asserted-by":"crossref","unstructured":"Gong, X., Lu, Y., Zhou, Z., Qian, Y.: Layer-wise fast adaptation for end-to-end multi-accent speech recognition. arXiv:2204.09883 (2022)","DOI":"10.21437\/Interspeech.2021-1075"},{"key":"954_CR27","doi-asserted-by":"crossref","unstructured":"Widyowaty, D.S., Sunyoto, A.: Accent recognition by native language using mel-frequency cepstral coefficient and k-nearest neighbor. In: 2020 3rd International Conference on Information and Communications Technology (ICOIACT), pp. 314\u2013318. IEEE (2020)","DOI":"10.1109\/ICOIACT50329.2020.9332026"},{"key":"954_CR28","doi-asserted-by":"crossref","unstructured":"Nicastro, D., Inguanez, F.: Multi-tier accent classification for improved transcribing. In: 2020 IEEE 10th International Conference on Consumer Electronics (ICCE-Berlin), pp. 1\u20136. IEEE (2020)","DOI":"10.1109\/ICCE-Berlin50680.2020.9352197"},{"key":"954_CR29","unstructured":"Duduka, S., Jain, H., Jain, V., Prabhu, H., Chawan, P.: Accent classification using machine learning. Int. Res. J. Eng. Technol. (IRJET) 7(11) (2020)"},{"key":"954_CR30","doi-asserted-by":"crossref","unstructured":"Al-Jumaili, Z., Bassiouny, T., Alanezi, A., Khan, W., Al-Jumeily, D., Hussain, A.J.: Classification of spoken English accents using deep learning and speech analysis. In: International Conference on Intelligent Computing, pp. 277\u2013287. Springer (2022)","DOI":"10.1007\/978-3-031-13832-4_24"},{"key":"954_CR31","doi-asserted-by":"publisher","first-page":"32176","DOI":"10.1109\/ACCESS.2023.3259901","volume":"11","author":"YA Wubet","year":"2023","unstructured":"Wubet, Y.A., Balram, D., Lian, K.-Y.: Intra-native accent shared features for improving neural network-based accent classification and accent similarity evaluation. IEEE Access 11, 32176\u201332186 (2023)","journal-title":"IEEE Access"},{"key":"954_CR32","doi-asserted-by":"crossref","unstructured":"Walsh, D., Dev, S., Nag, A.: Hilbert-huang-transform based features for accent classification of non-native english speakers. In: 2023 34th Irish Signals and Systems Conference (ISSC), pp. 1\u20136 (2023). IEEE","DOI":"10.1109\/ISSC59246.2023.10162075"},{"key":"954_CR33","doi-asserted-by":"crossref","unstructured":"Song, T., Nguyen, L.T.H., Ta, T.V.: Mpsa-densenet: A novel deep learning model for english accent classification. Computer Speech & Language, 101676 (2024)","DOI":"10.1016\/j.csl.2024.101676"},{"key":"954_CR34","doi-asserted-by":"crossref","unstructured":"Watanabe, C., Kameoka, H.: Ge2e-ac: Generalized end-to-end loss training for accent classification. In: 2024 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC), pp. 1\u20136 (2024). IEEE","DOI":"10.1109\/APSIPAASC63619.2025.10848863"},{"key":"954_CR35","doi-asserted-by":"crossref","unstructured":"Kashif, K., Alwan, A., Wu, Y., De\u00a0Nardis, L., Di\u00a0Benedetto, M.-G.: Mkelm based multi-classification model for foreign accent identification. Heliyon 10(16) (2024)","DOI":"10.1016\/j.heliyon.2024.e36460"},{"key":"954_CR36","doi-asserted-by":"crossref","unstructured":"Ahmed, G., Lawaye, A.A., Jain, V., Chatterjee, J.M., Mahajan, S.: Enhancing english accent identification in automatic speech recognition using spectral features and hybrid cnn-bilstm model. Multimedia Tools and Applications, 1\u201328 (2025)","DOI":"10.1007\/s11042-025-20678-5"},{"key":"954_CR37","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2024.109512","volume":"139","author":"D Subhash","year":"2025","unstructured":"Subhash, D., Premjith, B., Ravi, V., et al.: A robust accent classification system based on variational mode decomposition. Eng. Appl. Artif. Intell. 139, 109512 (2025)","journal-title":"Eng. Appl. Artif. Intell."},{"key":"954_CR38","unstructured":"Higgins, J., Green, S.: Cochrane handbook for systematic reviews of interventions version 5.1. 0 [updated march 2011]. the cochrane collaboration, 2011. available from www. cochrane-handbook. org. Accessed August 29 (2011)"},{"issue":"17","key":"954_CR39","first-page":"3140","volume":"116","author":"M Crowther","year":"2010","unstructured":"Crowther, M., Lim, W., Crowther, M.A.: Systematic review and meta-analysis methodology. Blood, The Journal of the American Society of Hematology 116(17), 3140\u20133146 (2010)","journal-title":"Blood, The Journal of the American Society of Hematology"},{"issue":"7446","key":"954_CR40","doi-asserted-by":"publisher","first-page":"1010","DOI":"10.1136\/bmj.328.7446.1010","volume":"328","author":"J Thomas","year":"2004","unstructured":"Thomas, J., Harden, A., Oakley, A., Oliver, S., Sutcliffe, K., Rees, R., Brunton, G., Kavanagh, J.: Integrating qualitative research with trials in systematic reviews. BMJ 328(7446), 1010\u20131012 (2004)","journal-title":"BMJ"},{"key":"954_CR41","doi-asserted-by":"crossref","unstructured":"Moher, D., Liberati, A., Tetzlaff, J., Altman, D.G., Group*, P.: Preferred reporting items for systematic reviews and meta-analyses: the prisma statement. Annals of internal medicine 151(4), 264\u2013269 (2009)","DOI":"10.7326\/0003-4819-151-4-200908180-00135"},{"issue":"2004","key":"954_CR42","first-page":"1","volume":"33","author":"B Kitchenham","year":"2004","unstructured":"Kitchenham, B.: Procedures for performing systematic reviews. Keele, UK, Keele University 33(2004), 1\u201326 (2004)","journal-title":"Keele, UK, Keele University"},{"key":"954_CR43","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1016\/j.jbusres.2019.07.039","volume":"104","author":"H Snyder","year":"2019","unstructured":"Snyder, H.: Literature review as a research methodology: An overview and guidelines. J. Bus. Res. 104, 333\u2013339 (2019)","journal-title":"J. Bus. Res."},{"key":"954_CR44","doi-asserted-by":"publisher","first-page":"55771","DOI":"10.1109\/ACCESS.2023.3282259","volume":"11","author":"AMA Alqadasi","year":"2023","unstructured":"Alqadasi, A.M.A., Abdulghafor, R., Sunar, M.S., Salam, M.S.B.H.J.: Modern standard arabic speech corpora: A systematic review. IEEE Access 11, 55771\u201355796 (2023). https:\/\/doi.org\/10.1109\/ACCESS.2023.3282259","journal-title":"IEEE Access"},{"key":"954_CR45","doi-asserted-by":"publisher","first-page":"55771","DOI":"10.1109\/ACCESS.2023.3282259","volume":"11","author":"AMA Alqadasi","year":"2023","unstructured":"Alqadasi, A.M.A., Abdulghafor, R., Sunar, M.S., Salam, M.S.B.H.: Modern standard arabic speech corpora: A systematic review. Ieee Access 11, 55771\u201355796 (2023)","journal-title":"Ieee Access"},{"key":"954_CR46","doi-asserted-by":"crossref","unstructured":"Iadkert, K., Hassan, R., Hashim, A.B.: Acoustic measurements and intelligibility of english vowels produced by thai speakers. Studies in English Language and Education (2024)","DOI":"10.24815\/siele.v11i2.33337"},{"key":"954_CR47","doi-asserted-by":"crossref","unstructured":"Winckel, E., D\u0105browska, E.: Language analytic ability, print exposure, memory and comprehension of complex syntax by adult native speakers. Journal of Cognition 7 (2024)","DOI":"10.5334\/joc.333"},{"key":"954_CR48","doi-asserted-by":"crossref","unstructured":"Rabinovich, E., Nisioi, S., Ordan, N., Wintner, S.: On the similarities between native, non-native and translated texts. arXiv:1609.03204 (2016)","DOI":"10.18653\/v1\/P16-1176"},{"key":"954_CR49","doi-asserted-by":"crossref","unstructured":"Riduan, G.M., Soesanti, I., Adji, T.B.: A systematic literature review of text classification: Datasets and methods. In: 2021 IEEE 5th International Conference on Information Technology, Information Systems and Electrical Engineering (ICITISEE), pp. 71\u201377 (2021). IEEE","DOI":"10.1109\/ICITISEE53823.2021.9655788"},{"key":"954_CR50","doi-asserted-by":"crossref","unstructured":"Humayun, M.A., Shuja, J., Abas, P.E.: A review of social background profiling of speakers from speech accents. PeerJ Computer Science 10 (2024)","DOI":"10.7717\/peerj-cs.1984"},{"key":"954_CR51","unstructured":"Weinberger, S.: Speech accent archive. george mason university. Online: http:\/\/accent.gmu.edu (2015)"},{"key":"954_CR52","unstructured":"Ahamad, A., Anand, A., Bhargava, P.: Accentdb: A database of non-native english accents to assist neural speech recognition. In: Proceedings of The 12th Language Resources and Evaluation Conference, pp. 5353\u20135360. European Language Resources Association, Marseille, France (2020). https:\/\/www.aclweb.org\/anthology\/2020.lrec-1.659"},{"key":"954_CR53","unstructured":"Veaux, C., Yamagishi, J., MacDonald, K.: Cstr vctk corpus: English multi-speaker corpus for cstr voice cloning toolkit. (2017)"},{"key":"954_CR54","unstructured":"Guevara-Rukoz, A., Demirsahin, I., He, F., Chu, S.-H.C., Sarin, S., Pipatsrisawat, K., Gutkin, A., Butryna, A., Kjartansson, O.: Crowdsourcing Latin American Spanish for Low-Resource Text-to-Speech. In: Proceedings of The 12th Language Resources and Evaluation Conference (LREC), pp. 6504\u20136513. European Language Resources Association (ELRA), Marseille, France (2020). https:\/\/www.aclweb.org\/anthology\/2020.lrec-1.801"},{"key":"954_CR55","unstructured":"Weinberger, S.: Speech Accent Archive. George Mason University (2015). http:\/\/accent.gmu.edu"},{"key":"954_CR56","unstructured":"Ardila, R., Branson, M., Davis, K., Henretty, M., Kohler, M., Meyer, J., Morais, R., Saunders, L., Tyers, F.M., Weber, G.: Common voice: A massively-multilingual speech corpus. In: Proceedings of the 12th Conference on Language Resources and Evaluation (LREC 2020), pp. 4211\u20134215 (2020)"},{"key":"954_CR57","doi-asserted-by":"publisher","unstructured":"Yamagishi, J., Veaux, C., MacDonald, K.: CSTR VCTK Corpus: English Multi-speaker Corpus for CSTR Voice Cloning Toolkit (version 0.92), [sound]. University of Edinburgh. The Centre for Speech Technology Research (CSTR) (2019). https:\/\/doi.org\/10.7488\/ds\/2645","DOI":"10.7488\/ds\/2645"},{"key":"954_CR58","doi-asserted-by":"crossref","unstructured":"Salesky, E., Wiesner, M., Bremerman, J., Cattoni, R., Negri, M., Turchi, M., Oard, D.W., Post, M.: Multilingual tedx corpus for speech recognition and translation. In: Proceedings of Interspeech (2021)","DOI":"10.21437\/Interspeech.2021-11"},{"key":"954_CR59","unstructured":"Garofolo, J.S., Lamel, L.F., Fisher, W.M., Fiscus, J.G., Pallett, D.S., Dahlgren, N.L., Zue, V.: Timit acoustic-phonetic continuous speech corpus. In: Linguistic Data Consortium (1993)"},{"key":"954_CR60","unstructured":"TalkBank: CallFriend. Accessed: 2024-07-01 (2024). https:\/\/ca.talkbank.org\/access\/CallFriend\/"},{"key":"954_CR61","doi-asserted-by":"publisher","unstructured":"Behravan, H., Hautam\u00e4ki, V., Kinnunen, T.: Foreign accent detection from spoken Finnish using i-vectors. In: Proc. Interspeech 2013, pp. 79\u201383 (2013). https:\/\/doi.org\/10.21437\/Interspeech.2013-42","DOI":"10.21437\/Interspeech.2013-42"},{"key":"954_CR62","unstructured":"Black, A.W., Lenzo, K.A.: Festvox Project. Accessed on: Dec 24, 2014 (2014). http:\/\/festvox.org\/index.html"},{"key":"954_CR63","doi-asserted-by":"crossref","unstructured":"Fu, Y., Cheng, L., Lv, S., Jv, Y., Kong, Y., Chen, Z., Hu, Y., Xie, L., Wu, J., Bu, H., et al.: Aishell-4: An open source dataset for speech enhancement, separation, recognition and speaker diarization in conference scenario. arXiv preprint arXiv:2104.03603 (2021)","DOI":"10.21437\/Interspeech.2021-1397"},{"key":"954_CR64","doi-asserted-by":"crossref","unstructured":"Ishikawa, S.: ICNALE (International Corpus Network of Asian Learners of English) Download Page. Kobe University, Japan (2023). https:\/\/language.sakura.ne.jp\/icnale\/download.html","DOI":"10.4324\/9781003252528-3"},{"key":"954_CR65","doi-asserted-by":"publisher","unstructured":"Panayotov, V., Chen, G., Povey, D., Khudanpur, S.: Librispeech: An asr corpus based on public domain audio books. In: 2015 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 5206\u20135210 (2015). https:\/\/doi.org\/10.1109\/ICASSP.2015.7178964","DOI":"10.1109\/ICASSP.2015.7178964"},{"key":"954_CR66","doi-asserted-by":"publisher","unstructured":"Sharma, A., Bhargava, M., Khanna, A.V.: Native and non-native english speech classification: A premise to accent conversion. In: 2021 Fourth International Conference on Electrical, Computer and Communication Technologies (ICECCT), pp. 1\u20137 (2021). https:\/\/doi.org\/10.1109\/ICECCT52121.2021.9616718","DOI":"10.1109\/ICECCT52121.2021.9616718"},{"key":"954_CR67","doi-asserted-by":"publisher","unstructured":"Bhowmik, T., Choudhury, A., Sharma, A., Verma, A., Kanthalia, B., Roy, B.: A comparative study on native and non-native english accent classifications. In: 2022 International Conference on Futuristic Technologies (INCOFT), pp. 1\u20136 (2022). https:\/\/doi.org\/10.1109\/INCOFT55651.2022.10094428","DOI":"10.1109\/INCOFT55651.2022.10094428"},{"key":"954_CR68","doi-asserted-by":"publisher","unstructured":"Carofilis, A., Alegre, E., Fidalgo, E., Fern\u00e1ndez-Robles, L.: Improvement of accent classification models through grad-transfer from spectrograms and gradient-weighted class activation mapping. IEEE\/ACM Transactions on Audio, Speech, and Language Processing 31, 2859\u20132871 (2023) https:\/\/doi.org\/10.1109\/TASLP.2023.3297961","DOI":"10.1109\/TASLP.2023.3297961"},{"key":"954_CR69","doi-asserted-by":"publisher","unstructured":"Melechovsky, J., Mehrish, A., Herremans, D., Sisman, B.: Learning accent representation with multi-level vae towards controllable speech synthesis. In: 2022 IEEE Spoken Language Technology Workshop (SLT), pp. 928\u2013935 (2023). https:\/\/doi.org\/10.1109\/SLT54892.2023.10023072","DOI":"10.1109\/SLT54892.2023.10023072"},{"key":"954_CR70","doi-asserted-by":"publisher","unstructured":"Hossain, M.F., Hasan, M.M., Ali, H., Sarker, M.R.K.R., Hassan, M.T.: A machine learning approach to recognize speakers region of the united kingdom from continuous speech based on accent classification. In: 2020 11th International Conference on Electrical and Computer Engineering (ICECE), pp. 210\u2013213 (2020). https:\/\/doi.org\/10.1109\/ICECE51571.2020.9393038","DOI":"10.1109\/ICECE51571.2020.9393038"},{"key":"954_CR71","doi-asserted-by":"publisher","unstructured":"Guntur, R.K., Ramakrishnan, K., Mittal, V.K.: Automatic classification of foreign language accent. In: 2021 2nd Global Conference for Advancement in Technology (GCAT), pp. 1\u20135 (2021). https:\/\/doi.org\/10.1109\/GCAT52182.2021.9587650","DOI":"10.1109\/GCAT52182.2021.9587650"},{"key":"954_CR72","doi-asserted-by":"crossref","unstructured":"Singh, Y., Pillay, A., Jembere, E.: Features of speech audio for accent recognition. In: 2020 International Conference on Artificial Intelligence, Big Data, Computing and Data Communication Systems (icABCD), pp. 1\u20136 (2020). IEEE","DOI":"10.1109\/icABCD49160.2020.9183893"},{"key":"954_CR73","doi-asserted-by":"crossref","unstructured":"Ge, Z., Tan, Y., Ganapathiraju, A.: Accent classification with phonetic vowel representation (2016)","DOI":"10.1109\/ACPR.2015.7486559"},{"key":"954_CR74","doi-asserted-by":"publisher","unstructured":"Mikhailava, V., Lesnichaia, M., Bogach, N., Lezhenin, I., Blake, J., Pyshkin, E.: Language accent detection with cnn using sparse data from a crowd-sourced speech archive. Mathematics 10(16) (2022) https:\/\/doi.org\/10.3390\/math10162913","DOI":"10.3390\/math10162913"},{"key":"954_CR75","unstructured":"Scott, A.J., Thieu, J., Wall, J.M.: Convolutional neural networks for american accented english region localization and analysis. (2020)"},{"key":"954_CR76","doi-asserted-by":"publisher","unstructured":"Muttaqi, M., Degirmenci, A., Karal, O.: Us accent recognition using machine learning methods. In: 2022 Innovations in Intelligent Systems and Applications Conference (ASYU), pp. 1\u20136 (2022). https:\/\/doi.org\/10.1109\/ASYU56188.2022.9925265","DOI":"10.1109\/ASYU56188.2022.9925265"},{"key":"954_CR77","doi-asserted-by":"publisher","unstructured":"Jayne, C., Chang, V., Bailey, J., Xu, Q.: Automatic Accent and Gender Recognition of Regional UK Speakers, pp. 67\u201380 (2022). https:\/\/doi.org\/10.1007\/978-3-031-08223-8_6","DOI":"10.1007\/978-3-031-08223-8_6"},{"key":"954_CR78","doi-asserted-by":"publisher","unstructured":"Honnavalli, D., S\u00a0S, S.: Supervised Machine Learning Model for Accent Recognition in English Speech Using Sequential MFCC Features, pp. 55\u201366 (2021).https:\/\/doi.org\/10.1007\/978-981-15-3514-7_5","DOI":"10.1007\/978-981-15-3514-7_5"},{"key":"954_CR79","unstructured":"Grigoriadis, S.: Convolutional neural networks for accent classification (2019)"},{"key":"954_CR80","doi-asserted-by":"crossref","unstructured":"Badhe, S.S., Shirbahadurkar, S.D., Gulhane, S.R.: Renyi entropy and deep learning-based approach for accent classification. Multimedia Tools and Applications, 1\u201333 (2022)","DOI":"10.1007\/s11042-021-11371-4"},{"key":"954_CR81","doi-asserted-by":"publisher","unstructured":"Purwar, A., Sharma, H., Sharma, Y., Gupta, H., Kaur, A.: Accent classification using machine learning and deep learning models. In: 2022 1st International Conference on Informatics (ICI), pp. 13\u201318 (2022).https:\/\/doi.org\/10.1109\/ICI53355.2022.9786885","DOI":"10.1109\/ICI53355.2022.9786885"},{"key":"954_CR82","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2024.101676","volume":"89","author":"T Song","year":"2025","unstructured":"Song, T., Nguyen, L.T.H., Ta, T.V.: Mpsa-densenet: A novel deep learning model for english accent classification. Computer Speech & Language 89, 101676 (2025)","journal-title":"Computer Speech & Language"},{"key":"954_CR83","doi-asserted-by":"publisher","unstructured":"Walsh, D., Dev, S., Nag, A.: Hilbert-huang-transform based features for accent classification of non-native english speakers. In: 2023 34th Irish Signals and Systems Conference (ISSC), pp. 1\u20136 (2023). https:\/\/doi.org\/10.1109\/ISSC59246.2023.10162075","DOI":"10.1109\/ISSC59246.2023.10162075"},{"key":"954_CR84","doi-asserted-by":"crossref","unstructured":"Honnavalli, D., Shylaja, S.S.: Supervised machine learning model for accent recognition in english speech using sequential mfcc features. (2020). https:\/\/api.semanticscholar.org\/CorpusID:225148737","DOI":"10.1007\/978-981-15-3514-7_5"},{"key":"954_CR85","doi-asserted-by":"publisher","unstructured":"Widyowaty, D.S., Sunyoto, A.: Accent recognition by native language using mel-frequency cepstral coefficient and k-nearest neighbor. In: 2020 3rd International Conference on Information and Communications Technology (ICOIACT), pp. 314\u2013318 (2020). https:\/\/doi.org\/10.1109\/ICOIACT50329.2020.9332026","DOI":"10.1109\/ICOIACT50329.2020.9332026"},{"key":"954_CR86","doi-asserted-by":"publisher","unstructured":"Upadhyay, R., Lui, S.: Foreign english accent classification using deep belief networks. In: 2018 IEEE 12th International Conference on Semantic Computing (ICSC), pp. 290\u2013293 (2018). https:\/\/doi.org\/10.1109\/ICSC.2018.00053","DOI":"10.1109\/ICSC.2018.00053"},{"key":"954_CR87","doi-asserted-by":"publisher","DOI":"10.1016\/j.fsidi.2020.300982","volume":"34","author":"S Saleem","year":"2020","unstructured":"Saleem, S., Subhan, F., Naseer, N., Bais, A., Imtiaz, A.: Forensic speaker recognition: A new method based on extracting accent and language information from short utterances. Forensic Science International: Digital Investigation 34, 300982 (2020). https:\/\/doi.org\/10.1016\/j.fsidi.2020.300982","journal-title":"Forensic Science International: Digital Investigation"},{"key":"954_CR88","doi-asserted-by":"publisher","unstructured":"Thakkar, M., Elias, S., Ashok, A.: Speech recognition learning framework for non-native english accent. In: 2019 International Conference on Data Science and Engineering (ICDSE), pp. 84\u201389 (2019). https:\/\/doi.org\/10.1109\/ICDSE47409.2019.8971486","DOI":"10.1109\/ICDSE47409.2019.8971486"},{"key":"954_CR89","doi-asserted-by":"publisher","first-page":"104","DOI":"10.1016\/j.wocn.2016.08.004","volume":"58","author":"T Bent","year":"2016","unstructured":"Bent, T., Atagi, E., Akbik, A., Bonifield, E.: Classification of regional dialects, international dialects, and nonnative accents. J. Phon. 58, 104\u2013117 (2016). https:\/\/doi.org\/10.1016\/j.wocn.2016.08.004","journal-title":"J. Phon."},{"issue":"11","key":"954_CR90","first-page":"105","volume":"7","author":"A Name","year":"2020","unstructured":"Name, A.: Irjet- accent classification using machine learning. International Research Journal of Engineering and Technology 7(11), 105\u2013110 (2020)","journal-title":"International Research Journal of Engineering and Technology"},{"key":"954_CR91","unstructured":"Zhao, N., Liu, H., Wang, L.: Improving the transferability of speech separation by meta-learning. In: Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP), Singapore (2022). arXiv:2203.05882"},{"key":"954_CR92","doi-asserted-by":"crossref","unstructured":"Hossain, M.F., Hasan, M.M., Ali, H., Sarker, M.R.K.R., Hassan, M.T.: A machine learning approach to recognize speakers region of the united kingdom from continuous speech based on accent classification. In: 2020 11th International Conference on Electrical and Computer Engineering (ICECE), pp. 210\u2013213 (2020). IEEE","DOI":"10.1109\/ICECE51571.2020.9393038"},{"key":"954_CR93","doi-asserted-by":"crossref","unstructured":"Brown, G.: Automatic accent recognition systems and the effects of data on performance (2016)","DOI":"10.21437\/Odyssey.2016-14"},{"key":"954_CR94","volume":"34","author":"S Saleem","year":"2020","unstructured":"Saleem, S., Subhan, F., Naseer, N., Bais, A., Imtiaz, A.: Forensic speaker recognition: A new method based on extracting accent and language information from short utterances. Forensic Science International: Digital Investigation 34, 300982 (2020)","journal-title":"Forensic Science International: Digital Investigation"},{"issue":"6","key":"954_CR95","first-page":"1701","volume":"1","author":"Y Deng","year":"2007","unstructured":"Deng, Y., Li, X., Kwan, C., Raj, B., Stern, R.: Continuous feature adaptation for non-native speech recognition. International Journal of Computer and Information Engineering 1(6), 1701\u20131708 (2007)","journal-title":"International Journal of Computer and Information Engineering"},{"key":"954_CR96","doi-asserted-by":"crossref","unstructured":"Thakkar, M., Elias, S., Ashok, A.: Speech recognition learning framework for non-native english accent. In: 2019 International Conference on Data Science and Engineering (ICDSE), pp. 84\u201389 (2019). IEEE","DOI":"10.1109\/ICDSE47409.2019.8971486"},{"key":"954_CR97","doi-asserted-by":"publisher","first-page":"17","DOI":"10.7240\/jeps.896427","volume":"33","author":"AA AYRANCI","year":"2021","unstructured":"AYRANCI, A.A., Sergen, A., YILDIRIM, T.: Speaker accent recognition using mfcc feature extraction and machine learning algorithms. International Journal of Advances in Engineering and Pure Sciences 33, 17\u201327 (2021)","journal-title":"International Journal of Advances in Engineering and Pure Sciences"},{"issue":"2","key":"954_CR98","doi-asserted-by":"publisher","first-page":"1077","DOI":"10.1121\/10.0009405","volume":"151","author":"R Kethireddy","year":"2022","unstructured":"Kethireddy, R., Kadiri, S.R., Gangashetty, S.V.: Deep neural architectures for dialect classification with single frequency filtering and zero-time windowing feature representations. The Journal of the Acoustical Society of America 151(2), 1077\u20131092 (2022)","journal-title":"The Journal of the Acoustical Society of America"},{"key":"954_CR99","doi-asserted-by":"crossref","unstructured":"Mnasri, S., Habbash, M.: Study of the influence of arabic mother tongue on the english language using a hybrid artificial intelligence method. Interactive Learning Environments, 1\u201314 (2021)","DOI":"10.1080\/10494820.2021.2012809"},{"issue":"3","key":"954_CR100","doi-asserted-by":"publisher","first-page":"3485","DOI":"10.1007\/s11042-022-13236-w","volume":"82","author":"KS Rao","year":"2023","unstructured":"Rao, K.S.: Accent classification from an emotional speech in clean and noisy environments. Multimedia Tools and Applications 82(3), 3485\u20133508 (2023)","journal-title":"Multimedia Tools and Applications"},{"key":"954_CR101","doi-asserted-by":"publisher","first-page":"2367","DOI":"10.1109\/TASLP.2021.3060813","volume":"29","author":"G Zhao","year":"2021","unstructured":"Zhao, G., Ding, S., Gutierrez-Osuna, R.: Converting foreign accent speech without a reference. IEEE\/ACM Transactions on Audio, Speech, and Language Processing 29, 2367\u20132381 (2021)","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"key":"954_CR102","doi-asserted-by":"crossref","unstructured":"AJU, O.G., OSUBOR, V.I.: A hybrid architecture for accent-based automatic speech recognition systems for e-learning environment. Journal of Applied Computer Science & Mathematics 16(34) (2022)","DOI":"10.4316\/JACSM.202202003"},{"key":"954_CR103","doi-asserted-by":"publisher","unstructured":"Al-Jumaili, Z., Bassiouny, T., Alanezi, A., Khan, W., Al-Jumeily\u00a0Obe, D., Hussain, A.: Classification of Spoken English Accents Using Deep Learning and Speech Analysis, pp. 277\u2013287 (2022). https:\/\/doi.org\/10.1007\/978-3-031-13832-4_24","DOI":"10.1007\/978-3-031-13832-4_24"},{"key":"954_CR104","unstructured":"Ahamad, A., Anand, A., Bhargava, P.: Accentdb: A database of non-native english accents to assist neural speech recognition. arXiv preprint arXiv:2005.07973 (2020)"},{"key":"954_CR105","doi-asserted-by":"publisher","unstructured":"Kethireddy, R., Kadiri, S.R., Gangashetty, S.V.: Learning filterbanks from raw waveform for accent classification. In: 2020 International Joint Conference on Neural Networks (IJCNN), pp. 1\u20136 (2020).https:\/\/doi.org\/10.1109\/IJCNN48605.2020.9206778","DOI":"10.1109\/IJCNN48605.2020.9206778"},{"key":"954_CR106","doi-asserted-by":"crossref","unstructured":"Reid, K., Williams, E.T.: Common Voice and Accent Choice: Data Contributors Self-Describe Their Spoken Accents in Diverse Ways. EasyChair Preprint no. 9678, ??? (EasyChair, 2023)","DOI":"10.1145\/3617694.3623258"},{"key":"954_CR107","doi-asserted-by":"publisher","unstructured":"Zuluaga, J.P., Ahmed, S., Visockas, D., Subakan, C.: Commonaccent: Exploring large acoustic pretrained models for accent classification based on common voice, pp. 5291\u20135295 (2023). https:\/\/doi.org\/10.21437\/Interspeech.2023-2419","DOI":"10.21437\/Interspeech.2023-2419"},{"key":"954_CR108","doi-asserted-by":"crossref","unstructured":"Zeng, Q., Chong, D., Zhou, P., Yang, J.: Low-resource accent classification in geographically-proximate settings: A forensic and sociophonetics perspective. arXiv preprint arXiv:2206.12759 (2022)","DOI":"10.21437\/Interspeech.2022-11372"},{"key":"954_CR109","doi-asserted-by":"publisher","unstructured":"Behravan, H., Hautam\u00e4ki, V., Kinnunen, T.: Foreign accent detection from spoken finnish using i-vectors. (2013). https:\/\/doi.org\/10.21437\/Interspeech.2013-42","DOI":"10.21437\/Interspeech.2013-42"},{"key":"954_CR110","doi-asserted-by":"publisher","first-page":"3040","DOI":"10.1109\/TASLP.2021.3111568","volume":"29","author":"C Liberatore","year":"2021","unstructured":"Liberatore, C.: Native-nonnative voice conversion by residual warping in a sparse, anchor-based representation. IEEE\/ACM Transactions on Audio, Speech, and Language Processing 29, 3040\u20133051 (2021). https:\/\/doi.org\/10.1109\/TASLP.2021.3111568","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"key":"954_CR111","doi-asserted-by":"publisher","unstructured":"Ayranc\u0131, A., ATAY, S., Yildirim, T.: Speaker accent recognition using mfcc feature extraction and machine learning algorithms. International Journal of Advances in Engineering and Pure Sciences 33 (2021) https:\/\/doi.org\/10.7240\/jeps.896427","DOI":"10.7240\/jeps.896427"},{"key":"954_CR112","unstructured":"Ai, L., Jeng, S.-Y., Beigi, H.: A new approach to accent recognition and conversion for mandarin chinese. arXiv preprint arXiv:2008.03359 (2020)"},{"key":"954_CR113","doi-asserted-by":"publisher","unstructured":"Zhu, H., Wang, l., Zhang, P., Yan, Y.: Multi-accent adaptation based on gate mechanism, pp. 744\u2013748 (2019). https:\/\/doi.org\/10.21437\/Interspeech.2019-3155","DOI":"10.21437\/Interspeech.2019-3155"},{"key":"954_CR114","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1080\/02533839.1986.9676859","volume":"9","author":"K Chang","year":"1986","unstructured":"Chang, K., Yang, C.-C.: A real-time pitch extraction and four-tone recognition system for mandarin speech. J. Chin. Inst. Eng. 9, 37\u201349 (1986)","journal-title":"J. Chin. Inst. Eng."},{"key":"954_CR115","doi-asserted-by":"publisher","first-page":"607","DOI":"10.1007\/978-981-10-3005-5_50","volume-title":"Pattern Recognition","author":"H Ni","year":"2016","unstructured":"Ni, H., Yi, J., Wen, Z., Tao, J.: Recurrent neural network based language model adaptation for accent mandarin speech. In: Tan, T., Li, X., Chen, X., Zhou, J., Yang, J., Cheng, H. (eds.) Pattern Recognition, pp. 607\u2013617. Springer, Singapore (2016)"},{"key":"954_CR116","unstructured":"Nisioi, S.: Comparing speech and text classification on icnale. In: International Conference on Language Resources and Evaluation (2016). https:\/\/api.semanticscholar.org\/CorpusID:21954016"},{"key":"954_CR117","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Wang, Y., Yang, J.: Accent recognition with hybrid phonetic features. Sensors 21(18) (2021)","DOI":"10.3390\/s21186258"},{"key":"954_CR118","doi-asserted-by":"publisher","first-page":"2842","DOI":"10.1109\/TASLP.2022.3198546","volume":"30","author":"Y Qian","year":"2022","unstructured":"Qian, Y., Gong, X., Huang, H.: Layer-wise fast adaptation for end-to-end multi-accent speech recognition. IEEE\/ACM Transactions on Audio, Speech, and Language Processing 30, 2842\u20132853 (2022)","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"issue":"18","key":"954_CR119","doi-asserted-by":"publisher","first-page":"6258","DOI":"10.3390\/s21186258","volume":"21","author":"Z Zhang","year":"2021","unstructured":"Zhang, Z., Wang, Y., Yang, J.: Accent recognition with hybrid phonetic features. Sensors 21(18), 6258 (2021)","journal-title":"Sensors"},{"key":"954_CR120","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1016\/j.specom.2015.12.004","volume":"78","author":"JHL Hansen","year":"2016","unstructured":"Hansen, J.H.L., Liu, G.: Unsupervised accent classification for deep data fusion of accent and language information. Speech Commun. 78, 19\u201333 (2016). https:\/\/doi.org\/10.1016\/j.specom.2015.12.004","journal-title":"Speech Commun."},{"key":"954_CR121","doi-asserted-by":"publisher","first-page":"92","DOI":"10.1016\/j.specom.2022.03.007","volume":"139","author":"MA Humayun","year":"2022","unstructured":"Humayun, M.A., Yassin, H., Abas, P.E.: Native language identification for indian-speakers by an ensemble of phoneme-specific, and text-independent convolutions. Speech Commun. 139, 92\u2013101 (2022). https:\/\/doi.org\/10.1016\/j.specom.2022.03.007","journal-title":"Speech Commun."},{"key":"954_CR122","doi-asserted-by":"publisher","unstructured":"Radha, K., Bansal, M., Shabber, S.M.: Accent classification of native and non-native children using harmonic pitch. In: 2022 2nd International Conference on Artificial Intelligence and Signal Processing (AISP), pp. 1\u20136 (2022). https:\/\/doi.org\/10.1109\/AISP53593.2022.9760588","DOI":"10.1109\/AISP53593.2022.9760588"},{"key":"954_CR123","doi-asserted-by":"publisher","unstructured":"Duong, Q.T., Do, V.H.: Development of accent recognition systems for vietnamese speech. In: 2021 24th Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques (O-COCOSDA), pp. 174\u2013179 (2021). https:\/\/doi.org\/10.1109\/O-COCOSDA202152914.2021.9660512","DOI":"10.1109\/O-COCOSDA202152914.2021.9660512"},{"key":"954_CR124","doi-asserted-by":"publisher","unstructured":"Shergill, J., Pravin, C., Ojha, V.: Accent and Gender Recognition from English Language Speech and Audio Using Signal Processing and Deep Learning, pp. 62\u201372 (2021). https:\/\/doi.org\/10.1007\/978-3-030-73050-5_7","DOI":"10.1007\/978-3-030-73050-5_7"},{"key":"954_CR125","first-page":"1","volume":"7","author":"H Bello","year":"2020","unstructured":"Bello, H., Yap, N., Chan, M.-Y., Nimehchisalem, V.: An acoustic analysis of english vowels produced by nigerian and malaysian esl speakers 7, 1\u201315 (2020)","journal-title":"An acoustic analysis of english vowels produced by nigerian and malaysian esl speakers"},{"key":"954_CR126","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1007\/978-981-15-3514-7_5","volume-title":"Advances in Artificial Intelligence and Data Engineering","author":"D Honnavalli","year":"2021","unstructured":"Honnavalli, D., Shylaja, S.S.: Supervised machine learning model for accent recognition in english speech using sequential mfcc features. In: Chiplunkar, N.N., Fukao, T. (eds.) Advances in Artificial Intelligence and Data Engineering, pp. 55\u201366. Springer, Singapore (2021)"},{"key":"954_CR127","unstructured":"Li, J., Manohar, V., Chitkara, P., Tjandra, A., Picheny, M., Zhang, F., Zhang, X., Saraf, Y.: Accent-robust automatic speech recognition using supervised and unsupervised wav2vec embeddings. arXiv preprint arXiv:2110.03520 (2021)"},{"key":"954_CR128","doi-asserted-by":"publisher","unstructured":"Chellali, S., Al-Maadeed, S., Kenai, O., Maamar, A., Hidouci, W.: Middle eastern and north african english speech corpus (menaesc): Automatic identification of mena english accents (2021)https:\/\/doi.org\/10.34028\/iajit\/18\/1\/8","DOI":"10.34028\/iajit\/18\/1\/8"},{"key":"954_CR129","unstructured":"Abdullah, R., M, H., Vijean, V., Abdullah, Z., Che\u00a0Kassim, F.N.: Real and complex wavelet transform approaches for malaysian speaker and accent recognition. Pertanika Journal of Science and Technology 27, 737\u2013752 (2019)"},{"key":"954_CR130","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1016\/j.specom.2013.07.010","volume":"56","author":"K Amino","year":"2014","unstructured":"Amino, K., Osanai, T.: Native vs. non-native accent identification using japanese spoken telephone numbers. Speech Commun. 56, 70\u201381 (2014). https:\/\/doi.org\/10.1016\/j.specom.2013.07.010","journal-title":"Speech Commun."},{"key":"954_CR131","doi-asserted-by":"publisher","unstructured":"Ghorbani, S., Bulut, A.E., Hansen, J.H.L.: Advancing multi-accented lstm-ctc speech recognition using a domain specific student-teacher learning paradigm. In: 2018 IEEE Spoken Language Technology Workshop (SLT), pp. 29\u201335 (2018). https:\/\/doi.org\/10.1109\/SLT.2018.8639566","DOI":"10.1109\/SLT.2018.8639566"},{"key":"954_CR132","doi-asserted-by":"publisher","unstructured":"Djellab, M., Amrouche, A., Mehallegue, N., Bouridane, A.: Regional accents recognition based on i-vectors approach: The case of the algerian linguistic environment. In: 2015 4th International Conference on Electrical Engineering (ICEE), pp. 1\u20135 (2015). https:\/\/doi.org\/10.1109\/INTEE.2015.7416744","DOI":"10.1109\/INTEE.2015.7416744"},{"key":"954_CR133","doi-asserted-by":"publisher","unstructured":"Ismail, M., Memon, S., Dhomeja, L., Shah, S., Hussain, D., Rahim, S., Hunzai, I.: Development of a regional voice dataset and speaker classification based on machine learning. Journal of Big Data 8 (2021) https:\/\/doi.org\/10.1186\/s40537-021-00435-9","DOI":"10.1186\/s40537-021-00435-9"},{"key":"954_CR134","doi-asserted-by":"publisher","unstructured":"Hautam\u00e4ki, V., Siniscalchi, M., Behravan, H., Salerno, V.M., Kukanov, I.: Boosting universal speech attributes classification with deep neural network for foreign accent characterization. (2015). https:\/\/doi.org\/10.21437\/Interspeech.2015-165","DOI":"10.21437\/Interspeech.2015-165"},{"key":"954_CR135","doi-asserted-by":"publisher","unstructured":"Behravan, H., Hautamauki, V., Siniscalchi, M., Kinnunen, T., Lee, C.-H.: Introducing attribute features to foreign accent recognition, pp. 5332\u20135336 (2014). https:\/\/doi.org\/10.1109\/ICASSP.2014.6854621","DOI":"10.1109\/ICASSP.2014.6854621"},{"key":"954_CR136","doi-asserted-by":"publisher","unstructured":"Bahari, M.H., Saeidi, R., Van\u00a0hamme, H., Van\u00a0Leeuwen, D.: Accent recognition using i-vector, gaussian mean supervector and gaussian posterior probability supervector for spontaneous telephone speech. In: 2013 IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 7344\u20137348 (2013). https:\/\/doi.org\/10.1109\/ICASSP.2013.6639089","DOI":"10.1109\/ICASSP.2013.6639089"},{"key":"954_CR137","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1016\/j.specom.2014.10.004","volume":"66","author":"H Behravan","year":"2015","unstructured":"Behravan, H., Hautam\u00e4ki, V., Kinnunen, T.: Factors affecting i-vector based foreign accent recognition: A case study in spoken finnish. Speech Commun. 66, 118\u2013129 (2015). https:\/\/doi.org\/10.1016\/j.specom.2014.10.004","journal-title":"Speech Commun."},{"key":"954_CR138","doi-asserted-by":"publisher","unstructured":"Ayranc\u0131, A.A., Atay, S., Y\u0131ld\u0131r\u0131m, T.: Speaker accent recognition using machine learning algorithms. In: 2020 Innovations in Intelligent Systems and Applications Conference (ASYU), pp. 1\u20136 (2020). https:\/\/doi.org\/10.1109\/ASYU50717.2020.9259902","DOI":"10.1109\/ASYU50717.2020.9259902"},{"key":"954_CR139","unstructured":"Bello, H., Yap, N., Chan, M.-Y., Nimehchisalem, V.: An acoustic analysis of english vowels produced by nigerian and malaysian esl speakers 7, 1\u201315 (2020)"},{"key":"954_CR140","doi-asserted-by":"publisher","unstructured":"Behravan, H., Hautam\u00e4ki, V., Kinnunen, T.: Factors affecting i-vector based foreign accent recognition: A case study in spoken finnish. Speech Communication 66 (2015) https:\/\/doi.org\/10.1016\/j.specom.2014.10.004","DOI":"10.1016\/j.specom.2014.10.004"},{"key":"954_CR141","doi-asserted-by":"publisher","unstructured":"Zhang, S., Guo, W., Hu, G.: First investigation of universal speech attributes for speaker verification, pp. 1\u20135 (2016). https:\/\/doi.org\/10.1109\/ISCSLP.2016.7918379","DOI":"10.1109\/ISCSLP.2016.7918379"},{"key":"954_CR142","doi-asserted-by":"publisher","unstructured":"Krishna, G.R., Krishnan, R., Mittal, V.K.: Foreign accent recognition with south indian spoken english. In: 2020 IEEE 17th India Council International Conference (INDICON), pp. 1\u20135 (2020). https:\/\/doi.org\/10.1109\/INDICON49873.2020.9342471","DOI":"10.1109\/INDICON49873.2020.9342471"},{"key":"954_CR143","doi-asserted-by":"crossref","unstructured":"Parikh, P., Velhal, K., Potdar, S., Sikligar, A., Karani, R.: English language accent classification and conversion using machine learning. In: Proceedings of the International Conference on Innovative Computing & Communications (ICICC) (2020)","DOI":"10.2139\/ssrn.3600748"},{"key":"954_CR144","doi-asserted-by":"crossref","unstructured":"Ghani, B., Hallerberg, S.: A randomized bag-of-birds approach to study robustness of automated audio based bird species classification. Applied Sciences (2021)","DOI":"10.20944\/preprints202108.0277.v1"},{"key":"954_CR145","doi-asserted-by":"publisher","first-page":"1458","DOI":"10.3390\/s150101458","volume":"15","author":"K-C Wang","year":"2015","unstructured":"Wang, K.-C.: Time-frequency feature representation using multi-resolution texture analysis and acoustic activity detector for real-life speech emotion recognition. Sensors (Basel, Switzerland) 15, 1458\u20131478 (2015)","journal-title":"Sensors (Basel, Switzerland)"},{"key":"954_CR146","doi-asserted-by":"crossref","unstructured":"Xu, W., Huang, J., Sun, L., Yao, Y., Zhu, F., Xie, Y., Zhang, M.: An improved convolutional neural network for pipe leakage identification based on acoustic emission. Journal of Marine Science and Engineering (2024)","DOI":"10.3390\/jmse12101720"},{"key":"954_CR147","doi-asserted-by":"crossref","unstructured":"Atif, Y.: Audio-to-image encoding for improved voice characteristic detection using deep convolutional neural networks. (2025). https:\/\/api.semanticscholar.org\/CorpusID:276903236","DOI":"10.36227\/techrxiv.174163928.83517889\/v1"},{"key":"954_CR148","first-page":"1","volume":"48","author":"M Crocco","year":"2014","unstructured":"Crocco, M., Cristani, M., Trucco, A., Murino, V.: Audio surveillance. ACM Computing Surveys (CSUR) 48, 1\u201346 (2014)","journal-title":"Audio surveillance. ACM Computing Surveys (CSUR)"},{"key":"954_CR149","doi-asserted-by":"crossref","unstructured":"Tariq, Z., Shah, S.K., Lee, Y.: Feature-based fusion using cnn for lung and heart sound classification. Sensors (Basel, Switzerland) 22 (2022)","DOI":"10.3390\/s22041521"},{"key":"954_CR150","doi-asserted-by":"crossref","unstructured":"Chamoli, A., Semwal, A., Saikia, N.: Detection of emotion in analysis of speech using linear predictive coding techniques (lpc). In: 2017 International Conference on Inventive Systems and Control (ICISC), pp. 1\u20134 (2017). IEEE","DOI":"10.1109\/ICISC.2017.8068642"},{"key":"954_CR151","unstructured":"Hussain, S.S., Neekhara, P., Dubnov, S., McAuley, J., Koushanfar, F.: Waveguard: Understanding and mitigating audio adversarial examples. arXiv:2103.03344 (2021)"},{"key":"954_CR152","doi-asserted-by":"crossref","unstructured":"Kim, L.H., Goel, R., Liang, J.-R., Pilanci, M., Paredes, P.E.: Linear predictive coding for acute stress prediction from computer mouse movements. 2021 43rd Annual International Conference of the IEEE Engineering in Medicine & Biology Society (EMBC), 7465\u20137469 (2020)","DOI":"10.1109\/EMBC46164.2021.9630217"},{"issue":"4","key":"954_CR153","doi-asserted-by":"publisher","first-page":"1738","DOI":"10.1121\/1.399423","volume":"87","author":"H Hermansky","year":"1990","unstructured":"Hermansky, H.: Perceptual linear predictive (plp) analysis of speech. the Journal of the Acoustical Society of America 87(4), 1738\u20131752 (1990)","journal-title":"the Journal of the Acoustical Society of America"},{"key":"954_CR154","doi-asserted-by":"crossref","unstructured":"Xie, L., Liu, Z.-Q.: A comparative study of audio features for audio-to-visual conversion in mpeg-4 compliant facial animation. In: 2006 International Conference on Machine Learning and Cybernetics, pp. 4359\u20134364 (2006). IEEE","DOI":"10.1109\/ICMLC.2006.259085"},{"key":"954_CR155","doi-asserted-by":"crossref","unstructured":"Chappuis, C., Grandjean, D.: Set the tone: Trustworthy and dominant novel voices classification using explicit judgement and machine learning techniques. PLoS ONE 17 (2022)","DOI":"10.1371\/journal.pone.0267432"},{"key":"954_CR156","doi-asserted-by":"crossref","unstructured":"Ge, Z.: Improved accent classification combining phonetic vowels with acoustic features. 2015 8th International Congress on Image and Signal Processing (CISP), 1204\u20131209 (2015)","DOI":"10.1109\/CISP.2015.7408064"},{"key":"954_CR157","doi-asserted-by":"crossref","unstructured":"Lau, J.C.Y., Patel, S.P., Kang, X., Nayar, K., Martin, G.E., Choy, J., Wong, P.C.M., Losh, M.: Cross-linguistic patterns of speech prosodic differences in autism: A machine learning study. PLoS ONE 17 (2022)","DOI":"10.1371\/journal.pone.0269637"},{"key":"954_CR158","doi-asserted-by":"crossref","unstructured":"Nazir, F., Majeed, M.N., Ghazanfar, M.A., Maqsood, M.: An arabic mispronunciation detection system based on the frequency of mistakes for asian speakers. April 2021 (2021)","DOI":"10.22581\/muet1982.2102.03"},{"key":"954_CR159","doi-asserted-by":"crossref","unstructured":"Humayun, M.A., Shuja, J., Abas, P.E.: Speaker profiling based on the short-term acoustic features of vowels. Technologies (2023)","DOI":"10.3390\/technologies11050119"},{"issue":"1","key":"954_CR160","doi-asserted-by":"publisher","DOI":"10.1016\/j.jksuci.2023.101872","volume":"36","author":"L Berriche","year":"2024","unstructured":"Berriche, L., Alqahtani, A., RekikR, S.: Hybrid arabic handwritten character segmentation using cnn and graph theory algorithm. Journal of King Saud University-Computer and Information Sciences 36(1), 101872 (2024)","journal-title":"Journal of King Saud University-Computer and Information Sciences"},{"issue":"3","key":"954_CR161","doi-asserted-by":"publisher","first-page":"1699","DOI":"10.1007\/s00530-021-00822-5","volume":"29","author":"F Nazir","year":"2023","unstructured":"Nazir, F., Majeed, M.N., Ghazanfar, M.A., Maqsood, M.: A computer-aided speech analytics approach for pronunciation feedback using deep feature clustering. Multimedia Syst. 29(3), 1699\u20131715 (2023)","journal-title":"Multimedia Syst."},{"key":"954_CR162","doi-asserted-by":"publisher","first-page":"19143","DOI":"10.1109\/ACCESS.2019.2896880","volume":"7","author":"AB Nassif","year":"2019","unstructured":"Nassif, A.B., Shahin, I., Attili, I., Azzeh, M., Shaalan, K.: Speech recognition using deep neural networks: A systematic review. IEEE access 7, 19143\u201319165 (2019)","journal-title":"IEEE access"},{"key":"954_CR163","unstructured":"Cho, Y., Saul, L.: Kernel methods for deep learning. Advances in neural information processing systems 22 (2009)"},{"key":"954_CR164","doi-asserted-by":"crossref","unstructured":"Ahmed, A., Tangri, P., Panda, A., Ramani, D., Karmakar, S.: Vfnet: A convolutional architecture for accent classification. 2019 IEEE 16th India Council International Conference (INDICON), 1\u20134 (2019)","DOI":"10.1109\/INDICON47234.2019.9030363"},{"key":"954_CR165","unstructured":"Wang, W., Zhang, C., Wu, X.-p.: Deep discriminative feature learning for accent recognition. (2020). https:\/\/api.semanticscholar.org\/CorpusID:237295188"},{"key":"954_CR166","doi-asserted-by":"crossref","unstructured":"Stehwien, S., Vu, N.T.: Prosodic event recognition using convolutional neural networks with context information (2017)","DOI":"10.21437\/Interspeech.2017-1159"},{"key":"954_CR167","doi-asserted-by":"publisher","first-page":"49","DOI":"10.1016\/j.neucom.2021.05.065","volume":"456","author":"A Gallardo-Antol\u00edn","year":"2021","unstructured":"Gallardo-Antol\u00edn, A., Montero, J.M.: On combining acoustic and modulation spectrograms in an attention lstm-based system for speech intelligibility level classification. Neurocomputing 456, 49\u201360 (2021)","journal-title":"Neurocomputing"},{"key":"954_CR168","doi-asserted-by":"crossref","unstructured":"Ghorbani, S., Hansen, J.H.L.: Leveraging native language information for improved accented speech recognition. In: Interspeech (2018). https:\/\/api.semanticscholar.org\/CorpusID:52192017","DOI":"10.21437\/Interspeech.2018-1378"},{"key":"954_CR169","doi-asserted-by":"crossref","unstructured":"Sagri, A., Cazenave, T., Arjonilla, J., Saffidine, A.: Vision transformers for computer go. arXiv:2309.12675 (2023)","DOI":"10.1007\/978-3-031-56855-8_23"},{"key":"954_CR170","unstructured":"Klumpp, P., Chitkara, P., Sari, L., Serai, P., Wu, J., Veliche, I.-E., Huang, R., He, Q.: Synthetic cross-accent data augmentation for automatic speech recognition. arXiv:2303.00802 (2023)"},{"key":"954_CR171","doi-asserted-by":"crossref","unstructured":"Nguyen, T.-N., Pham, N.-Q., Waibel, A.: Accent conversion using discrete units with parallel data synthesized from controllable accented tts. arXiv:2410.03734 (2024)","DOI":"10.21437\/SynData4GenAI.2024-11"},{"key":"954_CR172","unstructured":"Zuluaga, J.S., Laurent, A., Pino, J.M., Adi, Y., Moreno, P., Pino, J., Okhonko, D.: Commonaccent: Exploring accent classification in multilingual speech corpora with self-supervised speech models. In: Proceedings of Interspeech 2023, pp. 5162\u20135166 (2023). https:\/\/www.isca-archive.org\/interspeech_2023\/zuluagagomez23_interspeech.pdf"},{"key":"954_CR173","unstructured":"Kakouros, S., Moshagen, S.N., Jauhiainen, T., Lind\u00e9n, K.: Dialect identification of north s\u00e1mi speech with self-supervised learning and language embeddings. In: Proceedings of Interspeech 2023, pp. 5167\u20135171 (2023). https:\/\/www.isca-archive.org\/interspeech_2023\/kakouros23_interspeech.pdf"},{"key":"954_CR174","unstructured":"Papadopoulos, P., Denisov, P., Popescu-Belis, A.: Continual self-supervised adaptation for speech language identification. arXiv preprint arXiv:2312.07338 (2023)"},{"key":"954_CR175","unstructured":"St\u00f6lten, K., Engstrand, O.: Effects of perceived age on perceived dialect strength: A listening test using manipulations of speaking rate and f0. PHONUM 9 (2003)"},{"key":"954_CR176","doi-asserted-by":"publisher","unstructured":"Sch\u00f6tz, S.: In: M\u00fcller, C. (ed.) Acoustic Analysis of Adult Speaker Age, pp. 88\u2013107. Springer, Berlin, Heidelberg (2007). https:\/\/doi.org\/10.1007\/978-3-540-74200-5_5","DOI":"10.1007\/978-3-540-74200-5_5"},{"key":"954_CR177","unstructured":"The University of Edinburgh: The University of Edinburgh Speech Accent Archive. Accessed: 2024-07-01 (2020). https:\/\/datashare.ed.ac.uk\/handle\/10283\/3443"},{"key":"954_CR178","unstructured":"Garofolo, S., J.: TIMIT AcousticPhonetic Continuous Speech Corpus LDC93S1. Linguistic Data Consortium, Philadelphia (1993)"},{"key":"954_CR179","unstructured":"Feng, S., Kudina, O., Halpern, B.M., Scharenborg, O.: Quantifying bias in automatic speech recognition. arXiv:2103.15122 (2021)"},{"key":"954_CR180","unstructured":"Estevez, M., Ferrer, L.: Study on the fairness of speaker verification systems on underrepresented accents in english. arXiv:2204.12649 (2022)"},{"key":"954_CR181","doi-asserted-by":"crossref","unstructured":"Deng, K., Cao, S., Ma, L.: Improving accent identification and accented speech recognition under a framework of self-supervised learning. arXiv:2109.07349 (2021)","DOI":"10.21437\/Interspeech.2021-1186"},{"key":"954_CR182","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Herygers, A., Patel, T.B., Yue, Z., Scharenborg, O.: Exploring data augmentation in bias mitigation against non-native-accented speech. 2023 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU), 1\u20138 (2023)","DOI":"10.1109\/ASRU57964.2023.10389756"},{"key":"954_CR183","doi-asserted-by":"crossref","unstructured":"Ge, Z., Tan, Y., Ganapathiraju, A.: Accent classification with phonetic vowel representation. 2015 3rd IAPR Asian Conference on Pattern Recognition (ACPR), 529\u2013533 (2015)","DOI":"10.1109\/ACPR.2015.7486559"},{"key":"954_CR184","doi-asserted-by":"crossref","unstructured":"Zeng, W., Shea, C.: Phonetic and phonological factors in cross-dialectal tone perception. In: Proc. SpeechProsody 2024, pp. 422\u2013426 (2024)","DOI":"10.21437\/SpeechProsody.2024-86"},{"key":"954_CR185","doi-asserted-by":"crossref","unstructured":"Najafian, M., Safavi, S., Weber, P., Russell, M.J.: Identification of british english regional accents using fusion of i-vector and multi-accent phonotactic systems. In: The Speaker and Language Recognition Workshop (2016). https:\/\/api.semanticscholar.org\/CorpusID:37836034","DOI":"10.21437\/Odyssey.2016-19"},{"key":"954_CR186","unstructured":"Grigali\u016bnait\u0117, J.: Accent identification using machine learning. PhD thesis, Vilniaus universitetas (2022)"},{"key":"954_CR187","doi-asserted-by":"crossref","unstructured":"Siddhant, A., Jyothi, P., Ganapathy, S.: Leveraging native language speech for accent identification using deep siamese networks. 2017 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU), 621\u2013628 (2017)","DOI":"10.1109\/ASRU.2017.8268994"},{"key":"954_CR188","unstructured":"Song, T., Nguyen, L.T.H., T\u1ea1, T.V.: Mpsa-densenet: A novel deep learning model for english accent classification. arXiv:2306.08798 (2023)"},{"key":"954_CR189","doi-asserted-by":"crossref","unstructured":"Ramos, V.M., Lowit, A., Steen, L.V., Hern\u00e1ndez-D\u00edaz, H.A.K., Huici, M.E.H.-D., Bodt, M.D., Nuffelen, G.V.: Acoustic identification of sentence accent in speakers with dysarthria: Cross-population validation and severity related patterns. Brain Sciences 11 (2021)","DOI":"10.3390\/brainsci11101344"}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-025-00954-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41060-025-00954-1","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-025-00954-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T09:35:58Z","timestamp":1773480958000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s41060-025-00954-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,25]]},"references-count":189,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,6]]}},"alternative-id":["954"],"URL":"https:\/\/doi.org\/10.1007\/s41060-025-00954-1","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"value":"2364-415X","type":"print"},{"value":"2364-4168","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,11,25]]},"assertion":[{"value":"23 May 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 August 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 November 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no Conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"12"}}