{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,25]],"date-time":"2026-01-25T04:36:34Z","timestamp":1769315794003,"version":"3.49.0"},"reference-count":65,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,5,13]],"date-time":"2025-05-13T00:00:00Z","timestamp":1747094400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,5,13]],"date-time":"2025-05-13T00:00:00Z","timestamp":1747094400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,5,13]]},"DOI":"10.1109\/icmcis64378.2025.11047661","type":"proceedings-article","created":{"date-parts":[[2025,6,30]],"date-time":"2025-06-30T17:36:43Z","timestamp":1751305003000},"page":"1-10","source":"Crossref","is-referenced-by-count":2,"title":["Adapting Automatic Speech Recognition for Accented Air Traffic Control Communications"],"prefix":"10.1109","author":[{"given":"Marcus Yu","family":"Zhe Wee","sequence":"first","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]},{"given":"Justin Juin","family":"Hng Wong","sequence":"additional","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]},{"given":"Lynus","family":"Lim","sequence":"additional","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]},{"given":"Joe Yu","family":"Wei Tan","sequence":"additional","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of 
Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]},{"given":"Prannaya","family":"Gupta","sequence":"additional","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]},{"given":"Dillion","family":"Lim","sequence":"additional","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]},{"given":"En Hao","family":"Tew","sequence":"additional","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]},{"given":"Aloysius Keng","family":"Siew Han","sequence":"additional","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]},{"given":"Yong Zhi","family":"Lim","sequence":"additional","affiliation":[{"name":"RSAF Agile Innovation Digital (RAiD), Republic of Singapore Air Force,Air Emerging Technologies High-Speed Experimentations and Research (AETHER),Singapore"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Integrating eye- and mouse-tracking with assistant based speech recognition for interaction at controller working positions","volume-title":"Aerospace","author":"Ohneiser","year":"2021"},{"key":"ref2","article-title":"Enhancing multilingual speech recognition in air traffic control by sentence-level language identification","volume":"abs\/2305.00170","author":"Fan","year":"2023","journal-title":"ArXiv"},{"key":"ref3","article-title":"Lessons Learned in Transcribing 5000 h of Air Traffic Control Communications for Robust Automatic Speech 
Understanding","volume-title":"Aerospace","author":"Zuluaga","year":"2023"},{"key":"ref4","first-page":"28492","article-title":"Robust speech recognition via large-scale weak supervision","volume-title":"International conference on machine learning. PMLR","author":"Radford","year":"2023"},{"key":"ref5","doi-asserted-by":"crossref","first-page":"87","DOI":"10.1007\/s12198-021-00238-2","article-title":"Understanding realistic attacks on airborne collision avoidance systems","volume":"15","author":"Smith","year":"2020","journal-title":"Journal of Transportation Security"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-2173"},{"issue":"14","key":"ref7","doi-asserted-by":"crossref","first-page":"4715","DOI":"10.3390\/s24144715","article-title":"Enhancing Air Traffic Control Communication Systems with Integrated Automatic Speech Recognition: Models, Applications and Performance Evaluation","volume":"24","author":"Wang","year":"2024","journal-title":"Sensors"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.4236\/jtts.2011.13007"},{"key":"ref9","article-title":"Do we rely on good-enough processing in reading under auditory and visual noise?","volume":"18","author":"Zdorova","year":"2021","journal-title":"PLOS ONE"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/DASC.2013.6712620"},{"key":"ref11","article-title":"Enhancing Air Traffic Control Communication Systems with Integrated Automatic Speech Recognition: Models, Applications and Performance Evaluation","volume":"24","author":"Wang","year":"2024","journal-title":"Sensors (Basel, Switzerland)"},{"key":"ref12","article-title":"Air traffic control complete (atcc)","volume-title":"LDC94S14A","author":"Godfrey","year":"1994"},{"key":"ref13","first-page":"1493","article-title":"The hiwire database: A noisy and non-native english speech corpus for cockpit communication","volume-title":"Proceedings of the 8th Annual Conference of the International Speech Communication 
Association (INTERSPEECH 2007)","author":"Segura","year":"2007"},{"key":"ref14","article-title":"The ATCOSIM Corpus of Non-Prompted Clean Air Traffic Control Speech","author":"Hofbauer","year":"2008","journal-title":"LREC"},{"key":"ref15","author":"Zuluaga-Gomez","year":"2023","journal-title":"ATCO2 corpus: A Large-Scale Dataset for Research on Automatic Speech Recognition and Natural Language Understanding of Air Traffic Control Communications"},{"key":"ref16","article-title":"ATCSpeech: a multilingual pilot-controller speech corpus from real Air Traffic Control environment","volume":"abs\/1911.11365","author":"Yang","year":"2019","journal-title":"CoRR"},{"key":"ref17","article-title":"The ATCOSIM Corpus of Non-Prompted Clean Air Traffic Control Speech","volume-title":"Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC\u201908)","author":"Hofbauer"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-33-4669-7_6"},{"key":"ref19","article-title":"The Airbus Air Traffic Control speech recognition 2018 challenge: towards ATC automatic transcription and call sign detection","volume":"abs\/1810.12614","author":"Pellegrini","year":"2018","journal-title":"CoRR"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-019-09449-5"},{"key":"ref21","author":"Helmke","year":"2023","journal-title":"The HAAWAII Framework for Automatic Speech Understanding of Air Traffic Communication"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2024.1360094"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2023.110851"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.3390\/aerospace10060538"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-318"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.444"},{"key":"ref27","article-title":"Accent-robust automatic speech recognition using supervised and unsupervised 
wav2vec embeddings","author":"Li","year":"2021","journal-title":"arXiv preprint"},{"key":"ref28","article-title":"Improving Accent Identification and Accented Speech Recognition Under a Framework of Self-supervised Learning","volume":"abs\/2109.07349","author":"Deng","year":"2021","journal-title":"ArXiv"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-333"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.3390\/diagnostics14090895"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1121\/10.0024876"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10095057"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2024.1360094"},{"key":"ref34","article-title":"Supervised contrastive learning for accented speech recognition","author":"Han","year":"2021","journal-title":"arXiv preprint"},{"key":"ref35","article-title":"Accented speech recognition: Benchmarking, pre-training, and diverse data","volume":"abs\/2205.08014","author":"Aksenova","year":"2022","journal-title":"ArXiv"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096268"},{"key":"ref37","author":"Radford","year":"2022","journal-title":"Robust Speech Recognition via Large-Scale Weak Supervision"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.3390\/aerospace8030065"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2024.3423652"},{"key":"ref40","article-title":"Investigation and Analysis of \u201cCapture Effect\u201d in F-M and A-M Communication Systems","volume-title":"Naval Research Laboratory, Washington, DC, Tech. 
Rep.","author":"Zeek","year":"1949"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICMCIS61231.2024.10540964"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.3390\/aerospace10060526"},{"key":"ref43","article-title":"Whisper-ATC Open Models for Air Traffic Control Automatic Speech Recognition with Accuracy","author":"Van Doorn","year":"2024","journal-title":"ICRAT"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.3389\/fpsyg.2024.1383904"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1051\/shsconf\/202110101007"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2018.8462663"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1155\/2023\/8676366"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.13052\/jcsm2245-1439.1261"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.38124\/ijisrt\/ijisrt24jun1134"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pcbi.1008228"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1177\/1548512919869567"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1117\/12.2518917"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178964"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.3390\/s23062927"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1119\/10.0009409"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-10959"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2006-40"},{"key":"ref58","article-title":"Using Audio Quality to Predict Word Error Rate in an Automatic Speech Recognition System","volume-title":"The MITRE Corporation, Technical Report","author":"Fish","year":"2006"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.3390\/aerospace10100898"},{"key":"ref60","first-page":"601","article-title":"Air traffic control communication (atcc) speech corpora and their use for asr and tts 
development","volume":"53","author":"Ircing","year":"2019","journal-title":"Language Resources and Evaluation"},{"key":"ref61","article-title":"Manual of Radiotelephony","volume-title":"International Civil Aviation Organization (ICAO)","year":"2018"},{"key":"ref62","article-title":"Federal Aviation Administration (FAA)","volume-title":"Pilot\/Controller Glossary","year":"2025"},{"key":"ref63","first-page":"1","article-title":"Normalization of audio signals for the needs of machine learning","author":"Kowalski","year":"2022","journal-title":"2022 Signal Processing: Algorithms, Architectures, Arrangements, and Applications (SPA). IEEE"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/SLT61566.2024.10832185"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/icasspw65056.2025.11010998"}],"event":{"name":"2025 International Conference on Military Communication and Information Systems (ICMCIS)","location":"Oeiras, Portugal","start":{"date-parts":[[2025,5,13]]},"end":{"date-parts":[[2025,5,14]]}},"container-title":["2025 International Conference on Military Communication and Information Systems (ICMCIS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11047255\/11047555\/11047661.pdf?arnumber=11047661","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,1]],"date-time":"2025-07-01T05:41:58Z","timestamp":1751348518000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11047661\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,13]]},"references-count":65,"URL":"https:\/\/doi.org\/10.1109\/icmcis64378.2025.11047661","relation":{},"subject":[],"published":{"date-parts":[[2025,5,13]]}}}