{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,3]],"date-time":"2025-12-03T18:04:09Z","timestamp":1764785049303,"version":"3.28.0"},"reference-count":49,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,1,9]],"date-time":"2023-01-09T00:00:00Z","timestamp":1673222400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,1,9]],"date-time":"2023-01-09T00:00:00Z","timestamp":1673222400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,1,9]]},"DOI":"10.1109\/slt54892.2023.10022718","type":"proceedings-article","created":{"date-parts":[[2023,1,27]],"date-time":"2023-01-27T18:54:03Z","timestamp":1674845643000},"page":"633-640","source":"Crossref","is-referenced-by-count":13,"title":["Bertraffic: Bert-Based Joint Speaker Role and Speaker Change Detection for Air Traffic Control Communications"],"prefix":"10.1109","author":[{"given":"Juan","family":"Zuluaga-Gomez","sequence":"first","affiliation":[{"name":"Idiap Research Institute,Martigny,Switzerland"}]},{"given":"Seyyed Saeed","family":"Sarfjoo","sequence":"additional","affiliation":[{"name":"Idiap Research Institute,Martigny,Switzerland"}]},{"given":"Amrutha","family":"Prasad","sequence":"additional","affiliation":[{"name":"Idiap Research Institute,Martigny,Switzerland"}]},{"given":"Iuliia","family":"Nigmatulina","sequence":"additional","affiliation":[{"name":"Idiap Research Institute,Martigny,Switzerland"}]},{"given":"Petr","family":"Motlicek","sequence":"additional","affiliation":[{"name":"Idiap Research Institute,Martigny,Switzerland"}]},{"given":"Karel","family":"Ondrej","sequence":"additional","affiliation":[{"name":"Brno University of Technology,Brno,Czech Republic"}]},{"given":"Oliver","family":"Ohneiser","sequence":"additional","affiliation":[{"name":"Institute of Flight Guidance,German Aerospace Center (DLR),Braunschweig,Germany"}]},{"given":"Hartmut","family":"Helmke","sequence":"additional","affiliation":[{"name":"Institute of Flight Guidance,German Aerospace Center (DLR),Braunschweig,Germany"}]}],"member":"263","reference":[{"article-title":"Increasing atm efficiency with assistant based speech recognition","volume-title":"Proc. of the 13th USA\/Europe Air Traffic Man-agement Research and Development Seminar","author":"Helmke","key":"ref1"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/DASC.2018.8569879"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.3390\/aerospace8030065"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.cja.2022.08.020"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-1446"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2019-1962"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2021.101254"},{"key":"ref8","article-title":"End-to-end neural speakar di-arization with permutation-free objectives","author":"Fujita","year":"2019","journal-title":"ar Xiv preprint"},{"key":"ref9","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018","journal-title":"arXiv preprint"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-1373"},{"issue":"1","key":"ref11","first-page":"8","article-title":"Au-tomatic processing pipeline for collecting and annotating air-traffic voice communication data","volume-title":"Engineering Proceedings","volume":"13","author":"Kocour"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2014.6853568"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2009.2015698"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1893"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2010.5495087"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683114"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1364"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1943"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003959"},{"key":"ref20","article-title":"End-to-end speaker diarization for an unknown number of speakers with encoder-decoder based at-tractors","author":"Horiguchi","year":"2020","journal-title":"arXiv preprint"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-3039"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414371"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746531"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746964"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5947333"},{"key":"ref26","first-page":"2493","article-title":"Natural language pro-cessing (almost) from scratch","volume":"12","author":"Collobert","year":"2011","journal-title":"Journal of machine learning research"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.5121\/ijnlc.2021.10401"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W17-1412"},{"key":"ref29","first-page":"2145","article-title":"A survey on recent advances in named entity recognition from deep learning models","volume-title":"Proc. of the 27th International Conference on Computational Linguistics","author":"Yadav"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-16-3346-1_66"},{"key":"ref31","first-page":"1","volume-title":"Grammar based identification of speaker role for improving atco and pilot asr","author":"Prasad","year":"2021"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P17-3009"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-935"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/SLT54892.2023.10022724"},{"journal-title":"The Air Traffic Control Corpus (ATC0)-LDC94S14A","year":"1994","author":"Godfrey","key":"ref35"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/s10579-019-09449-5"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746563"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.3390\/proceedings2020059014"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-1058"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-demos.6"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-demo.21"},{"article-title":"Decoupled Weight Decay Regularization","volume-title":"International Conference on Learning Rep-resentations","author":"Loshchilov","key":"ref42"},{"issue":"1","key":"ref43","first-page":"1929","article-title":"Dropout: a simple way to prevent neural networks from overfitting","volume":"15","author":"Srivastava","year":"2014","journal-title":"The journal of machine learning research"},{"key":"ref44","article-title":"Gaussian error linear units (GELUs)","author":"Hendrycks","year":"2016","journal-title":"arXiv preprint"},{"key":"ref45","article-title":"The kaldi speech recognition toolkit","volume-title":"IEEE workshop on automatic speech recognition and understanding. IEEE Signal Processing Soci-ety","volume":"2011","author":"Povey"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2173"},{"key":"ref47","first-page":"1","article-title":"Improving callsign recognition with air-surveillance data in air-traffic communication","volume-title":"Idiap Research Institute","author":"Nigmatulina","year":"2021"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-1268"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1016\/0167-6377(86)90073-8"}],"event":{"name":"2022 IEEE Spoken Language Technology Workshop (SLT)","start":{"date-parts":[[2023,1,9]]},"location":"Doha, Qatar","end":{"date-parts":[[2023,1,12]]}},"container-title":["2022 IEEE Spoken Language Technology Workshop (SLT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10022052\/10022330\/10022718.pdf?arnumber=10022718","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,2]],"date-time":"2024-03-02T15:34:03Z","timestamp":1709393643000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10022718\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,1,9]]},"references-count":49,"URL":"https:\/\/doi.org\/10.1109\/slt54892.2023.10022718","relation":{},"subject":[],"published":{"date-parts":[[2023,1,9]]}}}