{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,25]],"date-time":"2025-09-25T18:06:59Z","timestamp":1758823619935,"version":"3.41.0"},"reference-count":70,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2017,2,28]],"date-time":"2017-02-28T00:00:00Z","timestamp":1488240000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J AUDIO SPEECH MUSIC PROC."],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1186\/s13636-017-0102-8","type":"journal-article","created":{"date-parts":[[2017,2,28]],"date-time":"2017-02-28T02:18:01Z","timestamp":1488248281000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Statistical analysis of orthographic and phonemic language corpus for word-based and phoneme-based Polish language modelling"],"prefix":"10.1186","volume":"2017","author":[{"given":"Piotr","family":"K\u0142osowski","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2017,2,28]]},"reference":[{"key":"102_CR1","volume-title":"Fundamentals of Speech Recognition. Prentice Hall signal processing series","author":"L Rabiner","year":"1993","unstructured":"L Rabiner, B Juang, Fundamentals of Speech Recognition. Prentice Hall signal processing series (PTR Prentice Hall, USA, 1993)."},{"key":"102_CR2","doi-asserted-by":"publisher","first-page":"163","DOI":"10.1016\/j.csl.2015.07.001","volume":"35","author":"JR Bellegarda","year":"2016","unstructured":"JR Bellegarda, C Monz, State of the art in statistical methods for language and speech processing. Comput. Speech Lang. 35:, 163\u2013184 (2016).","journal-title":"Comput. Speech Lang"},{"key":"102_CR3","volume-title":"Encyclopedia of Language and Linguistics, Statistical methods for the recognition and understanding of speech","author":"L Rabiner","year":"2005","unstructured":"L Rabiner, B Juang, Encyclopedia of Language and Linguistics, Statistical methods for the recognition and understanding of speech (Elsevier, Amsterdam, 2005)."},{"key":"102_CR4","first-page":"19","volume-title":"Incorporating Knowledge Sources into Statistical Speech Recognition, vol 42 of Lecture Notes in Electrical Engineering","author":"S Sakti","year":"2009","unstructured":"S Sakti, K Markov, S Nakamura, W Minker, in Incorporating Knowledge Sources into Statistical Speech Recognition, vol 42 of Lecture Notes in Electrical Engineering. Statistical Speech Recognition (Springer USUSA, 2009), pp. 19\u201353."},{"key":"102_CR5","doi-asserted-by":"publisher","first-page":"76","DOI":"10.1109\/89.817455","volume":"8","author":"J Bellegarda","year":"2000","unstructured":"J Bellegarda, Large vocabulary speech recognition with multispan statistical language models. IEEE Transa. Speech Audio Process. 8:, 76\u201384 (2000).","journal-title":"IEEE Transa. Speech Audio Process"},{"key":"102_CR6","first-page":"236","volume-title":"Computer Nerworks vol 79 of Communications in Computer and Information Science","author":"P K\u0142osowski","year":"2010","unstructured":"P K\u0142osowski, in Computer Nerworks vol 79 of Communications in Computer and Information Science, ed. by A Kwiecien, P Gaj, and P Stera. Speech processing application based on phonetics and phonology of the polish language. 17th International Conference Computer Networks, Ustron, Poland, Jun 15-19 (Springer-VerlagBerlin, 2010), pp. 236\u2013244."},{"key":"102_CR7","first-page":"303","volume":"89","author":"P K\u0142osowski","year":"2013","unstructured":"P K\u0142osowski, Improving speech processing based on phonetics and phonology of Polish language. Przegl\u0105d Elektrotechniczny. 89:, 303\u2013307 (2013).","journal-title":"Przegl\u0105d Elektrotechniczny"},{"issue":"1","key":"102_CR8","first-page":"29","volume":"47","author":"J Izydorczyk","year":"1999","unstructured":"J Izydorczyk, P K\u0142osowski, Acoustic properties of Polish vowels. Bull. Pol. Acad. Sci. Tech. Sci. 47(1), 29\u201337 (1999).","journal-title":"Bull. Pol. Acad. Sci. Tech. Sci"},{"key":"102_CR9","first-page":"61","volume-title":"International Conference Programable Devices and Systems PDS2001 IFAC Workshop, Gliwice November 22nd - 23rd","author":"J Izydorczyk","year":"2001","unstructured":"J Izydorczyk, P K\u0142osowski, in International Conference Programable Devices and Systems PDS2001 IFAC Workshop, Gliwice November 22nd - 23rd. Base acoustic properties of Polish speech (IFACGliwice, 2001), pp. 61\u201366."},{"key":"102_CR10","first-page":"308","volume-title":"Computer Networks, CN 2014. vol 431 of Communications in Computer and Information Science","author":"P K\u0142osowski","year":"2014","unstructured":"P K\u0142osowski, A Dustor, J Izydorczyk, J Kotas, Slimok J, in Computer Networks, CN 2014. vol 431 of Communications in Computer and Information Science, ed. by A Kwiecien, P Gaj, and P Stera. Speech recognition based on open source speech processing software. 21st International Science Conference on Computer Networks (CN), Brunow, Poland, Jun 23-27 (Springer-VerlagBerlin, 2014), pp. 308\u2013317."},{"key":"102_CR11","first-page":"456","volume-title":"Computer Networks, CN 2013. vol 370 of Communications in Computer and Information Science","author":"A Dustor","year":"2013","unstructured":"A Dustor, K\u0142osowski P, in Computer Networks, CN 2013. vol 370 of Communications in Computer and Information Science, ed. by A Kwiecien, P Gaj, and Stera P. Biometric voice identification based on Fuzzy Kernel Classifier. 20th International Conference on Computer Networks (CN), Lwowek Slaski, Poland, Jun 17-21 (Springer-VerlagBerlin, 2013), pp. 456\u2013465."},{"key":"102_CR12","doi-asserted-by":"publisher","first-page":"206","DOI":"10.1109\/ICMCS.2014.6911233","volume-title":"2014 International Conference on Multimedia Computing and Systems (ICMCS)","author":"A Dustor","year":"2014","unstructured":"A Dustor, P K\u0142osowski, J Izydorczyk, in 2014 International Conference on Multimedia Computing and Systems (ICMCS). Speaker recognition system with good generalization properties. International Conference on Multimedia Computing and Systems (ICMCS), Marrakech, Morocco, Apr 14-16 (IEEEUSA, 2014), pp. 206\u2013210."},{"key":"102_CR13","first-page":"177","volume-title":"Computer Networks, CN 2014. vol 431 of, Communications in Computer and Information Science","author":"A Dustor","year":"2014","unstructured":"A Dustor, P K\u0142osowski, J Izydorczyk, in Computer Networks, CN 2014. vol 431 of, Communications in Computer and Information Science, ed. by A Kwiecien, P Gaj, and P Stera. Influence of Feature Dimensionality and Model Complexity on Speaker Verification Performance. 21st International Science Conference on Computer Networks (CN), Brunow, Poland, Jun 23-27 (Springer-VerlagBerlin, 2014), pp. 177\u2013186."},{"key":"102_CR14","first-page":"400","volume-title":"Computer Networks, CN 2015. vol 522 of Communications in Computer and Information Science","author":"P K\u0142osowski","year":"2015","unstructured":"P K\u0142osowski, A Dustor, J Izydorczyk, in Computer Networks, CN 2015. vol 522 of Communications in Computer and Information Science, ed. by P Gaj, A Kwiecien, and P Stera. Speaker verification performance evaluation based on open source speech processing software and timit speech corpus. 22nd International Conference on Computer Networks (CN), Brunow, Poland, Jun 16-19 (Springer-VerlagBerlin, 2015), pp. 400\u2013409."},{"key":"102_CR15","first-page":"242","volume-title":"Computer Networks, CN 2015. vol 522 of Communications in Computer and Information Science","author":"A Dustor","year":"2015","unstructured":"A Dustor, P K\u0142osowski, J Izydorczyk, R Kopanski, in Computer Networks, CN 2015. vol 522 of Communications in Computer and Information Science, ed. by P Gaj, A Kwiecien, and P Stera. Influence of Corpus Size on Speaker Verification. 22nd International Conference on Computer Networks (CN), Brunow, Poland (Springer-VerlagBerlin, 2015), pp. 242\u2013249."},{"key":"102_CR16","first-page":"466","volume-title":"Computer Networks, CN 2013. vol 370 of Communications in Computer and Information Science","author":"P K\u0142osowski","year":"2013","unstructured":"P K\u0142osowski, Dustor A, in Computer Networks, CN 2013. vol 370 of Communications in Computer and Information Science, ed. by A Kwiecien, P Gaj, and P Stera. Automatic Speech Segmentation for Automatic Speech Translation. 20th International Conference on Computer Networks (CN), Lwowek Slaski, Poland, Jun 17-21 (Springer-VerlagBerlin, 2013), pp. 466\u2013475."},{"key":"102_CR17","volume-title":"Statistical Methods for Speech Recognition. Language, Speech, & Communication: A Bradford Book","author":"F Jelinek","year":"1997","unstructured":"F Jelinek, Statistical Methods for Speech Recognition. Language, Speech, & Communication: A Bradford Book (MIT Press, USA, 1997)."},{"key":"102_CR18","doi-asserted-by":"publisher","first-page":"366","DOI":"10.1093\/ietisy\/e88-d.3.366","volume":"E88D","author":"S Furui","year":"2005","unstructured":"S Furui, Recent progress in corpus-based spontaneous speech recognition. IEICE Trans. Inf. Syst. E88D:, 366\u2013375 (2005).","journal-title":"IEICE Trans. Inf. Syst"},{"key":"102_CR19","doi-asserted-by":"crossref","first-page":"71","DOI":"10.3917\/rfla.121.0071","volume":"12","author":"M Adda-Decker","year":"2007","unstructured":"M Adda-Decker, Corpus for automatic speech recognition. Revue Francaise De Linguistique Appliquee. 12:, 71\u201384 (2007).","journal-title":"Revue Francaise De Linguistique Appliquee"},{"key":"102_CR20","volume-title":"The National Corpus of Polish (in Polish: Narodowy Korpus J\u0119zyka Polskiego)","author":"A Przepi\u00f3rkowski","year":"2012","unstructured":"A Przepi\u00f3rkowski, M Ba\u0144ko, RL G\u00f3rski, B Lewandowska-Tomaszczyk, The National Corpus of Polish (in Polish: Narodowy Korpus J\u0119zyka Polskiego) (Wydawnictwo Naukowe PWN, Warszawa, 2012)."},{"key":"102_CR21","volume-title":"Proceedings of the Sixth International Conference on Language Resources and Evaluation, LREC 2008","author":"A Przepi\u00f3rkowski","year":"2008","unstructured":"A Przepi\u00f3rkowski, RL G\u00f3rski, B Lewandowska-Tomaszczyk, \u0141azi\u0144ski M, in Proceedings of the Sixth International Conference on Language Resources and Evaluation, LREC 2008. Towards the national corpus of Polish (MarrakechELRA, 2008)."},{"key":"102_CR22","first-page":"231","volume":"63","author":"RL G\u00f3rski","year":"2012","unstructured":"RL G\u00f3rski, B Lewandowska-Tomaszczyk, M Ba\u0144ko, P P\u0119zik, M \u0141azi\u0144ski, A Przepi\u00f3rkowski, Practical applications of the National Corpus of Polish. Prace Filologiczne. 63:, 231\u2013240 (2012).","journal-title":"Prace Filologiczne"},{"key":"102_CR23","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1126\/science.aaa8685","volume":"349","author":"J Hirschberg","year":"2015","unstructured":"J Hirschberg, CD Manning, Advances in natural language processing. Science. 349:, 261\u2013266 (2015).","journal-title":"Science"},{"key":"102_CR24","doi-asserted-by":"crossref","DOI":"10.1017\/9780511807954","volume-title":"Handbook of the International Phonetic Association: A Guide to the Use of the International Phonetic Alphabet. A Regents publication","author":"Association International Phonetic","year":"1999","unstructured":"Association International Phonetic, Handbook of the International Phonetic Association: A Guide to the Use of the International Phonetic Alphabet. A Regents publication (Cambridge University Press, UK, 1999)."},{"key":"102_CR25","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511486807","volume-title":"The Slavic Languages. Cambridge Language Surveys","author":"R Sussex","year":"2006","unstructured":"R Sussex, P Cubberley, The Slavic Languages. Cambridge Language Surveys (Cambridge University Press, UK, 2006)."},{"key":"102_CR26","volume-title":"Handbook of Standards and Resources for Spoken Language Systems. vol Part IV, section B","author":"J Wells","year":"1997","unstructured":"J Wells, in Handbook of Standards and Resources for Spoken Language Systems. vol Part IV, section B, ed. by D Gibbon, R Moore, and R Winski. SAMPA computer readable phonetic alphabet (Mouton de GruyterBerlin and New York, 1997)."},{"key":"102_CR27","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.specom.2016.03.003","volume":"80","author":"M Razavi","year":"2016","unstructured":"M Razavi, R Rasipuram, MM Doss, Acoustic data-driven grapheme-to-phoneme conversion in the probabilistic lexical modeling framework. Speech Commun. 80:, 1\u201321 (2016).","journal-title":"Speech Commun"},{"key":"102_CR28","first-page":"331","volume":"20","author":"RM Kaplan","year":"1994","unstructured":"RM Kaplan, M Kay, Regular models of phonological rule systems. Comput. Linguist. 20:, 331\u2013378 (1994).","journal-title":"Comput. Linguist"},{"key":"102_CR29","first-page":"75","volume":"14","author":"M Steffen-Bat\u00f3g","year":"1973","unstructured":"M Steffen-Bat\u00f3g, The problem of automatic phonemic transcription of written Polish. Biuletyn Fonograficzny. 14:, 75\u201386 (1973).","journal-title":"Biuletyn Fonograficzny"},{"key":"102_CR30","volume-title":"Polish: Automatyzacja transkrypcji fonematycznej tekst\u00f3w polskich","author":"M Steffen-Bat\u00f3g","year":"1975","unstructured":"M Steffen-Bat\u00f3g, in Polish: Automatyzacja transkrypcji fonematycznej tekst\u00f3w polskich. Automatic phonemic transcription of Polish texts (Wydawnictwo Naukowe PWNWarszawa, 1975)."},{"key":"102_CR31","volume-title":"Studia Phonetica Posnaniensia. Vol. 3","author":"M Steffen-Bat\u00f3g","year":"1993","unstructured":"M Steffen-Bat\u00f3g, Nowakowski P, in Studia Phonetica Posnaniensia. Vol. 3, ed. by M Steffen-Bat\u00f3g, W Awedyk. An algorithm for phonetic transcription of orthographic texts in Polish (Wydawnictwo Naukowe UAMPozna\u0144, 1993)."},{"key":"102_CR32","volume-title":"A phonemic transcription and syllable division rule engine","author":"W Jassem","year":"1996","unstructured":"W Jassem, A phonemic transcription and syllable division rule engine (Onomastica-Copernicus Research Colloquium, Edinburgh, 1996)."},{"key":"102_CR33","first-page":"298","volume-title":"Proceedings of 20th IEEE International Conference Signal Processing Algorithms, Architectures, Arrangements, and App.lications, September 21-23","author":"P K\u0142osowski","year":"2016","unstructured":"P K\u0142osowski, in Proceedings of 20th IEEE International Conference Signal Processing Algorithms, Architectures, Arrangements, and App.lications, September 21-23. Algorithm and implementation of automatic phonemic transcription for polish (Poznan University of TechnologyPozna\u0144, 2016), pp. 298\u2013303."},{"key":"102_CR34","volume-title":"Speech and Language Technology. Vol. 3","author":"M Wypych","year":"1999","unstructured":"M Wypych, in Speech and Language Technology. Vol. 3. Implementation of phonenic transcription alghorithm (in Polish: Implementacja algorytmu transkrypcji fonematycznej) (Polskie Towarzystwo FonetycznePozna\u0144, 1999)."},{"key":"102_CR35","unstructured":"G Demenko, M Wypych, E Baranowska, Implementation of grapheme-to-phoneme rules and extended SAMPA alphabet in Polish text-to-speech synthesis. Speech Lang. Technol. 7(17) (2003)."},{"key":"102_CR36","doi-asserted-by":"publisher","first-page":"292","DOI":"10.1109\/HSI.2013.6577838","volume-title":"2013 6th International Conferance on Human Systems Interactions (HSI)","author":"P Przybysz","year":"2013","unstructured":"P Przybysz, W Kasprzak, in 2013 6th International Conferance on Human Systems Interactions (HSI), ed. by WA Paja, BM Wilamowski. The generation of letter-to-sound rules for grapheme-to-phoneme conversion. Conference on Human System Interaction. Gdansk Univ Technol; Univ Informat Technol & Management; IEEE Ind Elect Soc (Gdansk University of TechlologyGdansk, 2013), pp. 292\u2013297."},{"key":"102_CR37","volume-title":"7th Language & Technology Conference, Pozna\u0144","author":"D Skurzok","year":"2015","unstructured":"D Skurzok, B Zi\u00f3\u0142ko, Zi\u00f3\u0142ko M, in 7th Language & Technology Conference, Pozna\u0144. Ortfon2 - tool for orthographic to phonetic transcription (Adam Mickiewicz University in PoznanPoznan, 2015)."},{"key":"102_CR38","unstructured":"D Kor\u017einek, \u0141 Brocki, Marasek K, Polish grapheme-to-phoneme tool and service, CLARIN-PL digital repository (2016). http:\/\/hdl.handle.net\/11321\/295 , (Online: 2016.08.01)."},{"key":"102_CR39","unstructured":"Wiktionary, Polish Language Dictionary (2015). https:\/\/pl.wiktionary.org\/. Accessed 17 Feb 2017."},{"key":"102_CR40","unstructured":"W Jassem, Podstawy fonetyki akustycznej (eng. Rudiments of acoustic phonetics) (PWN, Warszawa, 1973)."},{"key":"102_CR41","first-page":"179","volume":"32","author":"P \u0141obacz","year":"1974","unstructured":"P \u0141obacz, W Jassem, Fonotaktyczna analiza m\u00f3wionego tekstu polskiego (eng. Phonotactic analysis of spoken Polish texts). Biuletyn Polskiego Towarzystwa J\u0119. 32:, 179\u2013195 (1974).","journal-title":"Biuletyn Polskiego Towarzystwa J\u0119"},{"key":"102_CR42","unstructured":"C Basztura, Rozmawiac z komputerem (Eng. To speak with computers), (1992)."},{"key":"102_CR43","unstructured":"B Zi\u00f3\u0142ko, J Ga\u0142ka, S Manandhar, RC Wilson, M Zi\u00f3\u0142ko, in Human Language Technology: Challenges of the Information Society. Vol 5603 of Lecture Notes in Artificial Intelligence, ed. by Z Vetulani, H Uszkoreit. Triphone Statistics for Polish Language. 3rd Language and Technology Conference 2007, Poznan, Poland, Oct 05-07, (2009), pp. 63\u201373."},{"key":"102_CR44","first-page":"97","volume":"10","author":"B Zi\u00f3\u0142ko","year":"2009","unstructured":"B Zi\u00f3\u0142ko, J Ga\u0142ka, M Zi\u00f3\u0142ko, Polish phoneme statistics obtained on large set of written texts. Comput. Sci. (AGH). 10:, 97\u2013106 (2009).","journal-title":"Comput. Sci. (AGH)"},{"key":"102_CR45","first-page":"561","volume-title":"Computer Science and Information Technology (IMCSIT), Proceedings of the 2010 International Multiconference on","author":"B Zi\u00f3\u0142ko","year":"2010","unstructured":"B Zi\u00f3\u0142ko, Ga\u0142ka J, in Computer Science and Information Technology (IMCSIT), Proceedings of the 2010 International Multiconference on. Polish phones statistics (AGH Univesity of Science and TechnologyKrakow, 2010), pp. 561\u2013565."},{"key":"102_CR46","volume-title":"2014 XXII Annual Pacific Voice Conference (PVC)","author":"B Zi\u00f3\u0142ko","year":"2014","unstructured":"B Zi\u00f3\u0142ko, P Zelasko, Skurzok D, in 2014 XXII Annual Pacific Voice Conference (PVC). Statistics of diphones and triphones presence on the word boundaries in the Polish language. App.lications to ASR. Annual Pacific Voice Conference, AGH; Pacific Voice Speech Fdn, 2014. 22nd Annual Pacific Voice Conference (PVC) (KrakowAGH Univesity of Science and Technology, 2014)."},{"key":"102_CR47","volume-title":"The development of language: Acquisition, change, and evolution","author":"D Lightfoot","year":"1999","unstructured":"D Lightfoot, The development of language: Acquisition, change, and evolution (Wiley-Blackwell, Hoboken, 1999)."},{"key":"102_CR48","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511804489","volume-title":"Corpus linguistics: Investigating language structure and use","author":"D Biber","year":"1998","unstructured":"D Biber, S Conrad, R Repp.en, Corpus linguistics: Investigating language structure and use (Cambridge University Press, Cambridge, 1998)."},{"key":"102_CR49","doi-asserted-by":"publisher","unstructured":"R Facchinetti, M Rissanen, Corpus-based studies of diachronic English, vol. 31 (Peter Lang, 2006).","DOI":"10.3726\/978-3-0351-0269-7"},{"issue":"3","key":"102_CR50","first-page":"306","volume":"6","author":"GK Zipf","year":"1950","unstructured":"GK Zipf, Human behavior and the principle of least effort. J. Clin. Psychol. 6(3), 306\u2013306 (1950).","journal-title":"J. Clin. Psychol"},{"key":"102_CR51","unstructured":"Y Tambovtsev, C Martindale, Phoneme frequencies follow a yule distribution. SKASE J. Theor. Linguist. 4(2) (2008)."},{"key":"102_CR52","doi-asserted-by":"publisher","first-page":"1112","DOI":"10.3758\/s13423-014-0585-6","volume":"21","author":"ST Piantadosi","year":"2014","unstructured":"ST Piantadosi, Zipf\u2019s word frequency law in natural language: A critical review and future directions. Psychonimic Bull. Rev. 21:, 1112\u20131130 (2014).","journal-title":"Psychonimic Bull. Rev"},{"issue":"7","key":"102_CR53","doi-asserted-by":"publisher","first-page":"e0129031","DOI":"10.1371\/journal.pone.0129031","volume":"10","author":"A Corral","year":"2015","unstructured":"A Corral, G Boleda, R Ferrer-i Cancho, Zipf\u2019s law for word frequencies: word forms versus lemmas in long texts. Plos ONE. 10(7), e0129031 (2015). doi: 10.1371\/journal.pone.0129031 .","journal-title":"Plos ONE"},{"issue":"402-410","key":"102_CR54","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1098\/rstb.1925.0002","volume":"213","author":"GU Yule","year":"1925","unstructured":"GU Yule, A mathematical theory of evolution, based on the conclusions of Dr.J. C. Willis, F.R.S. Phil. Trans. R. Soc. London B Biol Sci. 213(402-410), 21\u201387 (1925).","journal-title":"Phil. Trans. R. Soc. London B Biol Sci"},{"key":"102_CR55","doi-asserted-by":"publisher","first-page":"193","DOI":"10.15439\/2015F386","volume-title":"Computer Science and Information Systems (FedCSIS) 2015 Federated Conference on","author":"S Dziadzio","year":"2015","unstructured":"S Dziadzio, A Nabo\u017bny, A Smywi\u0144ski-Pohl, B Zi\u00f3\u0142ko, in Computer Science and Information Systems (FedCSIS) 2015 Federated Conference on. Comparison of language models trained on written texts and speech transcripts in the context of automatic speech recognition (Lodz University of TechnologyLodz, 2015), pp. 193\u2013197."},{"key":"102_CR56","doi-asserted-by":"publisher","first-page":"225","DOI":"10.1109\/IALP.2012.55","volume-title":"2012 International Conference on Asian Language Processing (IALP 2012)","author":"S Takahashi","year":"2012","unstructured":"S Takahashi, T Morimoto, in 2012 International Conference on Asian Language Processing (IALP 2012), ed. by D Xiong, E Castelli, M Dong, and PTN Yen. N-gram Language Model Based on Multi-Word Expressions in Web Documents for Speech Recognition and Closed-Captioning (Soochow UniversityChina, 2012), pp. 225\u2013228."},{"key":"102_CR57","volume-title":"2013 21st Iranian Conference on Electrical Engineering (ICEE)","author":"A Hatami","year":"2013","unstructured":"A Hatami, A Akbari, B Nasersharif, in 2013 21st Iranian Conference on Electrical Engineering (ICEE). N-gram Adaptation Using Dirichlet Class Language Model Based on Part-of-Speech for Speech Recognition (Ferdowsi University of MashhadMashhadm, 2013)."},{"key":"102_CR58","first-page":"286","volume-title":"New Frontiers in App.lied Artificial Intelligence, vol 5027 of Lecture Notes in Artificial Intelligence","author":"M Bahrani","year":"2008","unstructured":"M Bahrani, H Sameti, N Hafezi, S Momtazi, in New Frontiers in App.lied Artificial Intelligence, vol 5027 of Lecture Notes in Artificial Intelligence, ed. by NT Nguyen, L Borzemski, A Grzech, and M Ali. New word clustering method for building n-gram language models in continuous speech recognition systems (SpringerBerlin, 2008), pp. 286\u2013293."},{"key":"102_CR59","first-page":"295","volume-title":"2008 International Multiconference on Computer Science and Information Technology (IMCSIT), Vols 1 and 2","author":"B Rapp","year":"2008","unstructured":"B Rapp, in 2008 International Multiconference on Computer Science and Information Technology (IMCSIT), Vols 1 and 2, ed. by M Ganzha, M Paprzycki, and T PelechPilichowski. N-gram language models for Polish language. Basic concepts and applications in automatic speech recognition systems (IEEE Computer Society PressLos Alamitos, 2008), pp. 295\u2013298."},{"issue":"1\u20132","key":"102_CR60","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1016\/S0167-6393(01)00041-3","volume":"38","author":"D Klakow","year":"2002","unstructured":"D Klakow, P Jochen, Testing the correlation of word error rate and perplexity. Speech Commun. 38(1\u20132), 19\u201328 (2002).","journal-title":"Speech Commun"},{"key":"102_CR61","doi-asserted-by":"publisher","DOI":"10.1002\/0471200611","volume-title":"Wiley series in telecommunications: Elements of information theory","author":"T Cover","year":"1991","unstructured":"T Cover, J Thomas, Wiley series in telecommunications: Elements of information theory (John Wiley and Sons, USA, 1991)."},{"key":"102_CR62","volume-title":"Interspeech","author":"P Yu","year":"2004","unstructured":"P Yu, FTB Seide, in Interspeech. A hybrid word\/phoneme-based app.roach for improved vocabulary-independent search in spontaneous speech (CiteseerJeju Island, 2004)."},{"issue":"1","key":"102_CR63","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1186\/s13636-016-0093-x","volume":"2016","author":"V Chunwijitra","year":"2016","unstructured":"V Chunwijitra, A Chotimongkol, C Wutiwiwatchai, A hybrid input-type recurrent neural network for lvcsr language modeling. EURASIP J. Audio Speech Music Process. 2016(1), 15 (2016).","journal-title":"EURASIP J. Audio Speech Music Process"},{"key":"102_CR64","doi-asserted-by":"crossref","unstructured":"A Yazgan, M Saraclar, in Acoustics, Speech, and Signal Processing, 2004. Proceedings.(ICASSP\u201904). IEEE International Conference on. Hybrid language models for out of vocabulary word detection in large vocabulary conversational speech recognition. vol 1 (IEEE, 2004), pp. I\u2013745.","DOI":"10.1109\/ICASSP.2004.1326093"},{"key":"102_CR65","unstructured":"M Larson, Sub-word-based language models for speech recognition: implications for spoken document retrieval. Whorkshop on Language Modeling and Information Retrieval (2001)."},{"key":"102_CR66","first-page":"144","volume-title":"Advances in Natural Language Processing. vol 8686 of Lecture Notes in Artificial Intelligence","author":"A Czardybon","year":"2014","unstructured":"A Czardybon, O Hellwig, W Petersen, in Advances in Natural Language Processing. vol 8686 of Lecture Notes in Artificial Intelligence, ed. by A Przepiorkowski, M Ogrodniczuk. Statistical Analysis of the Interaction between Word Order and Definiteness in Polish. Polish Acad Sci, Inst Comp Sci, 2014. 9th International Conference on Natural Language Processing (NLP), Warsaw, Poland, Sep 17-19 (Polish Academy of Science, Institute of Conputer ScinceWarsaw, 2014), pp. 144\u2013150."},{"key":"102_CR67","doi-asserted-by":"publisher","first-page":"471","DOI":"10.3758\/s13428-014-0489-4","volume":"47","author":"P Mandera","year":"2015","unstructured":"P Mandera, E Keuleers, Z Wodniecka, M Brysbaert, Subtlex-pl: subtitle-based word frequency estimates for Polish. Behav. Res. Methods. 47:, 471\u2013483 (2015).","journal-title":"Behav. Res. Methods"},{"key":"102_CR68","doi-asserted-by":"publisher","first-page":"76","DOI":"10.1109\/89.817455","volume":"8","author":"JR Bellegarda","year":"2000","unstructured":"JR Bellegarda, Large vocabulary speech recognition with multispan statistical language models. IEEE Trans. Speech Audio Process. 8:, 76\u201384 (2000).","journal-title":"IEEE Trans. Speech Audio Process"},{"issue":"3","key":"102_CR69","doi-asserted-by":"publisher","first-page":"492","DOI":"10.1016\/j.csl.2006.09.003","volume":"21","author":"H Schwenk","year":"2007","unstructured":"H Schwenk, Continuous space language models. Comput. Speech Lang. 21(3), 492\u2013518 (2007).","journal-title":"Comput. Speech Lang"},{"key":"102_CR70","doi-asserted-by":"crossref","first-page":"1441","DOI":"10.21437\/Interspeech.2011-252","volume-title":"INTERSPEECH","author":"MAB Shaik","year":"2011","unstructured":"MAB Shaik, E-D AMousa, R Schl\u00fcter, H Ney, in INTERSPEECH. Hybrid language models using mixed types of sub-lexical units for open vocabulary German LVCSR (International Speech Communication Association (ISCA)Baixas, 2011), pp. 1441\u20131444."}],"container-title":["EURASIP Journal on Audio, Speech, and Music Processing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13636-017-0102-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s13636-017-0102-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s13636-017-0102-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,15]],"date-time":"2025-06-15T20:45:30Z","timestamp":1750020330000},"score":1,"resource":{"primary":{"URL":"https:\/\/asmp-eurasipjournals.springeropen.com\/articles\/10.1186\/s13636-017-0102-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,2,28]]},"references-count":70,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["102"],"URL":"https:\/\/doi.org\/10.1186\/s13636-017-0102-8","relation":{},"ISSN":["1687-4722"],"issn-type":[{"type":"electronic","value":"1687-4722"}],"subject":[],"published":{"date-parts":[[2017,2,28]]},"article-number":"5"}}