{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T00:48:47Z","timestamp":1740098927157,"version":"3.37.3"},"publisher-location":"Cham","reference-count":25,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319664286"},{"type":"electronic","value":"9783319664293"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-66429-3_42","type":"book-chapter","created":{"date-parts":[[2017,8,12]],"date-time":"2017-08-12T02:02:55Z","timestamp":1502503375000},"page":"427-437","source":"Crossref","is-referenced-by-count":2,"title":["Improving of LVCSR for Causal Czech Using Publicly Available Language Resources"],"prefix":"10.1007","author":[{"given":"Petr","family":"Mizera","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Petr","family":"Pollak","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2017,8,13]]},"reference":[{"key":"42_CR1","doi-asserted-by":"crossref","unstructured":"Cui, J., Ramabhadran, B., Cui, X., Rosenberg, A., Kingsbury, B., Sethy, A.: Recent improvements in neural network acoustic modeling for LVCSR in low resource languages. In: Proceedings of Interspeech 2014: 15th Annual Conference of the International Speech Communication Association, Singapore (2014)","DOI":"10.21437\/Interspeech.2014-213"},{"key":"42_CR2","doi-asserted-by":"crossref","unstructured":"Seltzer, L.M., Dong, Y., Yongqiang, W.: An investigation of deep neural networks for noise robust speech recognition. In: IEEE International Conference on Acoustics, Speech and Signal Processing, ICASSP 2013, Vancouver, Canada (2013)","DOI":"10.1109\/ICASSP.2013.6639100"},{"key":"42_CR3","unstructured":"Korvas, M., Pl\u00e1tek, O., Du\u0161ek, O., \u017dilka, L., Jur\u010d\u00ed\u010dek, F.: Free English and Czech telephone speech corpus shared under the CC-BY-SA 3.0 license. In: Proceedings of LREC 2014: 9th International Conference on Language Resources and Evaluation, Reykjavik, Iceland, pp. 365\u2013370 (2014)"},{"key":"42_CR4","doi-asserted-by":"crossref","unstructured":"Barras, C., Lamel, L., Gauvain, J.L.: Automatic transcription of compressed broadcast audio. In: Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing, Salt Lake City, USA, pp. 265\u2013268 (2001)","DOI":"10.1109\/ICASSP.2001.940818"},{"key":"42_CR5","doi-asserted-by":"crossref","unstructured":"Nouza, J., \u017dd\u00e1nsk\u00fd, J., \u010cerva, P.: System for automatic collection, annotation and indexing of Czech broadcast speech with full-text search. In: Proceedings of 15th IEEE MELECON Conference, La Valleta, Malta, pp. 202\u2013205 (2010)","DOI":"10.1109\/MELCON.2010.5476306"},{"key":"42_CR6","doi-asserted-by":"crossref","unstructured":"Nouza, J., Blavka, K., Bohac, M., Cerva, P., M\u00e1lek, J.: System for producing subtitles to internet audio-visual documents. In: 38th International Conference on Telecommunications and Signal Processing, TSP 2015, Prague, Czech Republic, pp. 1\u20135, 9\u201311 July 2015","DOI":"10.1109\/TSP.2015.7296415"},{"key":"42_CR7","unstructured":"Psutka, J., Psutka, J., Ircing, P., Hoidekr, J.: Recognition of spontaneously pronounced TV ice-hockey commentary. In: Proceedings of ISCA & IEEE Workshop on Spontaneous Speech Processing and Recognition, Tokyo, pp. 83\u201386 (2003)"},{"key":"42_CR8","doi-asserted-by":"crossref","unstructured":"Lehr, M., Gorman, K., Shafran, I.: Discriminative pronunciation modeling for dialectal speech recognition. In: Proceedings of Interspeech 2014, Singapore, pp. 1458\u20131462 (2014)","DOI":"10.21437\/Interspeech.2014-356"},{"key":"42_CR9","doi-asserted-by":"crossref","unstructured":"Nouza, J., Silovsk\u00fd, J.: Adpating lexical and language models for transcription of highly spontaneous spoken Czech. In: Proceedings of Text, Speech, and Dialogue, LNAI, vol. 6231, Brno, Czech Republic, pp. 377\u2013384 (2010)","DOI":"10.1007\/978-3-642-15760-8_48"},{"issue":"4","key":"42_CR10","doi-asserted-by":"crossref","first-page":"420","DOI":"10.1109\/TSA.2004.828702","volume":"12","author":"W Byrne","year":"2004","unstructured":"Byrne, W., et al.: Automatic recognition of spontaneous speech for access to multilingual oral history archives. IEEE Trans. Speech Audio Process. 12(4), 420\u2013435 (2004)","journal-title":"IEEE Trans. Speech Audio Process."},{"key":"42_CR11","unstructured":"Ernestus, M., Ko\u010dkov\u00e1-Amortov\u00e1, L., Poll\u00e1k, P.: The Nijmegen corpus of casual Czech. In: Proceedings of LREC 2014: 9th International Conference on Language Resources and Evaluation, Reykjavik, Iceland, pp. 365\u2013370 (2014)"},{"key":"42_CR12","doi-asserted-by":"crossref","first-page":"201","DOI":"10.1016\/j.specom.2009.10.004","volume":"52","author":"F Torreira","year":"2010","unstructured":"Torreira, F., Adda-Decker, M., Ernestus, M.: The Nijmegen corpus of casual French. Speech Commun. 52, 201\u2013221 (2010)","journal-title":"Speech Commun."},{"key":"42_CR13","unstructured":"Prochazka, V., Pollak, P.: Conversational speech from Nijmegen corpus of casual Czech by general ASR language models. In: Production and Comprehension of Conversational Speech, pp. 34\u201335 (2011)"},{"issue":"6","key":"42_CR14","doi-asserted-by":"crossref","first-page":"82","DOI":"10.1109\/MSP.2012.2205597","volume":"29","author":"G Hinton","year":"2012","unstructured":"Hinton, G., Deng, L., Yu, D., Dahl, G., Mohamed, A., Jaitly, N., Senior, A., Vanhoucke, V., Nguyen, P., Sainath, T., Kingsbury, B.: Deep neural networks for acoustic modeling in speech recognition: the shared views of four research groups. IEEE Sig. Process. Mag. 29(6), 82\u201397 (2012)","journal-title":"IEEE Sig. Process. Mag."},{"key":"42_CR15","doi-asserted-by":"crossref","unstructured":"Vesely, K., Karafiat, M., Grezl, F.: Convolutive bottleneck network features for lVCSR. In: 2011 IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), December 2011","DOI":"10.1109\/ASRU.2011.6163903"},{"key":"42_CR16","unstructured":"Pollak, P., Cernocky, J.: Czech SPEECON adult database. Technical report (2004)"},{"key":"42_CR17","unstructured":"Institute of the Czech National Corpus: SYN2006PUB corpus (2006). http:\/\/ucnk.ff.cuni.cz\/english\/syn2006pub.php"},{"key":"42_CR18","first-page":"1002","volume":"20","author":"V Prochazka","year":"2011","unstructured":"Prochazka, V., Pollak, P., Zdansky, J., Nouza, J.: Performance of Czech speech recognition with language models created from public resources. Radioengineering 20, 1002\u20131008 (2011)","journal-title":"Radioengineering"},{"key":"42_CR19","unstructured":"Institute of the Czech National Corpus: Corpus oral 2006 and oral 2008 and oral 2013, Institute of the Czech National Corpus FF UK. http:\/\/www.korpus.cz"},{"key":"42_CR20","doi-asserted-by":"crossref","unstructured":"Schuppler, B., Adda-Decker, M., Morales-Cordovilla, J.A.: Pronunciation variation in read and conversational Austrian German. In: Proceedings of Interspeech 2014, Singapore (2014)","DOI":"10.21437\/Interspeech.2014-355"},{"key":"42_CR21","unstructured":"Kolman, A., Pollak, P.: Speech reduction in Czech. In: Proceedings of LabPhone 14, The 14th Conference on Laboratory Phonology, Tokyo, Japan (2014)"},{"key":"42_CR22","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"377","DOI":"10.1007\/978-3-642-03320-9_35","volume-title":"Cross-Modal Analysis of Speech, Gestures, Gaze and Facial Expressions","author":"J Rajnoha","year":"2009","unstructured":"Rajnoha, J., Poll\u00e1k, P.: Czech spontaneous speech collection and annotation: the database of technical lectures. In: Esposito, A., V\u00edch, R. (eds.) Cross-Modal Analysis of Speech, Gestures, Gaze and Facial Expressions. LNCS, vol. 5641, pp. 377\u2013385. Springer, Heidelberg (2009). doi: 10.1007\/978-3-642-03320-9_35"},{"key":"42_CR23","unstructured":"Povey, D., et al.: The Kaldi speech recognition toolkit. In: Proceedings of ASRU 2011, IEEE 2011 Workshop on Automatic Speech Recognition and Understanding (2011)"},{"key":"42_CR24","unstructured":"Fousek, P., Pollak, P.: Efficient and reliable measurement and simulation of noisy speech background. In: Proceedings of EUROSPEECH 2003, 8-th European Conference on Speech Communication and Technology, Geneve, Switzerland (2003)"},{"key":"42_CR25","doi-asserted-by":"crossref","unstructured":"Borsky, M., Mizera, P., Pollak, P.: Noise and channel normalized cepstral features for far-speech recognition. In: Proceedings of SPECOM 2013, The 15th International Conference on Speech and Computer, Pilsen, Czech Republic (2013)","DOI":"10.1007\/978-3-319-01931-4_32"}],"container-title":["Lecture Notes in Computer Science","Speech and Computer"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-66429-3_42","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,1]],"date-time":"2022-08-01T03:35:59Z","timestamp":1659324959000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-66429-3_42"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9783319664286","9783319664293"],"references-count":25,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-66429-3_42","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2017]]}}}