{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,7]],"date-time":"2024-09-07T21:45:53Z","timestamp":1725745553039},"publisher-location":"Berlin, Heidelberg","reference-count":17,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642405846"},{"type":"electronic","value":"9783642405853"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2013]]},"DOI":"10.1007\/978-3-642-40585-3_69","type":"book-chapter","created":{"date-parts":[[2013,8,17]],"date-time":"2013-08-17T10:15:02Z","timestamp":1376734502000},"page":"552-559","source":"Crossref","is-referenced-by-count":2,"title":["The Joint Optimization of Spectro-Temporal Features and Neural Net Classifiers"],"prefix":"10.1007","author":[{"given":"Gy\u00f6rgy","family":"Kov\u00e1cs","sequence":"first","affiliation":[]},{"given":"L\u00e1szl\u00f3","family":"T\u00f3th","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"issue":"2","key":"69_CR1","doi-asserted-by":"publisher","first-page":"133","DOI":"10.1007\/BF00336731","volume":"42","author":"A.M. Aertsen","year":"1981","unstructured":"Aertsen, A.M., Johannesma, P.I.: The spectro-temporal receptive field. A functional characteristic of auditory neurons. Biological Cybernetics\u00a042(2), 133\u2013143 (1981)","journal-title":"Biological Cybernetics"},{"key":"69_CR2","doi-asserted-by":"crossref","unstructured":"Bouvrie, J., Ezzat, T., Poggio, T.: Localized Spectro-Temporal Cepstral Analysis of Speech. In: Proc. ICASSP, pp. 4733\u20134736 (2008)","DOI":"10.1109\/ICASSP.2008.4518714"},{"key":"69_CR3","doi-asserted-by":"crossref","unstructured":"Kov\u00e1cs, G., T\u00f3th, L.: Localized Spectro-Temporal Features for Noise-Robust Speech Recognition. In: Proc. ICCC-CONTI 2010, pp. 481\u2013485 (2010)","DOI":"10.1109\/ICCCYB.2010.5491225"},{"key":"69_CR4","doi-asserted-by":"crossref","unstructured":"Kov\u00e1cs, G., T\u00f3th, L.: Phone Recognition Experiments with 2D-DCT Spectro-Temporal Features. In: Proc. SACI 2011, pp. 143\u2013146 (2011)","DOI":"10.1109\/SACI.2011.5872988"},{"key":"69_CR5","doi-asserted-by":"crossref","unstructured":"Meyer, B.T., Kollmeier, B.: Optimization and evaluation of Gabor feature sets for ASR. In: Proc. Interspeech 2008, pp. 906\u2013909 (2008)","DOI":"10.21437\/Interspeech.2008-211"},{"key":"69_CR6","doi-asserted-by":"crossref","unstructured":"Kleinschmidt, M.: Localized Spectro-Temporal Features for Automatic Speech Recognition. In: Proc. EuroSpeech 2003, pp. 2573\u20132576 (2003)","DOI":"10.21437\/Eurospeech.2003-710"},{"issue":"3","key":"69_CR7","first-page":"416","volume":"88","author":"M. Kleinschmidt","year":"2002","unstructured":"Kleinschmidt, M.: Methods for capturing spectrotemporal modulations in automatic speech recognition. Acta Acustica United With Acustica\u00a088(3), 416\u2013422 (2002)","journal-title":"Acta Acustica United With Acustica"},{"key":"69_CR8","unstructured":"Greenberg, S.: Understanding Speech Understanding: Towards A Unified Theory Of Speech Perception. In: Proceedings of the ESCA Tutorial and Advanced Research Workshop on the Auditory Basis of Speech Perception, pp. 1\u20138 (1996)"},{"key":"69_CR9","doi-asserted-by":"crossref","unstructured":"Ezzat, T., Bouvrie, J., Poggio, T.: Spectro-Temporal Analysis of Speech Using 2-D Gabor Filters. In: Proc. Interspeech 2007, pp. 506\u2013509 (2007)","DOI":"10.21437\/Interspeech.2007-236"},{"key":"69_CR10","doi-asserted-by":"crossref","unstructured":"Kleinschmidt, M., Gelbart, D.: Improving Word Accuracy with Gabor Feature Extraction. In: Proc. ICSLP 2002, pp. 25\u201328 (2002)","DOI":"10.21437\/ICSLP.2002-5"},{"key":"69_CR11","doi-asserted-by":"crossref","unstructured":"Bourlard, H., Morgan, N.: Connectionist speech recognition: A hybrid approach. Kluwer Academic Pub. (1994)","DOI":"10.1007\/978-1-4615-3210-1"},{"key":"69_CR12","doi-asserted-by":"crossref","unstructured":"Abdel-Hamid, O., Mohamed, A., Jiang, H., Penn, G.: Applying Convolutional Neural Networks concepts to hybrid NN-HMM model for speech recognition. In: Proc. ICASSP 2012, pp. 4277\u20134280 (2012)","DOI":"10.1109\/ICASSP.2012.6288864"},{"key":"69_CR13","doi-asserted-by":"crossref","unstructured":"Vesely, K., Karafiat, M., Grezl, F.: Convolutive Bottleneck Network features for LVCSR. In: Proc. ASRU 2011, pp. 42\u201347 (2011)","DOI":"10.1109\/ASRU.2011.6163903"},{"key":"69_CR14","doi-asserted-by":"publisher","first-page":"1641","DOI":"10.1109\/29.46546","volume":"37","author":"K.-F. Lee","year":"1989","unstructured":"Lee, K.-F., Hon, H.-W.: Speaker-independent phone recognition using Hidden Markov models. IEEE Trans. Acoust., Speech Signal Processing\u00a037, 1641\u20131648 (1989)","journal-title":"IEEE Trans. Acoust., Speech Signal Processing"},{"key":"69_CR15","volume-title":"PC The HTK book version 3.4","author":"S.. Young","year":"2006","unstructured":"Young, S., et al.: PC The HTK book version 3.4. Cambridge University Engineering Department, Cambridge (2006)"},{"key":"69_CR16","doi-asserted-by":"crossref","unstructured":"Vinyals, O., Deng, L.: Are sparse representations enough for acoustic modeling? In: Proc. INTERSPEECH (2012)","DOI":"10.21437\/Interspeech.2012-8"},{"issue":"2","key":"69_CR17","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1007\/s13042-011-0019-y","volume":"2","author":"G.-B. Huang","year":"2011","unstructured":"Huang, G.-B., Wang, D.H., Lan, Y.: Extreme learning machines: A survey. International Journal of Machine Learning and Cybernetics\u00a02(2), 107\u2013122 (2011)","journal-title":"International Journal of Machine Learning and Cybernetics"}],"container-title":["Lecture Notes in Computer Science","Text, Speech, and Dialogue"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-40585-3_69","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,3]],"date-time":"2023-07-03T22:53:42Z","timestamp":1688424822000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-40585-3_69"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2013]]},"ISBN":["9783642405846","9783642405853"],"references-count":17,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-40585-3_69","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2013]]}}}