{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T15:44:58Z","timestamp":1750347898542,"version":"3.37.3"},"publisher-location":"Cham","reference-count":31,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030302436"},{"type":"electronic","value":"9783030302443"}],"license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-3-030-30244-3_36","type":"book-chapter","created":{"date-parts":[[2019,9,3]],"date-time":"2019-09-03T07:05:29Z","timestamp":1567494329000},"page":"435-447","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Sibilant Consonants Classification with Deep Neural Networks"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9493-1564","authenticated-orcid":false,"given":"Ivo","family":"Anjos","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3019-3304","authenticated-orcid":false,"given":"Nuno","family":"Marques","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2187-8253","authenticated-orcid":false,"given":"Margarida","family":"Grilo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8524-8731","authenticated-orcid":false,"given":"Isabel","family":"Guimar\u00e3es","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6290-5719","authenticated-orcid":false,"given":"Jo\u00e3o","family":"Magalh\u00e3es","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7315-4543","authenticated-orcid":false,"given":"Sofia","family":"Cavaco","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2019,8,30]]},"reference":[{"key":"36_CR1","unstructured":"Amodei, D., et al.: Deep speech 2: end-to-end speech recognition in English and Mandarin. In: Proceedings of The 33rd International Conference on Machine Learning, vol. 48, pp. 173\u2013182. PMLR (2016)"},{"key":"36_CR2","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"430","DOI":"10.1007\/978-3-319-76270-8_30","volume-title":"Advances in Computer Entertainment Technology","author":"I Anjos","year":"2018","unstructured":"Anjos, I., Grilo, M., Ascens\u00e3o, M., Guimar\u00e3es, I., Magalh\u00e3es, J., Cavaco, S.: A serious mobile game with visual feedback for training sibilant consonants. In: Cheok, A.D., Inami, M., Rom\u00e3o, T. (eds.) ACE 2017. LNCS, vol. 10714, pp. 430\u2013450. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-319-76270-8_30"},{"issue":"1","key":"36_CR3","doi-asserted-by":"publisher","first-page":"106","DOI":"10.1136\/adc.67.1.106","volume":"67","author":"J Barratt","year":"1992","unstructured":"Barratt, J., Littlejohns, P., Thompson, J.: Trial of intensive compared with weekly speech therapy in preschool children. Arch. Dis. Child. 67(1), 106\u2013108 (1992)","journal-title":"Arch. Dis. Child."},{"issue":"9","key":"36_CR4","doi-asserted-by":"publisher","first-page":"685","DOI":"10.3844\/jcssp.2007.685.692","volume":"3","author":"Z Benselama","year":"2007","unstructured":"Benselama, Z., Guerti, M., Bencherif, M.: Arabic speech pathology therapy computer aided system. J. Comput. Sci. 3(9), 685\u2013692 (2007)","journal-title":"J. Comput. Sci."},{"issue":"4","key":"36_CR5","doi-asserted-by":"publisher","first-page":"987","DOI":"10.1161\/01.STR.0000062343.64383.D0","volume":"34","author":"SK Bhogal","year":"2003","unstructured":"Bhogal, S.K., Teasell, R., Speechley, M.: Intensity of aphasia therapy, impact on recovery. Stroke 34(4), 987\u2013993 (2003)","journal-title":"Stroke"},{"key":"36_CR6","unstructured":"Carvalho, M.I.P., Ferreira, A.: Interactive game for the training of Portuguese vowels. Master\u2019s thesis. Faculdade de Engenharia da Universidade do Porto (2008)"},{"key":"36_CR7","unstructured":"Clarkson, P., Moreno, P.J.: On the use of support vector machines for phonetic classification. In: Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing, vol. 2, pp. 585\u2013588 (1999)"},{"key":"36_CR8","doi-asserted-by":"crossref","unstructured":"Davis, S.B., Mermelstein, P.: Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences. In: Readings in Speech Recognition, pp. 65\u201374. Elsevier (1990)","DOI":"10.1016\/B978-0-08-051584-7.50010-3"},{"issue":"4","key":"36_CR9","doi-asserted-by":"publisher","first-page":"385","DOI":"10.1080\/02687039608248418","volume":"10","author":"G Denes","year":"1996","unstructured":"Denes, G., Perazzolo, C., Piani, A., Piccione, F.: Intensive versus regular speech therapy in global aphasia: a controlled study. Aphasiology 10(4), 385\u2013394 (1996)","journal-title":"Aphasiology"},{"key":"36_CR10","unstructured":"Figueiredo, A.C.: An\u00e1lise ac\u00fastica dos fonemas produzidos por crian\u00e7as com desempenho articulat\u00f3rio alterado. Master\u2019s thesis. Escola Superior de Sa\u00fade de Alcoit\u00e3o (2017)"},{"key":"36_CR11","doi-asserted-by":"publisher","DOI":"10.1002\/9781118142882","volume-title":"Speech and Audio Signal Processing: Processing and Perception of Speech and Music","author":"B Gold","year":"2011","unstructured":"Gold, B., Morgan, N., Ellis, D.: Speech and Audio Signal Processing: Processing and Perception of Speech and Music, 2nd edn. Wiley-Interscience, Hoboken (2011)","edition":"2"},{"key":"36_CR12","unstructured":"Guimar\u00e3es, I.: A Ci\u00eancia e a Arte da Voz Humana. ESSA - Escola Superior de Sa\u00fade do Alcoit\u00e3o (2007)"},{"issue":"2","key":"36_CR13","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1109\/TASL.2008.2006575","volume":"17","author":"CW Hsu","year":"2009","unstructured":"Hsu, C.W., Lee, L.S.: Higher order cepstral moment normalization for improved robust speech recognition. IEEE Trans. Audio Speech Lang. Process. 17(2), 205\u2013220 (2009)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"36_CR14","volume-title":"Spoken Language Processing: A Guide to Theory, Algorithm, and System Development","author":"X Huang","year":"2001","unstructured":"Huang, X., Acero, A., Hon, H.W.: Spoken Language Processing: A Guide to Theory, Algorithm, and System Development, 1st edn. Prentice Hall PTR, Upper Saddle River (2001)","edition":"1"},{"key":"36_CR15","unstructured":"Kingma, D.P., Ba, J.: Adam: a method for stochastic optimization. In: Proceedings of the International Conference on Learning Representations (ICLR) (2015)"},{"key":"36_CR16","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: ImageNet classification with deep convolutional neural networks. In: Advances in Neural Information Processing Systems, pp. 1097\u20131105 (2012)"},{"key":"36_CR17","unstructured":"Mestre, I.: Sibilantes e motricidade orofacial em crian\u00e7as portuguesas dos 5:00 aos 9:11 anos de idade. Master\u2019s thesis. Escola Superior de Sa\u00fade do Alcoit\u00e3o (2018)"},{"key":"36_CR18","series-title":"Advances in Intelligent Systems and Computing","doi-asserted-by":"publisher","first-page":"367","DOI":"10.1007\/978-3-319-39796-2_30","volume-title":"Information Technologies in Medicine","author":"Z Miodo\u0144ska","year":"2016","unstructured":"Miodo\u0144ska, Z., Kr\u0119cichwost, M., Szyma\u0144ska, A.: Computer-aided evaluation of sibilants in preschool children sigmatism diagnosis. In: Pi\u0119tka, E., Badura, P., Kawa, J., Wieclawek, W. (eds.) Information Technologies in Medicine. AISC, vol. 471, pp. 367\u2013376. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-39796-2_30"},{"key":"36_CR19","unstructured":"Muda, L., Begam, M., Elamvazuthi, I.: Voice recognition algorithms using mel frequency cepstral coefficient and dynamic time warping techniques. Computing Research Repository (CoRR) abs\/1003.4083 (2010)"},{"key":"36_CR20","doi-asserted-by":"crossref","unstructured":"Palaz, D., Magimai-Doss, M., Collobert, R.: Analysis of CNN-based speech recognition system using raw speech as input. In: Proceedings of Interspeech, pp. 11\u201315 (2015)","DOI":"10.21437\/Interspeech.2015-3"},{"issue":"1","key":"36_CR21","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1044\/1092-4388(2009\/09-0021)","volume":"53","author":"J Preston","year":"2010","unstructured":"Preston, J., Edwards, M.L.: Phonological awareness and types of sound errors in preschoolers with speech sound disorders. J. Speech Lang. Hear. Res. 53(1), 44\u201360 (2010)","journal-title":"J. Speech Lang. Hear. Res."},{"key":"36_CR22","unstructured":"Rua, M.: Carateriza\u00e7\u00e3o do desempenho articulat\u00f3rio e oromotor de crian\u00e7as com altera\u00e7\u00f5es da fala. Master\u2019s thesis. Escola Superior de Sa\u00fade de Alcoit\u00e3o (2015)"},{"key":"36_CR23","doi-asserted-by":"crossref","unstructured":"Sainath, T.N., Kingsbury, B., Mohamed, A.R., Saon, G., Ramabhadran, B.: Improvements to filterbank and delta learning within a deep neural network framework. In: Proceedings of the IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 6839\u20136843 (2014)","DOI":"10.1109\/ICASSP.2014.6854925"},{"key":"36_CR24","doi-asserted-by":"crossref","unstructured":"Sainath, T.N., Kingsbury, B., Ramabhadran, B., Fousek, P., Novak, P., Mohamed, A.R.: Making deep belief networks effective for large vocabulary continuous speech recognition. In: Proceedings of the IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU), pp. 30\u201335 (2011)","DOI":"10.1109\/ASRU.2011.6163900"},{"key":"36_CR25","doi-asserted-by":"crossref","unstructured":"Sainath, T.N., Weiss, R.J., Senior, A., Wilson, K.W., Vinyals, O.: Learning the speech front-end with raw waveform CLDNNs. In: Proceedings of the Annual Conference of the International Speech Communication Association (2015)","DOI":"10.21437\/Interspeech.2015-1"},{"key":"36_CR26","doi-asserted-by":"crossref","unstructured":"Salomon, J., King, S., Salomon, J.: Framewise phone classification using support vector machines. In: Proceedings of the International Conference on Spoken Language Processing (2002)","DOI":"10.21437\/ICSLP.2002-352"},{"key":"36_CR27","doi-asserted-by":"crossref","unstructured":"Schuller, B., Steidl, S., Batliner, A.: The INTERSPEECH 2009 emotion challenge. In: Proceedings of Interspeech (2009)","DOI":"10.21437\/Interspeech.2009-103"},{"key":"36_CR28","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"190","DOI":"10.1007\/978-3-540-71505-4_11","volume-title":"Progress in Nonlinear Speech Processing","author":"R Solera-Ure\u00f1a","year":"2007","unstructured":"Solera-Ure\u00f1a, R., Padrell-Sendra, J., Mart\u00edn-Iglesias, D., Gallardo-Antol\u00edn, A., Pel\u00e1ez-Moreno, C., D\u00edaz-de-Mar\u00eda, F.: SVMs for automatic speech recognition: a survey. In: Stylianou, Y., Faundez-Zanuy, M., Esposito, A. (eds.) Progress in Nonlinear Speech Processing. LNCS, vol. 4391, pp. 190\u2013216. Springer, Heidelberg (2007). https:\/\/doi.org\/10.1007\/978-3-540-71505-4_11"},{"issue":"1","key":"36_CR29","first-page":"1929","volume":"15","author":"N Srivastava","year":"2014","unstructured":"Srivastava, N., Hinton, G., Krizhevsky, A., Sutskever, I., Salakhutdinov, R.: Dropout: a simple way to prevent neural networks from overfitting. J. Mach. Learn. Res. 15(1), 1929\u20131958 (2014)","journal-title":"J. Mach. Learn. Res."},{"key":"36_CR30","unstructured":"Valentini-Botinhao, C., Degenkolb-Weyers, S., Maier, A., N\u00f6th, E., Eysholdt, U., Bocklet, T.: Automatic detection of sigmatism in children. In: Proceedings of the Workshop on Child, Computer Interaction (WOCCI) (2012)"},{"key":"36_CR31","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Chan, W., Jaitly, N.: Very deep convolutional networks for end-to-end speech recognition. In: 2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 4845\u20134849 (2017)","DOI":"10.1109\/ICASSP.2017.7953077"}],"container-title":["Lecture Notes in Computer Science","Progress in Artificial Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-30244-3_36","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,27]],"date-time":"2022-09-27T06:27:18Z","timestamp":1664260038000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-30244-3_36"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019]]},"ISBN":["9783030302436","9783030302443"],"references-count":31,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-30244-3_36","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2019]]},"assertion":[{"value":"30 August 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"EPIA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"EPIA Conference on Artificial Intelligence","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Vila Real","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Portugal","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2019","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"3 September 2019","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"6 September 2019","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"epia2019","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/epia2019.utad.pt\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"252","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"119","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"6","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"47% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.32","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1.86","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}