{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T17:20:08Z","timestamp":1778347208922,"version":"3.51.4"},"reference-count":37,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2023,6,26]],"date-time":"2023-06-26T00:00:00Z","timestamp":1687737600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,6,26]],"date-time":"2023-06-26T00:00:00Z","timestamp":1687737600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/100008990","name":"Universit\u00e9 de Lorraine","doi-asserted-by":"publisher","award":["18-CE36-0008-03"],"award-info":[{"award-number":["18-CE36-0008-03"]}],"id":[{"id":"10.13039\/100008990","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2023,7]]},"DOI":"10.1007\/s10772-023-10032-1","type":"journal-article","created":{"date-parts":[[2023,6,26]],"date-time":"2023-06-26T16:02:57Z","timestamp":1687795377000},"page":"521-530","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Stuttering detection using speaker representations and self-supervised contextual embeddings"],"prefix":"10.1007","volume":"26","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9822-8422","authenticated-orcid":false,"given":"Shakeel A.","family":"Sheikh","sequence":"first","affiliation":[]},{"given":"Md","family":"Sahidullah","sequence":"additional","affiliation":[]},{"given":"Fabrice","family":"Hirsch","sequence":"additional","affiliation":[]},{"given":"Slim","family":"Ouni","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,6,26]]},"reference":[{"key":"10032_CR1","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1016\/j.specom.2019.12.001","volume":"116","author":"MB Ak\u00e7ay","year":"2020","unstructured":"Ak\u00e7ay, M. B., & O\u01e7uz, K. (2020). Speech emotion recognition: Emotional models, databases, features, preprocessing methods, supporting modalities, and classifiers. Speech Communication, 116, 56\u201376.","journal-title":"Speech Communication"},{"key":"10032_CR2","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1016\/j.neunet.2021.01.026","volume":"138","author":"A Apicella","year":"2021","unstructured":"Apicella, A., et al. (2021). A survey on modern trainable activation functions. Neural Networks, 138, 14\u201332.","journal-title":"Neural Networks"},{"key":"10032_CR3","first-page":"12449","volume":"33","author":"A Baevski","year":"2020","unstructured":"Baevski, A., et al. (2020). Wav2vec 2.0: A framework for self-supervised learning of speech representations. Advances in Neural Information Processing Systems, 33, 12449\u201312460.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"10032_CR4","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2022.3155295","author":"L Barrett","year":"2022","unstructured":"Barrett, L., et al. (2022). Systematic review of machine learning approaches for detecting developmental stuttering. IEEE\/ACM Transactions on Audio, Speech, and Language Processing. https:\/\/doi.org\/10.1109\/TASLP.2022.3155295","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"key":"10032_CR5","doi-asserted-by":"crossref","unstructured":"Bayerl, S. P., Wagner, D., N\u00f6th, E., & Riedhammer, K. (2022) Detecting dysfluencies in stuttering therapy using wav2vec 2.0. In: Proc. Interspeech 2022.","DOI":"10.21437\/Interspeech.2022-10908"},{"key":"10032_CR6","doi-asserted-by":"crossref","unstructured":"Dawalatabad, N., et al. (2021) ECAPA-TDNN embeddings for speaker diarization. In: Proceedings of Interspeech 2021, (pp. 3560\u20133564).","DOI":"10.21437\/Interspeech.2021-941"},{"key":"10032_CR7","doi-asserted-by":"crossref","unstructured":"Desplanques, B., et al. (2019) ECAPA-TDNN: Emphasized channel attention, propagation and aggregation in TDNN based speaker verification. In: Proceedings of Interspeech 2020.","DOI":"10.21437\/Interspeech.2020-2650"},{"key":"10032_CR8","unstructured":"Duffy, J. (2019), Motor speech disorders E-book: Substrates, differential diagnosis, and management (4th ed). Elsevier Health Sciences."},{"key":"10032_CR9","volume-title":"Stuttering: An integrated approach to its nature and treatment","author":"B Guitar","year":"2019","unstructured":"Guitar, B. (2019). Stuttering: An integrated approach to its nature and treatment (5th ed.). Wolters Kluwer.","edition":"5"},{"key":"10032_CR10","doi-asserted-by":"crossref","unstructured":"Howell, P., Davis, S., Bartrip, J. (2009) The University College London Archive of Stuttered Speech (UCLASS). Journal of Speech, Language, and Hearing Research : JSLHR, 52(2), 556\u2013569.","DOI":"10.1044\/1092-4388(2009\/07-0129)"},{"key":"10032_CR11","volume-title":"Spoken language processing: A guide to theory, algorithm, and system development","author":"X Huang","year":"2001","unstructured":"Huang, X., Acero, A., Hon, H.-W., & Reddy, R. (2001). Spoken language processing: A guide to theory, algorithm, and system development. Prentice Hall PTR."},{"key":"10032_CR12","first-page":"208","volume":"39","author":"RJ Ingham","year":"1996","unstructured":"Ingham, R. J., et al. (1996). Functional-lesion investigation of developmental stuttering with positron emission tomography. JSHR, 39, 208\u201327.","journal-title":"JSHR"},{"key":"10032_CR13","unstructured":"Ioffe, S., & Szegedy, C. (2015) Batch normalization: Accelerating deep network training by reducing internal covariate shift. In: Proceedings of the 32nd ICML (Vol. 37, pp. 448\u2013456)."},{"key":"10032_CR14","doi-asserted-by":"crossref","unstructured":"Jouaiti, M., & Dautenhahn, K. (2022) Dysfluency classification in stuttered speech using deep learning for real-time applications. In: Proceedings of ICASSP 2022.","DOI":"10.1109\/ICASSP43922.2022.9746638"},{"key":"10032_CR15","unstructured":"Kehoe, T. D., et al. (2006) Speech language pathology-stuttering. Kiambo Ridge."},{"key":"10032_CR16","doi-asserted-by":"crossref","unstructured":"Kourkounakis, T., et al. (2020) Detecting multiple speech disfluencies using a deep residual network with bidirectional long short-term memory. In: Proceedings of ICASSP.","DOI":"10.1109\/ICASSP40776.2020.9053893"},{"key":"10032_CR17","doi-asserted-by":"publisher","first-page":"2986","DOI":"10.1109\/TASLP.2021.3110146","volume":"29","author":"T Kourkounakis","year":"2021","unstructured":"Kourkounakis, T., et al. (2021). FluentNet: End-to-end detection of stuttered speech disfluencies with deep learning. IEEE\/ACM Transactions on Audio, Speech, and Language Processing, 29, 2986\u20132999.","journal-title":"IEEE\/ACM Transactions on Audio, Speech, and Language Processing"},{"key":"10032_CR18","doi-asserted-by":"crossref","unstructured":"Lea, C., et al. (2021) SEP-28k: A dataset for stuttering event detection from podcasts with people who stutter. In: Proceedings of ICASSP (pp. 6798\u20136802).","DOI":"10.1109\/ICASSP39728.2021.9413520"},{"key":"10032_CR19","doi-asserted-by":"crossref","unstructured":"Li, H., et al. (2020). Speaker-invariant affective representation learning via adversarial training. In: Proceedings of ICASSP 2020 (pp. 7144\u20137148).","DOI":"10.1109\/ICASSP40776.2020.9054580"},{"key":"10032_CR20","doi-asserted-by":"crossref","unstructured":"Mohamed, A. et al. (2022) Self-supervised speech representation learning: A review. arXiv preprint arXiv:2205.10643.","DOI":"10.1109\/JSTSP.2022.3207050"},{"key":"10032_CR21","volume-title":"Machine learning: A probabilistic perspective","author":"KP Murphy","year":"2012","unstructured":"Murphy, K. P. (2012). Machine learning: A probabilistic perspective. MIT Press."},{"key":"10032_CR22","doi-asserted-by":"publisher","first-page":"19143","DOI":"10.1109\/ACCESS.2019.2896880","volume":"7","author":"AB Nassif","year":"2019","unstructured":"Nassif, A. B., et al. (2019). Speech recognition using deep neural networks: A systematic review. IEEE Access, 7, 19143\u201319165.","journal-title":"IEEE Access"},{"key":"10032_CR23","unstructured":"Paszke, A., et al.: PyTorch: An imperative style, high-performance deep learning library. In: Proceedings of advances in NIPS 2019 (pp. 8024\u20138035)."},{"key":"10032_CR24","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa, F., et al. (2011). Scikit-learn: Machine learning in Python. JMLR, 12, 2825\u20132830.","journal-title":"JMLR"},{"key":"10032_CR25","doi-asserted-by":"crossref","unstructured":"Pepino, L., et al. (2021) Emotion recognition from speech using wav2vec 2.0 embeddings. In: Proceedings of Interspeech 2021 (pp. 3400\u20133404).","DOI":"10.21437\/Interspeech.2021-703"},{"key":"10032_CR26","unstructured":"Ravanelli, M., et al. (2021) SpeechBrain: A general-purpose speech toolkit. arXiv:2106.04624."},{"key":"10032_CR27","doi-asserted-by":"crossref","unstructured":"Schuller, B. W., et al. (2022) The ACM Multimedia 2022 computational paralinguistics challenge: Vocalisations, stuttering, activity, & mosquitos. In: Proceedings of ACM Multimedia 2022, Lisbon, Portugal.","DOI":"10.1145\/3503161.3551591"},{"key":"10032_CR33","unstructured":"Sheikh, S. A. (2023) Deep learning for stuttering detection, PhD thesis, Universit\u00e9 de Lorraine."},{"key":"10032_CR28","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2107.04057","author":"SA Sheikh","year":"2021","unstructured":"Sheikh, S. A., Sahidullah, M., Hirsch, F., & Ouni, S. (2021a). Machine learning for stuttering identification: Review, challenges & future directions. Neurocomputing. https:\/\/doi.org\/10.48550\/arXiv.2107.04057","journal-title":"Neurocomputing"},{"key":"10032_CR29","doi-asserted-by":"crossref","unstructured":"Sheikh, S. A., Sahidullah, M., Hirsch, F., & Ouni, S. (2021b) StutterNet: Stuttering detection using time delay neural network. In: Proceedings of 29th EUSIPCO (pp. 426\u2013430).","DOI":"10.23919\/EUSIPCO54536.2021.9616063"},{"key":"10032_CR30","doi-asserted-by":"crossref","unstructured":"Sheikh, S. A., Sahidullah, M., Hirsch, F., & Ouni, S. (2022a) End-to-end and self-supervised learning for ComParE 2022 stuttering sub-challenge. In: Proceedings of ACM Multimedia.","DOI":"10.1145\/3503161.3551588"},{"key":"10032_CR31","doi-asserted-by":"crossref","unstructured":"Sheikh, S. A., Sahidullah, M., Hirsch, F., & Ouni, S. (2022b) Robust stuttering detection via multi-task and adversarial learning. In: Proceedings of 30th EUSIPCO.","DOI":"10.23919\/EUSIPCO55093.2022.9909644"},{"key":"10032_CR32","doi-asserted-by":"publisher","DOI":"10.1109\/JBHI.2023.3248281","author":"SA Sheikh","year":"2023","unstructured":"Sheikh, S. A., Sahidullah, M., Hirsch, F., & Ouni, S. (2023). Advancing stuttering detection via data augmentation, class-balanced loss and multi-contextual deep learning. IEEE Journal of Biomedical and Health Informatics. https:\/\/doi.org\/10.1109\/JBHI.2023.3248281","journal-title":"IEEE Journal of Biomedical and Health Informatics"},{"issue":"9","key":"10032_CR34","first-page":"2483","volume":"60","author":"A Smith","year":"2017","unstructured":"Smith, A., & Weber, C. (2017). How stuttering develops: The multifactorial dynamic pathways theory. JSLHR, 60(9), 2483\u20132505.","journal-title":"JSLHR"},{"issue":"56","key":"10032_CR35","first-page":"1929","volume":"15","author":"N Srivastava","year":"2014","unstructured":"Srivastava, N., Hinton, G., Krizhevsky, A., Sutskever, I., & Salakhutdinov, R. (2014). Dropout: A simple way to prevent neural networks from overfitting. JMLR, 15(56), 1929\u20131958.","journal-title":"JMLR"},{"issue":"11","key":"10032_CR36","first-page":"2579","volume":"9","author":"L Van der Maaten","year":"2008","unstructured":"Van der Maaten, L., & Hinton, G. (2008). Visualizing data using t-SNE. Journal of Machine Learning Research, 9(11), 2579\u20132605.","journal-title":"Journal of Machine Learning Research"},{"key":"10032_CR37","volume-title":"Stuttering and cluttering: Frameworks for understanding and treatment","author":"D Ward","year":"2018","unstructured":"Ward, D. (2018). Stuttering and cluttering: Frameworks for understanding and treatment (2nd ed.). Psychology Press.","edition":"2"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-023-10032-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10772-023-10032-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-023-10032-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,31]],"date-time":"2023-07-31T11:20:24Z","timestamp":1690802424000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10772-023-10032-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,26]]},"references-count":37,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2023,7]]}},"alternative-id":["10032"],"URL":"https:\/\/doi.org\/10.1007\/s10772-023-10032-1","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"value":"1381-2416","type":"print"},{"value":"1572-8110","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,6,26]]},"assertion":[{"value":"8 October 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 May 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 June 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}