{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T10:01:26Z","timestamp":1780999286426,"version":"3.54.1"},"publisher-location":"Singapore","reference-count":46,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819573936","type":"print"},{"value":"9789819573943","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-981-95-7394-3_18","type":"book-chapter","created":{"date-parts":[[2026,5,10]],"date-time":"2026-05-10T23:42:36Z","timestamp":1778456556000},"page":"260-271","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["A Comparative Study of\u00a0ASRs, LLMs, and\u00a0Few-Shot Learning for\u00a0Emotion Recognition in\u00a0Tunisian Dialect"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-0677-7458","authenticated-orcid":false,"given":"Latifa","family":"Iben Nasr","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1868-1185","authenticated-orcid":false,"given":"Ismail","family":"Badache","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5987-8876","authenticated-orcid":false,"given":"Abir","family":"Masmoudi","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4868-657X","authenticated-orcid":false,"given":"Lamia Hadrich","family":"Belguith","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2026,5,1]]},"reference":[{"key":"18_CR1","doi-asserted-by":"crossref","unstructured":"Sallam, M., et al.: Chinese generative AI models (DeepSeek and Qwen) rival ChatGPT-4 in ophthalmology queries with excellent performance in Arabic and English. Narra J. 5(1), e2371 (2025)","DOI":"10.52225\/narra.v5i1.2371"},{"key":"18_CR2","unstructured":"Wang, Y., et al.: Is human-like text liked by humans? Multilingual human detection and preference against AI. arXiv preprint arXiv:2502.11614 (2025)"},{"key":"18_CR3","doi-asserted-by":"crossref","unstructured":"Fsih, E., Boujelbane, R., Belguith, L.H.: Resources building for sentiment analysis of content disseminated by Tunisian medias in social networks. Lang. Resour. Eval., 1\u201326 (2023)","DOI":"10.21203\/rs.3.rs-2035344\/v1"},{"key":"18_CR4","doi-asserted-by":"crossref","unstructured":"Bojic, L., et al.: Evaluating large language models against human annotators in latent content analysis: sentiment, political leaning, emotional intensity, and sarcasm. arXiv preprint arXiv:2501.02532 (2025)","DOI":"10.1038\/s41598-025-96508-3"},{"key":"18_CR5","doi-asserted-by":"crossref","unstructured":"Duret, J., Rouvier, M., Est\u00e8ve, Y.: MSP-podcast SER challenge 2024: L\u2019antenne du Ventoux multimodal self-supervised learning for speech emotion recognition. arXiv preprint arXiv:2407.05746 (2024)","DOI":"10.21437\/odyssey.2024-44"},{"issue":"5","key":"18_CR6","doi-asserted-by":"publisher","first-page":"440","DOI":"10.1007\/s42979-024-02775-8","volume":"5","author":"E Boughariou","year":"2024","unstructured":"Boughariou, E., Bahou, Y., Belguith, L.H.: Detecting speech disorders using a machine-learning guided method in spontaneous Tunisian dialect speech. SN Comput. Sci. 5(5), 440 (2024)","journal-title":"SN Comput. Sci."},{"key":"18_CR7","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.specom.2022.03.002","volume":"140","author":"BT Atmaja","year":"2022","unstructured":"Atmaja, B.T., Sasou, A., Akagi, M.: Survey on bimodal speech emotion recognition from acoustic and linguistic information fusion. Speech Commun. 140, 11\u201328 (2022)","journal-title":"Speech Commun."},{"key":"18_CR8","doi-asserted-by":"publisher","first-page":"127081","DOI":"10.1109\/ACCESS.2021.3110992","volume":"9","author":"RH Aljuhani","year":"2021","unstructured":"Aljuhani, R.H., Alshutayri, A., Alahdal, S.: Arabic speech emotion recognition from Saudi dialect corpus. IEEE Access 9, 127081\u2013127085 (2021)","journal-title":"IEEE Access"},{"issue":"2","key":"18_CR9","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3708340","volume":"24","author":"L Ibn Nasr","year":"2025","unstructured":"Ibn Nasr, L., Masmoudi, A., Hadrich Belguith, L.: Emotion recognition from spontaneous Tunisian dialect speech. ACM Trans. Asian Low-Resour. Lang. Inf. Process. 24(2), 1\u201316 (2025)","journal-title":"ACM Trans. Asian Low-Resour. Lang. Inf. Process."},{"key":"18_CR10","doi-asserted-by":"crossref","unstructured":"Besdouri, F.Z., Zribi, I., Belguith, L.H.: Challenges and progress in developing speech recognition systems for dialectal Arabic. Speech Commun., 103110 (2024)","DOI":"10.1016\/j.specom.2024.103110"},{"key":"18_CR11","first-page":"11","volume":"8","author":"M Meddeb","year":"2016","unstructured":"Meddeb, M., Karray, H., Alimi, A.M.: Automated extraction of features from Arabic emotional speech corpus. Int. J. Comput. Inf. Syst. Ind. Manage. Appl. 8, 11 (2016)","journal-title":"Int. J. Comput. Inf. Syst. Ind. Manage. Appl."},{"key":"18_CR12","unstructured":"Messaoudi, A., Haddad, H., Hmida, M.B., Graiet, M.: TuniSER: toward a Tunisian Speech Emotion Recognition System. In: Proceedings of the 5th International Conference on Natural Language and Speech Processing (ICNLSP 2022), pp. 234\u2013241 (2022)"},{"key":"18_CR13","doi-asserted-by":"crossref","unstructured":"Xu, Y., Zhou, Y., Cai, Y., Xie, J., Ye, R., Wu, Z.: Multimodal emotion captioning using large language model with prompt engineering. In: Proceedings of the 2nd International Workshop on Multimodal and Responsible Affective Computing, pp. 104\u2013109 (2024)","DOI":"10.1145\/3689092.3689403"},{"key":"18_CR14","doi-asserted-by":"crossref","unstructured":"Bellver, J., et al.: Multimodal audio-language model for speech emotion recognition. Proc. Odyssey 2024 (2024)","DOI":"10.21437\/odyssey.2024-41"},{"key":"18_CR15","unstructured":"Nasr, L. I., Masmoudi, A., Belguith, L.H.: Tunisian dialect speech corpus: construction and emotion annotation"},{"key":"18_CR16","doi-asserted-by":"crossref","unstructured":"Guanxiong, P., et al.: Affective computing: recent advances, challenges, and future trends. Intell. Comput. 3, 0076 (2024)","DOI":"10.34133\/icomputing.0076"},{"issue":"7","key":"18_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3544558","volume":"55","author":"M Bayer","year":"2022","unstructured":"Bayer, M., Kaufhold, M.A., Reuter, C.: A survey on data augmentation for text classification. ACM Comput. Surv. 55(7), 1\u201339 (2022)","journal-title":"ACM Comput. Surv."},{"key":"18_CR18","doi-asserted-by":"crossref","unstructured":"Haddad, H., et al.: TunBERT: pretraining BERT for Tunisian dialect understanding. SN Comput. Sci. 4(2), 194 (2023)","DOI":"10.1007\/s42979-022-01541-y"},{"key":"18_CR19","doi-asserted-by":"publisher","first-page":"1408845","DOI":"10.3389\/frai.2024.1408845","volume":"7","author":"W Alosaimi","year":"2024","unstructured":"Alosaimi, W., et al.: ArabBert-LSTM: improving Arabic sentiment analysis based on transformer model and long short-term memory. Front. Artif. Intell. 7, 1408845 (2024)","journal-title":"Front. Artif. Intell."},{"key":"18_CR20","doi-asserted-by":"crossref","unstructured":"Zaraket, F.A., Jaber, A.: MATAR: morphology-based tagger for Arabic. In: 2013 ACS International Conference on Computer Systems and Applications (AICCSA), pp. 1\u20134. IEEE (2013)","DOI":"10.1109\/AICCSA.2013.6616418"},{"key":"18_CR21","doi-asserted-by":"crossref","unstructured":"Gugliotta, E., Dinarelli, M.: TARC: Tunisian Arabish corpus first complete release. arXiv preprint arXiv:2207.04796 (2022)","DOI":"10.63317\/5eqrikasc4rn"},{"key":"18_CR22","doi-asserted-by":"crossref","unstructured":"Mdhaffar, S., Bougares, F., Esteve, Y., Hadrich-Belguith, L.: Sentiment analysis of tunisian dialects: Linguistic ressources and experiments. In: Third Arabic natural language processing workshop (WANLP), pp. 55\u201361 (2017)","DOI":"10.18653\/v1\/W17-1307"},{"key":"18_CR23","unstructured":"Chaudhury, R., Godbole, M., Garg, A., Seo, J.H.: Humane speech synthesis through zero-shot emotion and disfluency generation. arXiv preprint arXiv:2404.01339 (2024)"},{"key":"18_CR24","doi-asserted-by":"crossref","unstructured":"Gong, T., Belanich, J., Somandepalli, K., Nagrani, A., Eoff, B., Jou, B.: Lanser: language-model supported speech emotion recognition. arXiv preprint arXiv:2309.03978 (2023)","DOI":"10.21437\/Interspeech.2023-1832"},{"key":"18_CR25","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1007\/s10579-017-9402-y","volume":"52","author":"A Masmoudi","year":"2018","unstructured":"Masmoudi, A., Bougares, F., Ellouze, M., Est\u00e8ve, Y., Belguith, L.: Automatic speech recognition system for Tunisian dialect. Lang. Resour. Eval. 52, 249\u2013267 (2018)","journal-title":"Lang. Resour. Eval."},{"key":"18_CR26","unstructured":"Antoun, W., Baly, F., Hajj, H.: AraGPT2: pre-trained transformer for Arabic language generation. arXiv preprint arXiv:2012.15520 (2020)"},{"key":"18_CR27","doi-asserted-by":"publisher","unstructured":"Turki, H., et al.: Normalized orthography for Tunisian Arabic. In: International Conference on Language Processing and Knowledge Management, pp. 133\u2013142. Springer Nature Switzerland, Cham. https:\/\/doi.org\/10.1007\/978-3-031-85067-7_13","DOI":"10.1007\/978-3-031-85067-7_13"},{"key":"18_CR28","unstructured":"Hamed, I., Sabty, C., Abdennadher, S., Vu, N.T., Solorio, T., Habash, N.: A survey of code-switched Arabic NLP: progress, challenges, and future directions. arXiv preprint arXiv:2501.13419 (2025)"},{"issue":"1","key":"18_CR29","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1007\/s10772-024-10088-7","volume":"27","author":"L Iben Nasr","year":"2024","unstructured":"Iben Nasr, L., Masmoudi, A., Hadrich Belguith, L.: Survey on Arabic speech emotion recognition. Int. J. Speech Technol. 27(1), 53\u201368 (2024)","journal-title":"Int. J. Speech Technol."},{"key":"18_CR30","doi-asserted-by":"crossref","unstructured":"Zribi, I., Ellouze, M., Belguith, L.H., Blache, P.: Spoken Tunisian Arabic corpus \u201cSTAC\u201d: transcription and annotation. Res. Comput. Sci. 90, 123\u2013135 (2015)","DOI":"10.13053\/rcs-90-1-9"},{"key":"18_CR31","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.neucom.2023.01.002","volume":"528","author":"J de Lope","year":"2023","unstructured":"de Lope, J., Gra\u00f1a, M.: An ongoing review of speech emotion recognition. Neurocomputing 528, 1\u201311 (2023)","journal-title":"Neurocomputing"},{"key":"18_CR32","unstructured":"Sharma, V.: Speech and text-based emotion recognizer. arXiv preprint arXiv:2312.11503 (2023)"},{"key":"18_CR33","doi-asserted-by":"crossref","unstructured":"Padi, S., Sadjadi, S.O., Manocha, D., Sriram, R.D.: Multimodal emotion recognition using transfer learning from speaker recognition and BERT-based models. arXiv preprint arXiv:2202.08974 (2022)","DOI":"10.21437\/Odyssey.2022-57"},{"key":"18_CR34","doi-asserted-by":"publisher","first-page":"94557","DOI":"10.1109\/ACCESS.2021.3092735","volume":"9","author":"S Lee","year":"2021","unstructured":"Lee, S., Han, D.K., Ko, H.: Multimodal emotion recognition fusion analysis adapting BERT with heterogeneous feature unification. IEEE Access 9, 94557\u201394572 (2021)","journal-title":"IEEE Access"},{"key":"18_CR35","unstructured":"Macary, M., Tahon, M., Est\u00e8ve, Y., Luzzati, D.: Acoustic and linguistic representations for speech continuous emotion recognition in call center conversations. arXiv preprint arXiv:2310.04481 (2023)"},{"key":"18_CR36","doi-asserted-by":"crossref","unstructured":"Rybak, P.: Transferring BERT capabilities from high-resource to low-resource languages using vocabulary matching. arXiv preprint arXiv:2402.14408 (2024)","DOI":"10.63317\/58uhrwywiqyc"},{"key":"18_CR37","unstructured":"Zhang, E., Poellabauer, C.: Contextual speech emotion recognition with large language models and ASR-based transcriptions. In: Audio Imagination: NeurIPS 2024 Workshop AI-Driven Speech, Music, and Sound Generation"},{"key":"18_CR38","doi-asserted-by":"crossref","unstructured":"Santoso, J., Ishizuka, K., Hashimoto, T.: Large language model-based emotional speech annotation using context and acoustic feature for speech emotion recognition. In ICASSP 2024-2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 11026\u201311030. IEEE (2024)","DOI":"10.1109\/ICASSP48485.2024.10448316"},{"key":"18_CR39","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2023.103005","volume":"155","author":"N Al Roken","year":"2023","unstructured":"Al Roken, N., Barlas, G.: Multimodal Arabic emotion recognition using deep learning. Speech Commun. 155, 103005 (2023)","journal-title":"Speech Commun."},{"issue":"18","key":"18_CR40","doi-asserted-by":"publisher","first-page":"9188","DOI":"10.3390\/app12189188","volume":"12","author":"BB Al-onazi","year":"2022","unstructured":"Al-onazi, B.B., Nauman, M.A., Jahangir, R., Malik, M.M., Alkhammash, E.H., Elshewey, A.M.: Transformer-based multilingual speech emotion recognition using data augmentation and feature fusion. Appl. Sci. 12(18), 9188 (2022)","journal-title":"Appl. Sci."},{"key":"18_CR41","doi-asserted-by":"crossref","unstructured":"Tajalsir, M., Hernandez, S.M., Mohammed, F.A.: ASERS-LSTM: Arabic speech emotion recognition system based on LSTM model. Int. J. Sig. Image Process. (2022)","DOI":"10.5121\/sipij.2022.13102"},{"key":"18_CR42","unstructured":"Naouara, H., Lorr\u00e9, J.P., Louradour, J.: LinTO audio and textual datasets to train and evaluate automatic speech recognition in Tunisian Arabic dialect. arXiv preprint arXiv:2504.02604 (2025)"},{"issue":"2","key":"18_CR43","doi-asserted-by":"publisher","first-page":"20737","DOI":"10.48084\/etasr.9584","volume":"15","author":"M Zouidine","year":"2025","unstructured":"Zouidine, M., Khalil, M.: Large language models for Arabic sentiment analysis and machine translation. Eng. Technol. Appl. Sci. Res. 15(2), 20737\u201320742 (2025)","journal-title":"Eng. Technol. Appl. Sci. Res."},{"key":"18_CR44","unstructured":"Peng, B., Li, C., He, P., Galley, M., Gao, J.: Instruction tuning with GPT-4. arXiv preprint arXiv:2304.03277 (2023)"},{"key":"18_CR45","unstructured":"James, J., Gopinath, D.P.: Advocating character error rate for multilingual ASR evaluation. arXiv preprint arXiv:2410.07400 (2024)"},{"key":"18_CR46","unstructured":"Chebotarova, I.: Intelligent text recognition when creating audio books for blind people (2024)"}],"container-title":["Lecture Notes in Computer Science","Web Information Systems Engineering - WISE 2025"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-95-7394-3_18","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T09:32:37Z","timestamp":1780997557000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-95-7394-3_18"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9789819573936","9789819573943"],"references-count":46,"URL":"https:\/\/doi.org\/10.1007\/978-981-95-7394-3_18","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"1 May 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"WISE","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Web Information Systems Engineering","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Marrakech","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Morocco","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15 December 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17 December 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"wise2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/wise2025.ficloud.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}