{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T17:46:51Z","timestamp":1772905611785,"version":"3.50.1"},"publisher-location":"Cham","reference-count":43,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783031060175","type":"print"},{"value":"9783031060182","type":"electronic"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-06018-2_6","type":"book-chapter","created":{"date-parts":[[2022,6,15]],"date-time":"2022-06-15T23:05:23Z","timestamp":1655334323000},"page":"79-94","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Multimodal Data Fusion for Automatic Detection of Alzheimer\u2019s Disease"],"prefix":"10.1007","author":[{"given":"Ivan","family":"Krstev","sequence":"first","affiliation":[]},{"given":"Milan","family":"Pavikjevikj","sequence":"additional","affiliation":[]},{"given":"Martina","family":"Toshevska","sequence":"additional","affiliation":[]},{"given":"Sonja","family":"Gievska","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,6,16]]},"reference":[{"key":"6_CR1","doi-asserted-by":"crossref","unstructured":"Akbik, A., Bergmann, T., Vollgraf, R.: Pooled contextualized embeddings for named entity recognition. In: NAACL 2019, 2019 Annual Conference of the North American Chapter of the Association for Computational Linguistics, pp. 724\u2013728 (2019)","DOI":"10.18653\/v1\/N19-1078"},{"key":"6_CR2","unstructured":"Akbik, A., Blythe, D., Vollgraf, R.: Contextual string embeddings for sequence labeling. In: COLING 2018, 27th International Conference on Computational Linguistics, pp. 1638\u20131649 (2018)"},{"key":"6_CR3","doi-asserted-by":"publisher","first-page":"260","DOI":"10.1016\/j.cortex.2019.12.002","volume":"124","author":"RS Alyahya","year":"2020","unstructured":"Alyahya, R.S., Halai, A.D., Conroy, P., Ralph, M.A.L.: Mapping psycholinguistic features to the neuropsychological and lesion profiles in aphasia. Cortex 124, 260\u2013273 (2020)","journal-title":"Cortex"},{"key":"6_CR4","first-page":"12449","volume":"33","author":"A Baevski","year":"2020","unstructured":"Baevski, A., Zhou, Y., Mohamed, A., Auli, M.: wav2vec 2.0: a framework for self-supervised learning of speech representations. Adv. Neural Inf. Process. Syst. 33, 12449\u201312460 (2020)","journal-title":"Adv. Neural Inf. Process. Syst."},{"issue":"6","key":"6_CR5","doi-asserted-by":"publisher","first-page":"585","DOI":"10.1001\/archneur.1994.00540180063015","volume":"51","author":"JT Becker","year":"1994","unstructured":"Becker, J.T., Boiler, F., Lopez, O.L., Saxton, J., McGonigle, K.L.: The natural history of Alzheimer\u2019s disease: description of study cohort and accuracy of diagnosis. Arch. Neurol. 51(6), 585\u2013594 (1994)","journal-title":"Arch. Neurol."},{"issue":"1","key":"6_CR6","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1080\/026870300401603","volume":"14","author":"RS Bucks","year":"2000","unstructured":"Bucks, R.S., Singh, S., Cuerden, J.M., Wilcock, G.K.: Analysis of spontaneous, conversational speech in dementia of Alzheimer type: evaluation of an objective technique for analysing lexical performance. Aphasiology 14(1), 71\u201391 (2000)","journal-title":"Aphasiology"},{"key":"6_CR7","unstructured":"Clark, K., Luong, M., Le, Q.V., Manning, C.D.: ELECTRA: pre-training text encoders as discriminators rather than generators. CoRR abs\/2003.10555 (2020). https:\/\/arxiv.org\/abs\/2003.10555"},{"key":"6_CR8","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.J., Li, K., Fei-Fei, L.: ImageNet: a large-scale hierarchical image database. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 248\u2013255. IEEE (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"6_CR9","unstructured":"Devlin, J., Chang, M., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. CoRR abs\/1810.04805 (2018). http:\/\/arxiv.org\/abs\/1810.04805"},{"key":"6_CR10","doi-asserted-by":"crossref","unstructured":"Eyben, F., W\u00f6llmer, M., Schuller, B.: OpenSmile: the Munich versatile and fast open-source audio feature extractor. In: Proceedings of the 18th ACM International Conference on Multimedia, pp. 1459\u20131462 (2010)","DOI":"10.1145\/1873951.1874246"},{"key":"6_CR11","doi-asserted-by":"publisher","unstructured":"Gauder, L., Pepino, L., Ferrer, L., Riera, P.: Alzheimer disease recognition using speech-based embeddings from pre-trained models. In: Proceedings of Interspeech 2021, pp. 3795\u20133799 (2021). https:\/\/doi.org\/10.21437\/Interspeech.2021-753","DOI":"10.21437\/Interspeech.2021-753"},{"key":"6_CR12","doi-asserted-by":"crossref","unstructured":"Gievska, S., Koroveshovski, K.: The impact of affective verbal content on predicting personality impressions in YouTube videos. In: Proceedings of the 2014 ACM Multi Media on Workshop on Computational Personality Recognition, pp. 19\u201322 (2014)","DOI":"10.1145\/2659522.2659529"},{"issue":"5800","key":"6_CR13","doi-asserted-by":"publisher","first-page":"777","DOI":"10.1126\/science.1132814","volume":"314","author":"M Goedert","year":"2006","unstructured":"Goedert, M., Spillantini, M.G.: A century of Alzheimer\u2019s disease. Science 314(5800), 777\u2013781 (2006)","journal-title":"Science"},{"key":"6_CR14","volume-title":"BDAE: The Boston Diagnostic Aphasia Examination","author":"H Goodglass","year":"2001","unstructured":"Goodglass, H., Kaplan, E., Weintraub, S.: BDAE: The Boston Diagnostic Aphasia Examination. Lippincott Williams & Wilkins, Philadelphia (2001)"},{"key":"6_CR15","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"2","key":"6_CR16","doi-asserted-by":"publisher","first-page":"108","DOI":"10.3390\/info11020108","volume":"11","author":"J Howard","year":"2020","unstructured":"Howard, J., Gugger, S.: FastAI: a layered API for deep learning. Information 11(2), 108 (2020)","journal-title":"Information"},{"issue":"1","key":"6_CR17","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41598-020-78888-w","volume":"10","author":"SC Huang","year":"2020","unstructured":"Huang, S.C., Pareek, A., Zamanian, R., Banerjee, I., Lungren, M.P.: Multimodal fusion with deep neural networks for leveraging CT imaging and electronic health record: a case-study in pulmonary embolism detection. Sci. Rep. 10(1), 1\u20139 (2020)","journal-title":"Sci. Rep."},{"key":"6_CR18","unstructured":"Iandola, F.N., Moskewicz, M.W., Ashraf, K., Han, S., Dally, W.J., Keutzer, K.: SqueezeNet: AlexNet-level accuracy with 50x fewer parameters and $$<$$1mb model size. CoRR abs\/1602.07360 (2016). http:\/\/arxiv.org\/abs\/1602.07360"},{"key":"6_CR19","doi-asserted-by":"crossref","unstructured":"Joulin, A., Grave, E., Mikolov, P.B.T.: Bag of tricks for efficient text classification (2016)","DOI":"10.18653\/v1\/E17-2068"},{"issue":"11","key":"6_CR20","doi-asserted-by":"publisher","first-page":"1097","DOI":"10.1001\/archneur.1985.04060100083029","volume":"42","author":"ZS Khachaturian","year":"1985","unstructured":"Khachaturian, Z.S.: Diagnosis of Alzheimer\u2019s disease. Arch. Neurol. 42(11), 1097\u20131105 (1985)","journal-title":"Arch. Neurol."},{"key":"6_CR21","unstructured":"Lundberg, S.M., Lee, S.I.: A unified approach to interpreting model predictions. In: Proceedings of the 31st International Conference on Neural Information Processing Systems, pp. 4768\u20134777 (2017)"},{"key":"6_CR22","doi-asserted-by":"crossref","unstructured":"Luz, S., Haider, F., de la Fuente, S., Fromm, D., MacWhinney, B.: Alzheimer\u2019s dementia recognition through spontaneous speech: the adress challenge. arXiv preprint arXiv:2004.06833 (2020)","DOI":"10.21437\/Interspeech.2020-2571"},{"key":"6_CR23","doi-asserted-by":"publisher","unstructured":"Luz, S., Haider, F., de la Fuente, S., Fromm, D., MacWhinney, B.: Detecting cognitive decline using speech only: the ADReSSo challenge. In: Proceedings of Interspeech 2021, pp. 3780\u20133784 (2021). https:\/\/doi.org\/10.21437\/Interspeech.2021-1220","DOI":"10.21437\/Interspeech.2021-1220"},{"key":"6_CR24","doi-asserted-by":"crossref","unstructured":"Martinc, M., Pollak, S.: Tackling the ADReSS challenge: a multimodal approach to the automated recognition of Alzheimer\u2019s dementia. In: INTERSPEECH, pp. 2157\u20132161 (2020)","DOI":"10.21437\/Interspeech.2020-2202"},{"key":"6_CR25","doi-asserted-by":"publisher","unstructured":"McFee, B., et al.: Thassilo: librosa\/librosa: 0.8.1rc2, May 2021. https:\/\/doi.org\/10.5281\/zenodo.4792298","DOI":"10.5281\/zenodo.4792298"},{"issue":"4","key":"6_CR26","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/BF02686918","volume":"14","author":"A Mehrabian","year":"1996","unstructured":"Mehrabian, A.: Pleasure-arousal-dominance: a general framework for describing and measuring individual differences in temperament. Curr. Psychol. 14(4), 261\u2013292 (1996)","journal-title":"Curr. Psychol."},{"issue":"7266","key":"6_CR27","doi-asserted-by":"publisher","first-page":"895","DOI":"10.1038\/461895a","volume":"461","author":"L Mucke","year":"2009","unstructured":"Mucke, L.: Alzheimer\u2019s disease. Nature 461(7266), 895\u2013897 (2009)","journal-title":"Nature"},{"key":"6_CR28","doi-asserted-by":"crossref","unstructured":"Pan, Y., et al.: Using the outputs of different automatic speech recognition paradigms for acoustic-and BERT-based Alzheimer\u2019s dementia detection through spontaneous speech. In: Proceedings of Interspeech, pp. 3810\u20133814 (2021)","DOI":"10.21437\/Interspeech.2021-1519"},{"key":"6_CR29","doi-asserted-by":"crossref","unstructured":"Pennington, J., Socher, R., Manning, C.D.: GloVe: global vectors for word representation. In: Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 1532\u20131543 (2014)","DOI":"10.3115\/v1\/D14-1162"},{"key":"6_CR30","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1016\/j.inffus.2017.02.003","volume":"37","author":"S Poria","year":"2017","unstructured":"Poria, S., Cambria, E., Bajpai, R., Hussain, A.: A review of affective computing: from unimodal analysis to multimodal fusion. Inf. Fusion 37, 98\u2013125 (2017)","journal-title":"Inf. Fusion"},{"key":"6_CR31","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1016\/j.neucom.2015.01.095","volume":"174","author":"S Poria","year":"2016","unstructured":"Poria, S., Cambria, E., Howard, N., Huang, G.B., Hussain, A.: Fusing audio, visual and textual clues for sentiment analysis from multimodal content. Neurocomputing 174, 50\u201359 (2016)","journal-title":"Neurocomputing"},{"key":"6_CR32","doi-asserted-by":"crossref","unstructured":"Poria, S., Chaturvedi, I., Cambria, E., Hussain, A.: Convolutional MKL based multimodal emotion recognition and sentiment analysis. In: 2016 IEEE 16th International Conference on Data Mining (ICDM), pp. 439\u2013448. IEEE (2016)","DOI":"10.1109\/ICDM.2016.0055"},{"key":"6_CR33","doi-asserted-by":"publisher","unstructured":"P\u00e9rez-Toro, P., et al.: Influence of the interviewer on the automatic assessment of Alzheimer\u2019s disease in the context of the ADReSSo challenge. In: Proceedings of Interspeech 2021, pp. 3785\u20133789 (2021). https:\/\/doi.org\/10.21437\/Interspeech.2021-1589","DOI":"10.21437\/Interspeech.2021-1589"},{"key":"6_CR34","doi-asserted-by":"crossref","unstructured":"Reimers, N., Gurevych, I.: Sentence-BERT: sentence embeddings using Siamese BERT-networks. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing. Association for Computational Linguistics, November 2019. https:\/\/arxiv.org\/abs\/1908.10084","DOI":"10.18653\/v1\/D19-1410"},{"key":"6_CR35","doi-asserted-by":"crossref","unstructured":"Sarawgi, U., Zulfikar, W., Soliman, N., Maes, P.: Multimodal inductive transfer learning for detection of Alzheimer\u2019s dementia and its severity. arXiv preprint arXiv:2009.00700 (2020)","DOI":"10.21437\/Interspeech.2020-3137"},{"issue":"1","key":"6_CR36","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s13721-020-0226-0","volume":"9","author":"A Shrestha","year":"2020","unstructured":"Shrestha, A., Serra, E., Spezzano, F.: Multi-modal social and psycho-linguistic embedding via recurrent neural networks to identify depressed users in online forums. Netw. Model. Anal. Health Inform. Bioinform. 9(1), 1\u201311 (2020). https:\/\/doi.org\/10.1007\/s13721-020-0226-0","journal-title":"Netw. Model. Anal. Health Inform. Bioinform."},{"key":"6_CR37","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. In: Bengio, Y., LeCun, Y. (eds.) 3rd International Conference on Learning Representations, ICLR 2015, San Diego, CA, USA, 7\u20139 May 2015, Conference Track Proceedings (2015). http:\/\/arxiv.org\/abs\/1409.1556"},{"issue":"1S","key":"6_CR38","doi-asserted-by":"publisher","first-page":"491","DOI":"10.1044\/2020_AJSLP-19-00093","volume":"30","author":"BC Stark","year":"2021","unstructured":"Stark, B.C., et al.: Standardizing assessment of spoken discourse in aphasia: a working group with deliverables. Am. J. Speech Lang. Pathol. 30(1S), 491\u2013502 (2021)","journal-title":"Am. J. Speech Lang. Pathol."},{"issue":"s2","key":"6_CR39","doi-asserted-by":"publisher","first-page":"S527","DOI":"10.3233\/JAD-2010-100501","volume":"20","author":"J Vina","year":"2010","unstructured":"Vina, J., Lloret, A.: Why women have more Alzheimer\u2019s disease than men: gender and mitochondrial toxicity of amyloid-$$\\beta $$ peptide. J. Alzheimers Dis. 20(s2), S527\u2013S533 (2010)","journal-title":"J. Alzheimers Dis."},{"key":"6_CR40","doi-asserted-by":"publisher","unstructured":"Wang, N., Cao, Y., Hao, S., Shao, Z., Subbalakshmi, K.: Modular multi-modal attention network for Alzheimer\u2019s disease detection using patient audio and language data. In: Proceedings of Interspeech 2021, pp. 3835\u20133839 (2021). https:\/\/doi.org\/10.21437\/Interspeech.2021-2024","DOI":"10.21437\/Interspeech.2021-2024"},{"key":"6_CR41","doi-asserted-by":"crossref","first-page":"327","DOI":"10.1002\/alz.12328","volume":"17","author":"J Wiley","year":"2021","unstructured":"Wiley, J.: Alzheimer\u2019s disease facts and figures. Alzheimers Dement. 17, 327\u2013406 (2021)","journal-title":"Alzheimers Dement."},{"key":"6_CR42","doi-asserted-by":"crossref","unstructured":"Zhou, G., Wang, J., Zhang, X., Yu, G.: DeepGOA: predicting gene ontology annotations of proteins via graph convolutional network. In: 2019 IEEE International Conference on Bioinformatics and Biomedicine (BIBM), pp. 1836\u20131841. IEEE (2019)","DOI":"10.1109\/BIBM47256.2019.8983075"},{"key":"6_CR43","doi-asserted-by":"crossref","unstructured":"Zhu, Y., Obyat, A., Liang, X., Batsis, J.A., Roth, R.M.: WavBERT: exploiting semantic and non-semantic speech using wav2vec and BERT for dementia detection. In: Proceedings of Interspeech 2021, pp. 3790\u20133794 (2021)","DOI":"10.21437\/Interspeech.2021-332"}],"container-title":["Lecture Notes in Computer Science","Digital Human Modeling and Applications in Health, Safety, Ergonomics and Risk Management. Health, Operations Management, and Design"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-06018-2_6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,9]],"date-time":"2022-11-09T12:05:50Z","timestamp":1667995550000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-06018-2_6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031060175","9783031060182"],"references-count":43,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-06018-2_6","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"16 June 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}