{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T06:59:52Z","timestamp":1775199592781,"version":"3.50.1"},"reference-count":40,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T00:00:00Z","timestamp":1764979200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T00:00:00Z","timestamp":1764979200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,12,6]]},"DOI":"10.1109\/asru65441.2025.11434604","type":"proceedings-article","created":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T19:48:04Z","timestamp":1775159284000},"page":"1-7","source":"Crossref","is-referenced-by-count":0,"title":["Recognizing Dementia from Neuropsychological Tests with State Space Models"],"prefix":"10.1109","author":[{"given":"Liming","family":"Wang","sequence":"first","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Saurabhchand","family":"Bhati","sequence":"additional","affiliation":[{"name":"Massachusetts Institute of Technology"}]},{"given":"Cody","family":"Karjadi","sequence":"additional","affiliation":[{"name":"Boston University"}]},{"given":"Rhoda","family":"Au","sequence":"additional","affiliation":[{"name":"Boston University"}]},{"given":"James","family":"Glass","sequence":"additional","affiliation":[{"name":"Boston University"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1159\/000078501"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1038\/mp.2015.129"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.3928\/0098-9134-19990501-08"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-1220"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU.2017.8268965"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-emnlp.386"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/n18-2117"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-1589"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref10","article-title":"Efficiently modeling long sequences with structured state spaces","author":"Gu","year":"2021","journal-title":"arXiv preprint arXiv:2111.00396"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-759"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096205"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/SLT61566.2024.10832169"},{"key":"ref14","article-title":"Efficiently modeling long sequences with structured state spaces","author":"Gu","year":"2022","journal-title":"ICLR"},{"key":"ref15","article-title":"Mamba: Linear-time sequence modeling with selective state spaces","author":"Gu","year":"2023","journal-title":"arXiv preprint arXiv:2312.00752"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2571"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2021-1633"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1186\/s13195-021-00888-3"},{"key":"ref19","article-title":"wav2vec 2.0: A framework for self-supervised learning of speech representations","author":"Baevski","year":"2020","journal-title":"NeurIPS"},{"key":"ref20","article-title":"Robust speech recognition via large-scale weak supervision","author":"Radford","year":"2023","journal-title":"ICML"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.3389\/fpsyg.2020.624137"},{"key":"ref22","article-title":"Vmamba: Visual state space model","author":"Liu","year":"2024","journal-title":"arXiv preprint arXiv:2401.10166"},{"key":"ref23","article-title":"Vision mamba: Efficient visual representation learning with bidirectional state space model","author":"Zhu","year":"2024","journal-title":"arXiv preprint arXiv:2401.09417"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2024.3483009"},{"key":"ref25","article-title":"Audio mamba: Pretrained audio state space model for audio tagging","author":"Lin","year":"2024","journal-title":"arXiv preprint arXiv:2405.13636"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/slt61566.2024.10832304"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TASLPRO.2025.3566210"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49660.2025.10889391"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1423"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2023-205"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2023-105"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7952261"},{"key":"ref34","first-page":"6105","article-title":"Efficientnet: Rethinking model scaling for convolutional neural networks","volume":"97","author":"Tan","year":"2019","journal-title":"ICML"},{"key":"ref35","article-title":"LLaMA: Open and efficient foundation language models","author":"Touvron","year":"2023","journal-title":"arXiv preprint arXiv:2302.13971"},{"key":"ref36","article-title":"Qwen2 technical report","volume-title":"tech. rep., Qwen Team, Alibaba Group","author":"Yang","year":"2024"},{"key":"ref37","article-title":"Phi-4-mini technical report: Compact yet powerful multimodal language models via mixture-of-loras","volume-title":"Technical Report","year":"2024"},{"key":"ref38","article-title":"Lora: Low-rank adaptation of large language models","author":"Hu","year":"2021"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1406.3269"},{"key":"ref40","article-title":"Scaling laws for neural language models","author":"Kaplan","year":"2020","journal-title":"arXiv preprint arXiv:2001.08361"}],"event":{"name":"2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","location":"Honolulu, HI, USA","start":{"date-parts":[[2025,12,6]]},"end":{"date-parts":[[2025,12,10]]}},"container-title":["2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11434577\/11433836\/11434604.pdf?arnumber=11434604","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T04:56:36Z","timestamp":1775192196000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11434604\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,6]]},"references-count":40,"URL":"https:\/\/doi.org\/10.1109\/asru65441.2025.11434604","relation":{},"subject":[],"published":{"date-parts":[[2025,12,6]]}}}