{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,23]],"date-time":"2026-03-23T22:14:20Z","timestamp":1774304060484,"version":"3.50.1"},"reference-count":33,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,6,6]]},"DOI":"10.1109\/icassp39728.2021.9413548","type":"proceedings-article","created":{"date-parts":[[2021,5,13]],"date-time":"2021-05-13T15:53:45Z","timestamp":1620921225000},"page":"7293-7297","source":"Crossref","is-referenced-by-count":4,"title":["Pause-Encoded Language Models for Recognition of Alzheimer\u2019s Disease and Emotion"],"prefix":"10.1109","author":[{"given":"Jiahong","family":"Yuan","sequence":"first","affiliation":[{"name":"Baidu Research,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xingyu","family":"Cai","sequence":"additional","affiliation":[{"name":"Baidu Research,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kenneth","family":"Church","sequence":"additional","affiliation":[{"name":"Baidu Research,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref33","first-page":"3227","article-title":"Attention driven fusion for multi-modal emotion recognition","author":"priyasad","year":"2020","journal-title":"Proceedings of ICASSP 2020"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9052937"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053192"},{"key":"ref30","first-page":"6474","article-title":"Speech emotion recognition with dualsequence lstm architecture","author":"wang","year":"2020","journal-title":"Proceedings of ICASSP 2020"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.wocn.2006.04.001"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/0749-596X(91)90004-4"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1080\/713755895"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1007"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1044\/jshr.3806.1232"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/SpeechProsody.2016-240"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.3138\/cmlr.2018-0258"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2516"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/j.specom.2013.07.009"},{"key":"ref19","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","author":"devlin","year":"2018"},{"key":"ref28","article-title":"Fine-tuning pretrained language models: Weight initializations, data orders, and early stopping","author":"dodge","year":"2020"},{"key":"ref4","first-page":"41","article-title":"Pauses and the temporal structure of speech","author":"zellner","year":"1994","journal-title":"Fundamentals of speech synthesis and speech recognition"},{"key":"ref27","author":"macwhinney","year":"2000","journal-title":"The CHILDES project Tools for analyzing talk"},{"key":"ref3","author":"butcher","year":"1981","journal-title":"Aspects of the speech pause phonetic correlates and communicative functions"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1121\/1.4807639"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"335","DOI":"10.1007\/s10579-008-9076-6","article-title":"Iemocap: Interactive emotional dyadic motion capture database","volume":"42","author":"busso","year":"2008","journal-title":"Language Resources and Evaluation"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/B0-08-044854-2\/00796-3"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/S0022-5371(71)80072-5"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.cognition.2014.07.013"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/BF01067111"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/0010-0285(79)90004-5"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1177\/002383096100400405"},{"key":"ref20","article-title":"Ernie 2.0: A continual pre-training framework for language understanding","author":"sun","year":"2019"},{"key":"ref22","first-page":"5998","article-title":"Attention is all you need","author":"vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref21","article-title":"Roberta: A robustly optimized bert pretraining approach","author":"liu","year":"2019","journal-title":"ArXiv"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1121\/1.2935783"},{"key":"ref23","article-title":"Interview: A large-scale open-source corpus of media dialog","author":"majumder","year":"2020","journal-title":"CoRR"},{"key":"ref26","author":"goodglass","year":"2001","journal-title":"The Boston Diagnostic Aphasia Examination"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1001\/archneur.1994.00540180063015"}],"event":{"name":"ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Toronto, ON, Canada","start":{"date-parts":[[2021,6,6]]},"end":{"date-parts":[[2021,6,11]]}},"container-title":["ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9413349\/9413350\/09413548.pdf?arnumber=9413548","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,2]],"date-time":"2022-08-02T20:19:59Z","timestamp":1659471599000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9413548\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6,6]]},"references-count":33,"URL":"https:\/\/doi.org\/10.1109\/icassp39728.2021.9413548","relation":{},"subject":[],"published":{"date-parts":[[2021,6,6]]}}}