{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T11:48:59Z","timestamp":1775216939935,"version":"3.50.1"},"reference-count":78,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"7","license":[{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"National Key Research and Development Program of China","award":["2019YFA0706200"],"award-info":[{"award-number":["2019YFA0706200"]}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62227807"],"award-info":[{"award-number":["62227807"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004775","name":"Natural Science Foundation of Gansu Province","doi-asserted-by":"publisher","award":["22JR5RA488"],"award-info":[{"award-number":["22JR5RA488"]}],"id":[{"id":"10.13039\/501100004775","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","award":["lzujbky-2023-16"],"award-info":[{"award-number":["lzujbky-2023-16"]}],"id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Supercomputing Center of Lanzhou University"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Knowl. Data Eng."],"published-print":{"date-parts":[[2024,7]]},"DOI":"10.1109\/tkde.2024.3350071","type":"journal-article","created":{"date-parts":[[2024,1,5]],"date-time":"2024-01-05T20:04:36Z","timestamp":1704485076000},"page":"2956-2966","source":"Crossref","is-referenced-by-count":76,"title":["DepMSTAT: Multimodal Spatio-Temporal Attentional Transformer for Depression Detection"],"prefix":"10.1109","volume":"36","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-9712-9380","authenticated-orcid":false,"given":"Yongfeng","family":"Tao","sequence":"first","affiliation":[{"name":"Gansu Provincial Key Laboratory of Wearable Computing School of Information Science and Engineering, Lanzhou University, LanZhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7571-6439","authenticated-orcid":false,"given":"Minqiang","family":"Yang","sequence":"additional","affiliation":[{"name":"Gansu Provincial Key Laboratory of Wearable Computing School of Information Science and Engineering, Lanzhou University, LanZhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-6880-3042","authenticated-orcid":false,"given":"Huiru","family":"Li","sequence":"additional","affiliation":[{"name":"Gansu Provincial Key Laboratory of Wearable Computing School of Information Science and Engineering, Lanzhou University, LanZhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-3872-9600","authenticated-orcid":false,"given":"Yushan","family":"Wu","sequence":"additional","affiliation":[{"name":"Gansu Provincial Key Laboratory of Wearable Computing School of Information Science and Engineering, Lanzhou University, LanZhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3514-5413","authenticated-orcid":false,"given":"Bin","family":"Hu","sequence":"additional","affiliation":[{"name":"Gansu Provincial Key Laboratory of Wearable Computing, School of Information Science and Engineering, Lanzhou University, Lanzhou, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/S0140-6736(18)31948-2"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.jad.2013.01.004"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1017\/S0033291700038502"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1046\/j.1525-1497.2001.016009606.x"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2023.107457"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2877129"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/MWC.001.2000394"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2021.10.012"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.dcan.2023.03.007"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/tcss.2022.3223251"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3146711"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/s40846-022-00687-7"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1002\/int.22426"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/2988257.2988267"},{"key":"ref15","article-title":"Measuring depression symptom severity from spoken language and 3D facial expressions","author":"Haque","year":"2018"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/s12652-021-03497-y"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.3390\/s21144764"},{"key":"ref18","article-title":"A topic-attentive transformer-based model for multimodal depression detection","author":"Guo","year":"2022"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i11.21483"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref21","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018"},{"issue":"8","key":"ref22","article-title":"Language models are unsupervised multitask learners","volume":"1","author":"Radford","year":"2019","journal-title":"OpenAI Blog"},{"key":"ref23","article-title":"End-to-end ASR: From supervised to semi-supervised learning with modern architectures","author":"Synnaeve","year":"2019"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2019-1780"},{"key":"ref25","article-title":"Faster R-CNN: Towards real-time object detection with region proposal networks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"28","author":"Ren","year":"2015"},{"key":"ref26","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Dosovitskiy","year":"2021"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01367"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.3389\/fnbot.2021.824592"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01028"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.400"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i05.6503"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20053-3_5"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2023.3275156"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i14.17534"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01157"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1656"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01315"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/2661806.2661809"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3347320.3357688"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2018.2885515"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2021.3078898"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2020.10.015"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2018.2828819"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2020.3021755"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/FG.2018.00020"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2018.2870884"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1002\/int.22704"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2020.2970418"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/3266302.3268997"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2021.02.019"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-69541-5_3"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/tnnls.2023.3247103"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref55","first-page":"1755","article-title":"Dlib-ml: A machine learning toolkit","volume":"10","author":"King","year":"2009","journal-title":"J. Mach. Learn. Res."},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2015.2457417"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.5555\/3454287.3455008"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-35289-8_25"},{"key":"ref59","article-title":"SGDR: Stochastic gradient descent with warm restarts","author":"Loshchilov","year":"2016"},{"issue":"1","key":"ref60","first-page":"1929","article-title":"Dropout: A simple way to prevent neural networks from overfitting","volume":"15","author":"Srivastava","year":"2014","journal-title":"J. Mach. Learn. Res."},{"key":"ref61","first-page":"4604","article-title":"Do we need zero training loss after achieving zero training error?","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Ishida","year":"2020"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-84858-7"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00291"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC.2017.8037103"},{"key":"ref65","first-page":"6105","article-title":"Efficientnet: Rethinking model scaling for convolutional neural networks","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Tan","year":"2019"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1145\/3347320.3357696"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1115"},{"key":"ref68","first-page":"10347","article-title":"Training data-efficient image transformers & distillation through attention","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Touvron","year":"2021"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01054"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/TNSRE.2022.3224135"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01187"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00745"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19803-8_5"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2019.2935152"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.308"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2023.3282704"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.195"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"}],"container-title":["IEEE Transactions on Knowledge and Data Engineering"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/69\/10549876\/10381779.pdf?arnumber=10381779","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,27]],"date-time":"2024-11-27T18:20:37Z","timestamp":1732731637000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10381779\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7]]},"references-count":78,"journal-issue":{"issue":"7"},"URL":"https:\/\/doi.org\/10.1109\/tkde.2024.3350071","relation":{},"ISSN":["1041-4347","1558-2191","2326-3865"],"issn-type":[{"value":"1041-4347","type":"print"},{"value":"1558-2191","type":"electronic"},{"value":"2326-3865","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,7]]}}}