{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,27]],"date-time":"2026-05-27T07:04:32Z","timestamp":1779865472829,"version":"3.53.1"},"reference-count":68,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Biomedical Signal Processing and Control"],"published-print":{"date-parts":[[2026,9]]},"DOI":"10.1016\/j.bspc.2026.110517","type":"journal-article","created":{"date-parts":[[2026,5,9]],"date-time":"2026-05-09T06:58:48Z","timestamp":1778309928000},"page":"110517","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"PA","title":["A long\u2013short behavioral evolution modeling for video depression recognition"],"prefix":"10.1016","volume":"123","author":[{"given":"Wanqing","family":"Xie","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-9092-5044","authenticated-orcid":false,"given":"Yaonan","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1862-974X","authenticated-orcid":false,"given":"Yongqi","family":"Lin","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-0306-5846","authenticated-orcid":false,"given":"Xiaoyuan","family":"He","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Baoliang","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0768-1676","authenticated-orcid":false,"given":"Yanzhong","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4514-2016","authenticated-orcid":false,"given":"Xiaofeng","family":"Liu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Mingmei","family":"Cheng","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"78","reference":[{"key":"10.1016\/j.bspc.2026.110517_b1","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1016\/j.npbr.2019.01.001","article-title":"Global functioning and suicide risk in patients with depression and comorbid borderline personality disorder","volume":"31","author":"Sarhan","year":"2019","journal-title":"Neurol. Psychiatr. Brain Res."},{"key":"10.1016\/j.bspc.2026.110517_b2","doi-asserted-by":"crossref","first-page":"127","DOI":"10.1038\/s41398-019-0460-3","article-title":"Prognosis and improved outcomes in major depression: a review","volume":"9","author":"Kraus","year":"2019","journal-title":"Transl. Psychiatry"},{"key":"10.1016\/j.bspc.2026.110517_b3","doi-asserted-by":"crossref","first-page":"553","DOI":"10.1002\/0471264385.wei1024","article-title":"Assessing personality and psychopathology with self-report inventories","volume":"10","author":"Ben-Porath","year":"2003","journal-title":"Handb. Psychol.: Assess. Psychol."},{"key":"10.1016\/j.bspc.2026.110517_b4","series-title":"Depression and other common mental disorders: Global health estimates","author":"World Health Organization","year":"2017"},{"issue":"4","key":"10.1016\/j.bspc.2026.110517_b5","doi-asserted-by":"crossref","first-page":"445","DOI":"10.1109\/TAFFC.2017.2724035","article-title":"Automatic assessment of depression based on visual cues: A systematic review","volume":"10","author":"Pampouchidou","year":"2017","journal-title":"IEEE Trans. Affect. Comput."},{"key":"10.1016\/j.bspc.2026.110517_b6","article-title":"Facial depression estimation via Multi-Cue contrastive learning","author":"Wang","year":"2025","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"10.1016\/j.bspc.2026.110517_b7","doi-asserted-by":"crossref","DOI":"10.1016\/j.neucom.2025.129605","article-title":"Deep learning-based depression recognition through facial expression: A systematic review","author":"Cao","year":"2025","journal-title":"Neurocomputing"},{"issue":"3","key":"10.1016\/j.bspc.2026.110517_b8","doi-asserted-by":"crossref","first-page":"1581","DOI":"10.1109\/TAFFC.2020.3021755","article-title":"A deep multiscale spatiotemporal network for assessing depression from facial dynamics","volume":"13","author":"De Melo","year":"2020","journal-title":"IEEE Trans. Affect. Comput."},{"issue":"12","key":"10.1016\/j.bspc.2026.110517_b9","doi-asserted-by":"crossref","first-page":"10140","DOI":"10.1002\/int.22426","article-title":"Intelligent system for depression scale estimation with facial expressions and case study in industrial intelligence","volume":"37","author":"He","year":"2022","journal-title":"Int. J. Intell. Syst."},{"issue":"22","key":"10.1016\/j.bspc.2026.110517_b10","doi-asserted-by":"crossref","first-page":"20230","DOI":"10.1109\/JIOT.2023.3283616","article-title":"An improved global\u2013local fusion network for depression detection telemedicine framework","volume":"10","author":"Zhang","year":"2023","journal-title":"IEEE Internet Things J."},{"key":"10.1016\/j.bspc.2026.110517_b11","series-title":"Proc. 14th IEEE Int. Conf. Autom. Face Gesture Recognit. (FG)","first-page":"1","article-title":"Combining global and local convolutional 3d networks for detecting depression from facial expressions","author":"De Melo","year":"2019"},{"issue":"3","key":"10.1016\/j.bspc.2026.110517_b12","doi-asserted-by":"crossref","first-page":"1605","DOI":"10.1109\/TAFFC.2020.3022732","article-title":"Facial depression recognition by deep joint label distribution and metric learning","volume":"13","author":"Zhou","year":"2020","journal-title":"IEEE Trans. Affect. Comput."},{"key":"10.1016\/j.bspc.2026.110517_b13","doi-asserted-by":"crossref","first-page":"165","DOI":"10.1016\/j.neucom.2020.10.015","article-title":"Automatic depression recognition using CNN with attention mechanism from videos","volume":"422","author":"He","year":"2021","journal-title":"Neurocomputing"},{"key":"10.1016\/j.bspc.2026.110517_b14","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2023.121410","article-title":"Spatial\u2013temporal attention network for depression recognition from facial videos","volume":"237","author":"Pan","year":"2024","journal-title":"Expert Syst. Appl."},{"issue":"2","key":"10.1016\/j.bspc.2026.110517_b15","doi-asserted-by":"crossref","first-page":"829","DOI":"10.1109\/TAFFC.2020.2970712","article-title":"Spectral representation of behaviour primitives for depression analysis","volume":"13","author":"Song","year":"2020","journal-title":"IEEE Trans. Affect. Comput."},{"issue":"1","key":"10.1016\/j.bspc.2026.110517_b16","doi-asserted-by":"crossref","first-page":"161","DOI":"10.1109\/TAFFC.2024.3415770","article-title":"Two-stage temporal modelling framework for video-based depression recognition using graph representation","volume":"16","author":"Xu","year":"2024","journal-title":"IEEE Trans. Affect. Comput."},{"key":"10.1016\/j.bspc.2026.110517_b17","doi-asserted-by":"crossref","DOI":"10.1016\/j.knosys.2025.113437","article-title":"VC-Mamba: Causal Mamba representation consistency for video implicit understanding","volume":"317","author":"Hu","year":"2025","journal-title":"Knowl.-Based Syst."},{"key":"10.1016\/j.bspc.2026.110517_b18","first-page":"1","article-title":"Automatic depression recognition with an ensemble of multimodal Spatio-Temporal routing features","author":"Wang","year":"2025","journal-title":"IEEE Trans. Affect. Comput."},{"key":"10.1016\/j.bspc.2026.110517_b19","doi-asserted-by":"crossref","unstructured":"Z. Wu, L. Zhou, S. Li, C. Fu, J. Lu, J. Han, Y. Zhang, Z. Zhao, S. Song, DepMGNN: Matrixial Graph Neural Network for Video-based Automatic Depression Assessment, in: Proc. AAAI Conf. Artif. Intell., Vol. 39, 2025, pp. 1610\u20131619.","DOI":"10.1609\/aaai.v39i2.32153"},{"key":"10.1016\/j.bspc.2026.110517_b20","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2025.108113","article-title":"CFGMamba: Cross frame group mamba for video-based depression recognition","volume":"110","author":"Liu","year":"2025","journal-title":"Biomed. Signal Process. Control."},{"key":"10.1016\/j.bspc.2026.110517_b21","series-title":"Proc. Int. Conf. Affect. Comput. Intell. Interact.","first-page":"255","article-title":"A temporally piece-wise fisher vector approach for depression analysis","author":"Dhall","year":"2015"},{"issue":"11","key":"10.1016\/j.bspc.2026.110517_b22","doi-asserted-by":"crossref","first-page":"2740","DOI":"10.1109\/TPAMI.2018.2868668","article-title":"Temporal segment networks for action recognition in videos","volume":"41","author":"Wang","year":"2018","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"1","key":"10.1016\/j.bspc.2026.110517_b23","doi-asserted-by":"crossref","first-page":"294","DOI":"10.1109\/TAFFC.2020.3031345","article-title":"Multimodal spatiotemporal representation for automatic depression level detection","volume":"14","author":"Niu","year":"2020","journal-title":"IEEE Trans. Affect. Comput."},{"issue":"6","key":"10.1016\/j.bspc.2026.110517_b24","doi-asserted-by":"crossref","first-page":"1599","DOI":"10.1109\/TFUZZ.2021.3062723","article-title":"Building trend fuzzy granulation-based LSTM recurrent neural network for long-term time-series forecasting","volume":"30","author":"Tang","year":"2021","journal-title":"IEEE Trans. Fuzzy Syst."},{"key":"10.1016\/j.bspc.2026.110517_b25","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1016\/j.neucom.2022.10.050","article-title":"Recurrent attention unit: A new gated recurrent unit for long-term memory of important parts in sequential data","volume":"517","author":"Niu","year":"2023","journal-title":"Neurocomputing"},{"key":"10.1016\/j.bspc.2026.110517_b26","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2024.106552","article-title":"A novel multimodal depression diagnosis approach utilizing a new hybrid fusion method","volume":"96","author":"Zhang","year":"2024","journal-title":"Biomed. Signal Process. Control."},{"key":"10.1016\/j.bspc.2026.110517_b27","series-title":"Proc. 25th Int. Conf. Pattern Recognit.","first-page":"607","article-title":"Video-based facial expression recognition using graph convolutional networks","author":"Liu","year":"2021"},{"key":"10.1016\/j.bspc.2026.110517_b28","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2024.106767","article-title":"LSCAformer: Long and short-term cross-attention-aware transformer for depression recognition from video sequences","volume":"98","author":"He","year":"2024","journal-title":"Biomed. Signal Process. Control."},{"key":"10.1016\/j.bspc.2026.110517_b29","doi-asserted-by":"crossref","DOI":"10.1016\/j.knosys.2024.111951","article-title":"PointTransform networks for automatic depression level prediction via facial keypoints","volume":"297","author":"Niu","year":"2024","journal-title":"Knowl.-Based Syst."},{"key":"10.1016\/j.bspc.2026.110517_b30","series-title":"Proc. IEEE Int. Conf. Acoust., Speech Signal Process.","first-page":"1325","article-title":"Multi-scale and multi-region facial discriminative representation for automatic depression level prediction","author":"Niu","year":"2021"},{"key":"10.1016\/j.bspc.2026.110517_b31","doi-asserted-by":"crossref","unstructured":"M. Valstar, B. Schuller, K. Smith, F. Eyben, B. Jiang, S. Bilakhia, S. Schnieder, R. Cowie, M. Pantic, Avec 2013: the continuous audio\/visual emotion and depression recognition challenge, in: Proc. 3rd ACM Int. Workshop Audio\/Visual Emotion Challenge, 2013, pp. 3\u201310.","DOI":"10.1145\/2512530.2512533"},{"issue":"7","key":"10.1016\/j.bspc.2026.110517_b32","doi-asserted-by":"crossref","first-page":"1432","DOI":"10.1109\/TIFS.2015.2414392","article-title":"Automated depression diagnosis based on facial dynamic analysis and sparse coding","volume":"10","author":"Wen","year":"2015","journal-title":"IEEE Trans. Inf. Forensics Secur."},{"key":"10.1016\/j.bspc.2026.110517_b33","doi-asserted-by":"crossref","unstructured":"H. Meng, D. Huang, H. Wang, H. Yang, M. Ai-Shuraifi, Y. Wang, Depression recognition based on dynamic facial and vocal expression features using partial least square regression, in: Proc. 3rd ACM Int. Workshop Audio\/Visual Emotion Challenge, 2013, pp. 21\u201330.","DOI":"10.1145\/2512530.2512532"},{"issue":"4","key":"10.1016\/j.bspc.2026.110517_b34","doi-asserted-by":"crossref","first-page":"578","DOI":"10.1109\/TAFFC.2017.2650899","article-title":"Automated depression diagnosis based on deep networks to encode facial appearance and dynamics","volume":"9","author":"Zhu","year":"2017","journal-title":"IEEE Trans. Affect. Comput."},{"key":"10.1016\/j.bspc.2026.110517_b35","doi-asserted-by":"crossref","first-page":"554","DOI":"10.1109\/TNSRE.2022.3204757","article-title":"Dual-stream multiple instance learning for depression detection with facial expression videos","volume":"31","author":"Shangguan","year":"2022","journal-title":"IEEE Trans. Neural Syst. Rehabil. Eng."},{"issue":"1","key":"10.1016\/j.bspc.2026.110517_b36","doi-asserted-by":"crossref","first-page":"262","DOI":"10.1109\/TAFFC.2018.2870884","article-title":"Video-based depression level analysis by encoding deep spatiotemporal features","volume":"12","author":"Al Jazaery","year":"2018","journal-title":"IEEE Trans. Affect. Comput."},{"issue":"2","key":"10.1016\/j.bspc.2026.110517_b37","doi-asserted-by":"crossref","first-page":"864","DOI":"10.1109\/TAFFC.2020.2970418","article-title":"Depression level prediction using deep spatiotemporal features and multilayer bi-ltsm","volume":"13","author":"Uddin","year":"2020","journal-title":"IEEE Trans. Affect. Comput."},{"issue":"9","key":"10.1016\/j.bspc.2026.110517_b38","doi-asserted-by":"crossref","first-page":"8924","DOI":"10.1109\/TCSVT.2024.3382334","article-title":"Depressionmlp: A multi-layer perceptron architecture for automatic depression level prediction via facial keypoints and action units","volume":"34","author":"Niu","year":"2024","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"10.1016\/j.bspc.2026.110517_b39","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2025.128532","article-title":"Fine-grained multimodal fusion for depression assisted recognition based on hierarchical knowledge-enhanced prompt learning","author":"Yang","year":"2025","journal-title":"Expert Syst. Appl."},{"issue":"3","key":"10.1016\/j.bspc.2026.110517_b40","doi-asserted-by":"crossref","first-page":"577","DOI":"10.1016\/j.dcan.2023.03.007","article-title":"Depressive semantic awareness from vlog facial and vocal streams via spatio-temporal transformer","volume":"10","author":"Tao","year":"2024","journal-title":"Digit. Commun. Netw."},{"issue":"12","key":"10.1016\/j.bspc.2026.110517_b41","doi-asserted-by":"crossref","first-page":"7749","DOI":"10.1109\/TCYB.2022.3197127","article-title":"MS2-GNN: Exploring GNN-based multimodal fusion network for depression detection","volume":"53","author":"Chen","year":"2022","journal-title":"IEEE Trans. Cybern."},{"issue":"1","key":"10.1016\/j.bspc.2026.110517_b42","doi-asserted-by":"crossref","first-page":"578","DOI":"10.1109\/TAFFC.2021.3072579","article-title":"MDN: A deep maximization-differentiation network for spatio-temporal depression detection","volume":"14","author":"De Melo","year":"2021","journal-title":"IEEE Trans. Affect. Comput."},{"issue":"3","key":"10.1016\/j.bspc.2026.110517_b43","doi-asserted-by":"crossref","first-page":"1078","DOI":"10.1109\/TAFFC.2023.3312263","article-title":"MTDAN: A lightweight multi-scale temporal difference attention networks for automated video depression detection","volume":"15","author":"Zhang","year":"2023","journal-title":"IEEE Trans. Affect. Comput."},{"key":"10.1016\/j.bspc.2026.110517_b44","doi-asserted-by":"crossref","unstructured":"L. Wang, Z. Tong, B. Ji, G. Wu, Tdn: Temporal difference networks for efficient action recognition, in: Proc. IEEE Conf. Comput. Vis. Pattern Recognit., CVPR, 2021, pp. 1895\u20131904.","DOI":"10.1109\/CVPR46437.2021.00193"},{"key":"10.1016\/j.bspc.2026.110517_b45","doi-asserted-by":"crossref","unstructured":"K. Hara, H. Kataoka, Y. Satoh, Learning spatio-temporal features with 3d residual networks for action recognition, in: Proc. IEEE Conf. Comput. Vis. Pattern Recognit., CVPR, 2017, pp. 3154\u20133160.","DOI":"10.1109\/ICCVW.2017.373"},{"key":"10.1016\/j.bspc.2026.110517_b46","doi-asserted-by":"crossref","unstructured":"K. He, X. Zhang, S. Ren, J. Sun, Deep residual learning for image recognition, in: Proc. IEEE Conf. Comput. Vis. Pattern Recognit., CVPR, 2016, pp. 770\u2013778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"10.1016\/j.bspc.2026.110517_b47","series-title":"Major depressive disorder","author":"Bains","year":"2020"},{"key":"10.1016\/j.bspc.2026.110517_b48","doi-asserted-by":"crossref","unstructured":"N. Dalal, B. Triggs, Histograms of oriented gradients for human detection, in: Proc. IEEE Conf. Comput. Vis. Pattern Recognit., CVPR, 2005, pp. 886\u2013893.","DOI":"10.1109\/CVPR.2005.177"},{"key":"10.1016\/j.bspc.2026.110517_b49","doi-asserted-by":"crossref","unstructured":"M. Valstar, B. Schuller, K. Smith, T. Almaev, F. Eyben, J. Krajewski, R. Cowie, M. Pantic, Avec 2014: 3d dimensional affect and depression recognition challenge, in: Proc. 4th Int. Workshop Audio\/Visual Emotion Challenge, 2014, pp. 3\u201310.","DOI":"10.1145\/2661806.2661807"},{"key":"10.1016\/j.bspc.2026.110517_b50","doi-asserted-by":"crossref","unstructured":"M. Valstar, J. Gratch, B. Schuller, F. Ringeval, D. Lalanne, M. Torres, S. Scherer, G. Stratou, R. Cowie, M. Pantic, AVEC 2016: Depression, Mood, and Emotion Recognition Workshop and Challenge, in: Proc. 6th ACM Int. Workshop Audio\/Visual Emotion Challenge, 2016, pp. 3\u201310.","DOI":"10.1145\/2988257.2988258"},{"issue":"10","key":"10.1016\/j.bspc.2026.110517_b51","doi-asserted-by":"crossref","first-page":"1499","DOI":"10.1109\/LSP.2016.2603342","article-title":"Joint face detection and alignment using multitask cascaded convolutional networks","volume":"23","author":"Zhang","year":"2016","journal-title":"IEEE Signal Process. Lett."},{"key":"10.1016\/j.bspc.2026.110517_b52","doi-asserted-by":"crossref","unstructured":"F. Ringeval, B. Schuller, M. Valstar, N. Cummins, R. Cowie, L. Tavabi, M. Schmitt, S. Alisamir, S. Amiriparian, E.-M. Messner, et al., AVEC 2019 workshop and challenge: state-of-mind, detecting depression with AI, and cross-cultural affect recognition, in: Proc. 9th Int. Audio\/Visual Emotion Challenge and Workshop, 2019, pp. 3\u201312.","DOI":"10.1145\/3347320.3357688"},{"key":"10.1016\/j.bspc.2026.110517_b53","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2022.117512","article-title":"Depressioner: Facial dynamic representation for automatic depression level prediction","volume":"204","author":"Niu","year":"2022","journal-title":"Expert Syst. Appl."},{"issue":"3","key":"10.1016\/j.bspc.2026.110517_b54","doi-asserted-by":"crossref","first-page":"2153","DOI":"10.1109\/TAFFC.2022.3179478","article-title":"Deep multi-modal network based automated depression severity estimation","volume":"14","author":"Uddin","year":"2022","journal-title":"IEEE Trans. Affect. Comput."},{"issue":"3","key":"10.1016\/j.bspc.2026.110517_b55","doi-asserted-by":"crossref","first-page":"828","DOI":"10.1109\/TAFFC.2023.3296318","article-title":"Integrating deep facial priors into landmarks for privacy preserving multimodal depression recognition","volume":"15","author":"Pan","year":"2023","journal-title":"IEEE Trans. Affect. Comput."},{"key":"10.1016\/j.bspc.2026.110517_b56","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2023.121276","article-title":"Facial expression analysis using decomposed multiscale spatiotemporal networks","volume":"236","author":"De Melo","year":"2024","journal-title":"Expert Syst. Appl."},{"key":"10.1016\/j.bspc.2026.110517_b57","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2024.106490","article-title":"Depressformer: Leveraging video swin transformer and fine-grained local features for depression scale estimation","volume":"96","author":"He","year":"2024","journal-title":"Biomed. Signal Process. Control."},{"issue":"6","key":"10.1016\/j.bspc.2026.110517_b58","doi-asserted-by":"crossref","first-page":"6195","DOI":"10.1109\/TCSVT.2025.3533480","article-title":"Depression scale dictionary decomposition framework for multimodal automatic depression level prediction","volume":"35","author":"Niu","year":"2025","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"10.1016\/j.bspc.2026.110517_b59","first-page":"1","article-title":"Simma: Multimodal automatic depression detection via spatiotemporal ensemble and cross-modal alignment","author":"Wang","year":"2025","journal-title":"IEEE Trans. Comput. Soc. Syst."},{"key":"10.1016\/j.bspc.2026.110517_b60","first-page":"1","article-title":"Depression recognition by fuzzy learning of facial movements based on graph neural networks","author":"Liu","year":"2025","journal-title":"IEEE Trans. Fuzzy Syst."},{"key":"10.1016\/j.bspc.2026.110517_b61","first-page":"1","article-title":"MLM-EOE: Automatic depression detection via sentimental annotation and multi-expert ensemble","author":"Lin","year":"2025","journal-title":"IEEE Trans. Affect. Comput."},{"key":"10.1016\/j.bspc.2026.110517_b62","doi-asserted-by":"crossref","unstructured":"S. Song, L. Shen, M. Valstar, Human Behaviour-Based Automatic Depression Analysis Using Hand-Crafted Statistics and Deep Learned Spectral Features, in: Proc. 13th IEEE Int. Conf. Automatic Face & Gesture Recognition (FG 2018), 2018, pp. 158\u2013165.","DOI":"10.1109\/FG.2018.00032"},{"key":"10.1016\/j.bspc.2026.110517_b63","doi-asserted-by":"crossref","unstructured":"S. Rasipuram, J.H. Bhat, A. Maitra, B. Shaw, S. Saha, Multimodal Depression Detection Using Task-oriented Transformer-based Embedding, in: Proc. 2022 IEEE Symp. Computers and Communications, ISCC, 2022, pp. 01\u201304.","DOI":"10.1109\/ISCC55528.2022.9913044"},{"key":"10.1016\/j.bspc.2026.110517_b64","doi-asserted-by":"crossref","DOI":"10.1016\/j.bspc.2022.104561","article-title":"A multimodal fusion model with multi-level attention mechanism for depression detection","volume":"82","author":"Fang","year":"2023","journal-title":"Biomed. Signal Process. Control."},{"issue":"5","key":"10.1016\/j.bspc.2026.110517_b65","doi-asserted-by":"crossref","first-page":"6830","DOI":"10.1109\/TCSS.2024.3416029","article-title":"Parallel multiscale bridge fusion network for Audio\u2013Visual automatic depression assessment","volume":"11","author":"Hu","year":"2024","journal-title":"IEEE Trans. Comput. Soc. Syst."},{"key":"10.1016\/j.bspc.2026.110517_b66","doi-asserted-by":"crossref","DOI":"10.1016\/j.jbi.2025.104965","article-title":"MDD-MARF: a multimodal depression detection model based on multi-level attention mechanism and residual fusion","volume":"173","author":"Zhou","year":"2026","journal-title":"J. Biomed. Inf."},{"key":"10.1016\/j.bspc.2026.110517_b67","series-title":"Gated multimodal units for information fusion","author":"Arevalo","year":"2017"},{"key":"10.1016\/j.bspc.2026.110517_b68","doi-asserted-by":"crossref","unstructured":"R.R. Selvaraju, M. Cogswell, A. Das, R. Vedantam, D. Parikh, D. Batra, Grad-cam: Visual explanations from deep networks via gradient-based localization, in: Proc. IEEE Int. Conf. Comput. Vis., ICCV, 2017, pp. 618\u2013626.","DOI":"10.1109\/ICCV.2017.74"}],"container-title":["Biomedical Signal Processing and Control"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1746809426010712?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1746809426010712?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,5,27]],"date-time":"2026-05-27T06:26:54Z","timestamp":1779863214000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1746809426010712"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,9]]},"references-count":68,"alternative-id":["S1746809426010712"],"URL":"https:\/\/doi.org\/10.1016\/j.bspc.2026.110517","relation":{},"ISSN":["1746-8094"],"issn-type":[{"value":"1746-8094","type":"print"}],"subject":[],"published":{"date-parts":[[2026,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"A long\u2013short behavioral evolution modeling for video depression recognition","name":"articletitle","label":"Article Title"},{"value":"Biomedical Signal Processing and Control","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.bspc.2026.110517","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Ltd. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"110517"}}