{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T05:05:20Z","timestamp":1750309520053,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":29,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,25]],"date-time":"2024-10-25T00:00:00Z","timestamp":1729814400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"National Natural Science Foundation of China","award":["72271126"],"award-info":[{"award-number":["72271126"]}]},{"name":"National Natural Science Foundation of China","award":["12227808"],"award-info":[{"award-number":["12227808"]}]},{"name":"Major Project of Natural Science Foundation of Jiangsu Education Department","award":["22KJA630001"],"award-info":[{"award-number":["22KJA630001"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,25]]},"DOI":"10.1145\/3704323.3704375","type":"proceedings-article","created":{"date-parts":[[2025,1,7]],"date-time":"2025-01-07T08:25:22Z","timestamp":1736238322000},"page":"226-232","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Enhanced Depression Detection through Optimally Weighted Spectrogram Feature Fusion"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7028-4200","authenticated-orcid":false,"given":"Pingping","family":"Wu","sequence":"first","affiliation":[{"name":"School of Engineering Audit, Jiangsu Key Laboratory of Public Project Audit, Nanjing Audit University, Nanjing, Jiangsu, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-3962-6783","authenticated-orcid":false,"given":"Fangfang","family":"Xu","sequence":"additional","affiliation":[{"name":"School of Computer Science, Nanjing Audit University, Nanjing, Jiangsu, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5136-5059","authenticated-orcid":false,"given":"Han","family":"Lin","sequence":"additional","affiliation":[{"name":"School of Engineering Audit, Jiangsu Key Laboratory of Public Project Audit, Nanjing Audit University, Nanjing, Jiangsu, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,1,7]]},"reference":[{"doi-asserted-by":"publisher","unstructured":"Tania\u00a0H Bisgaard Kristine\u00a0H Allin and Keefer. 2022. Depression and anxiety in inflammatory bowel disease: epidemiology mechanisms and treatment. Nat. Rev. Gastroenterol. Hepatol. 19 (Nov 2022) 717\u2013726. 10.1016\/j.bspc.2023.105020","key":"e_1_3_3_1_2_2","DOI":"10.1016\/j.bspc.2023.105020"},{"doi-asserted-by":"publisher","unstructured":"Yoonseo Park Sewon Park and Munjae Lee. 2024. Effectiveness of artificial intelligence in detecting and managing depressive disorders: Systematic review. J. Affect. Disord. 361 (Sep 2024) 445\u2013456. 10.1016\/j.jad.2024.06.035","key":"e_1_3_3_1_3_2","DOI":"10.1016\/j.jad.2024.06.035"},{"doi-asserted-by":"publisher","unstructured":"Shaykhah\u00a0A Almaghrabi Scott\u00a0R Clark and Mathias Baumert. 2023. Bio-acoustic features of depression: A review. Biomed. Signal Process. Control 85 (Aug 2023) 105020. 10.1016\/j.bspc.2023.105020","key":"e_1_3_3_1_4_2","DOI":"10.1016\/j.bspc.2023.105020"},{"doi-asserted-by":"publisher","unstructured":"Yunji Liang Huihui Li Bin Guo Zhiwen Yu Xiaolong Zheng Sagar Samtani and Daniel\u00a0D Zeng. 2021. Fusion of heterogeneous attention mechanisms in multi-view convolutional neural network for text classification. Inf. Sci. (Ny) 548 (Feb 2021) 295\u2013312. 10.1016\/j.ins.2020.10.021","key":"e_1_3_3_1_5_2","DOI":"10.1016\/j.ins.2020.10.021"},{"doi-asserted-by":"publisher","unstructured":"Sara Sardari Bahareh Nakisa Mohammed\u00a0Naim Rastgoo and Peter Eklund. 2022. Audio based depression detection using Convolutional Autoencoder. Expert Syst. Appl. 189 (Mar 2022) 116076. 10.1016\/j.eswa.2021.116076","key":"e_1_3_3_1_6_2","DOI":"10.1016\/j.eswa.2021.116076"},{"doi-asserted-by":"publisher","unstructured":"Andr\u00e9s G\u00f3mez-Rodellar Daniel Palacios-Alonso and Ferr\u00e1ndez Vicente. 2020. A methodology to differentiate Parkinson\u2019s Disease and aging speech based on glottal flow acoustic analysis. Int. J. Neural Syst. 30 (Oct 2020) 2050058. 10.1142\/S0129065720500586","key":"e_1_3_3_1_7_2","DOI":"10.1142\/S0129065720500586"},{"doi-asserted-by":"publisher","unstructured":"A.\u00a0J. Rush M.\u00a0H. Trivedi H.\u00a0M. Ibrahim and T.\u00a0J. Carmody. 2003. The 16-Item Quick Inventory of Depressive Symptomatology (QIDS) clinician rating (QIDS-C) and self-report (QIDS-SR): a psychometric evaluation in patients with chronic major depression. Biol. Psychiatry 54 (September 2003) 573\u2013583. 10.1016\/S0006-3223(02)01866-8","key":"e_1_3_3_1_8_2","DOI":"10.1016\/S0006-3223(02)01866-8"},{"doi-asserted-by":"publisher","unstructured":"Mingyue Niu Jianhua Tao Bin Liu and Huang. 2023. Multimodal spatiotemporal representation for automatic depression level detection. IEEE Trans. Affect. Comput. 14 (Jan 2023) 294\u2013307. 10.1109\/TAFFC.2020.3031345","key":"e_1_3_3_1_9_2","DOI":"10.1109\/TAFFC.2020.3031345"},{"doi-asserted-by":"publisher","unstructured":"Zhaocheng Huang Julien Epps and Dale Joachim. 2022. Investigation of speech landmark patterns for depression detection. IEEE Trans. Affect. Comput. 13 (Apr 2022) 666\u2013679. 10.1109\/TAFFC.2019.2944380","key":"e_1_3_3_1_10_2","DOI":"10.1109\/TAFFC.2019.2944380"},{"doi-asserted-by":"publisher","unstructured":"Yael Wasserzug Yoav Degani and Bar-Shaked. 2023. Development and validation of a machine learning-based vocal predictive model for major depressive disorder. J. Affect. Disord. 325 (Mar 2023) 627\u2013632. 10.1016\/j.jad.2022.12.117","key":"e_1_3_3_1_11_2","DOI":"10.1016\/j.jad.2022.12.117"},{"doi-asserted-by":"publisher","unstructured":"Minghao Du Shuang Liu Tao Wang and Zhang. 2023. Depression recognition using a proposed speech chain model fusing speech production and perception features. J. Affect. Disord. 323 (Feb 2023) 299\u2013308. 10.1016\/j.jad.2022.11.060","key":"e_1_3_3_1_12_2","DOI":"10.1016\/j.jad.2022.11.060"},{"doi-asserted-by":"publisher","unstructured":"Jiatong Han Hao Li Han Lin and Wu. 2023. Depression prediction based on LassoNet-RNN model: A longitudinal study. 9 (Oct 2023) e20684. 10.1016\/j.heliyon.2023.e20684","key":"e_1_3_3_1_13_2","DOI":"10.1016\/j.heliyon.2023.e20684"},{"doi-asserted-by":"publisher","unstructured":"Emna Rejaibi Ali Komaty and Meriaudeau. 2022. MFCC-based Recurrent Neural Network for automatic clinical depression recognition and assessment from speech. Biomed. Signal Process. Control 71 (Jan 2022) 103107. 10.1016\/j.bspc.2021.103107","key":"e_1_3_3_1_14_2","DOI":"10.1016\/j.bspc.2021.103107"},{"doi-asserted-by":"publisher","unstructured":"Timo Brockmeyer Dominika Kulessa and Hautzinger. 2015. Mood-incongruent processing during the recall of a sad life event predicts the course and severity of depression. 187 (Nov 2015) 91\u201396. 10.1016\/j.jad.2015.08.010","key":"e_1_3_3_1_15_2","DOI":"10.1016\/j.jad.2015.08.010"},{"doi-asserted-by":"publisher","unstructured":"Wenju Yang Jiankang Liu and Cao. 2023. Attention guided learnable time-domain filterbanks for speech depression detection. Neural Netw. 165 (Aug 2023) 135\u2013149. 10.1145\/2988257.2988267","key":"e_1_3_3_1_16_2","DOI":"10.1145\/2988257.2988267"},{"doi-asserted-by":"publisher","unstructured":"Lang He and Cui Cao. 2018. Automated depression analysis using convolutional neural networks from speech. J. Biomed. Inform. 83 (Jul 2018) 103\u2013111. 10.1016\/j.jbi.2018.05.007","key":"e_1_3_3_1_17_2","DOI":"10.1016\/j.jbi.2018.05.007"},{"doi-asserted-by":"publisher","unstructured":"Siyang Song Shashank Jaiswal and Shen. 2022. Spectral representation of behaviour primitives for depression analysis. IEEE Trans. Affect. Comput. 13 (Apr 2022) 829\u2013844. 10.1109\/TAFFC.2020.2970712","key":"e_1_3_3_1_18_2","DOI":"10.1109\/TAFFC.2020.2970712"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_19_2","DOI":"10.1145\/2988257.2988267"},{"doi-asserted-by":"publisher","unstructured":"Sara Sardari Bahareh Nakisa and Rastgoo. 2022. Audio based depression detection using Convolutional Autoencoder. Expert Syst. Appl. 189 (Mar 2022) 116076. 10.1016\/j.eswa.2021.116076","key":"e_1_3_3_1_20_2","DOI":"10.1016\/j.eswa.2021.116076"},{"doi-asserted-by":"publisher","unstructured":"Arnab\u00a0Kumar Das and Ruchira Naskar. 2024. A deep learning model for depression detection based on MFCC and CNN generated spectrogram features. Biomed. Signal Process. Control 90 (Apr 2024) 105898. 10.1016\/j.bspc.2023.105898","key":"e_1_3_3_1_21_2","DOI":"10.1016\/j.bspc.2023.105898"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_22_2","DOI":"10.48550\/arXiv.1801.04381"},{"doi-asserted-by":"publisher","unstructured":"Tao Zhang Guoqing Feng and Liang. 2021. Acoustic scene classification based on Mel spectrogram decomposition and model merging. Appl. Acoust. 182 (Nov 2021) 108258. 10.1016\/j.apacoust.2021.108258","key":"e_1_3_3_1_23_2","DOI":"10.1016\/j.apacoust.2021.108258"},{"doi-asserted-by":"publisher","unstructured":"Shahid Ismail Basit Ismail and Siddiqi. 2023. PCG classification through spectrogram using transfer learning. Biomed. Signal Process. Control 79 (Jan 2023) 104075. 10.1016\/j.bspc.2022.104075","key":"e_1_3_3_1_24_2","DOI":"10.1016\/j.bspc.2022.104075"},{"doi-asserted-by":"publisher","unstructured":"Dimitris Bertsimas and John Tsitsiklis. 1993. Simulated Annealing. Stat. Sci. 8 (Feb 1993) 10\u201315. 10.1214\/ss\/1177011077","key":"e_1_3_3_1_25_2","DOI":"10.1214\/ss\/1177011077"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_26_2","DOI":"10.1109\/ICASSP43922.2022.9746569"},{"doi-asserted-by":"publisher","unstructured":"Hanshu Cai Zhenqin Yuan and Gao. 2022. A multi-modal open dataset for mental-disorder analysis. Sci. Data 9 (Apr 2022) 178. 10.1038\/s41597-022-01211-x","key":"e_1_3_3_1_27_2","DOI":"10.1038\/s41597-022-01211-x"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_28_2","DOI":"10.1145\/3347320.3357688"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_29_2","DOI":"10.23919\/EUSIPCO58844.2023.10289973"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_30_2","DOI":"10.1109\/ICASSP48485.2024.10446253"}],"event":{"acronym":"ICCPR 2024","name":"ICCPR 2024: 2024 13th International Conference on Computing and Pattern Recognition","location":"Tianjin China"},"container-title":["Proceedings of the 2024 13th International Conference on Computing and Pattern Recognition"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3704323.3704375","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3704323.3704375","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:05Z","timestamp":1750295885000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3704323.3704375"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,25]]},"references-count":29,"alternative-id":["10.1145\/3704323.3704375","10.1145\/3704323"],"URL":"https:\/\/doi.org\/10.1145\/3704323.3704375","relation":{},"subject":[],"published":{"date-parts":[[2024,10,25]]},"assertion":[{"value":"2025-01-07","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}