{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,15]],"date-time":"2026-04-15T20:43:29Z","timestamp":1776285809873,"version":"3.50.1"},"reference-count":50,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,7,1]],"date-time":"2019-07-01T00:00:00Z","timestamp":1561939200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2019,7,1]],"date-time":"2019-07-01T00:00:00Z","timestamp":1561939200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,7,1]],"date-time":"2019-07-01T00:00:00Z","timestamp":1561939200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,7]]},"DOI":"10.1109\/ijcnn.2019.8852330","type":"proceedings-article","created":{"date-parts":[[2019,10,1]],"date-time":"2019-10-01T03:44:32Z","timestamp":1569901472000},"page":"1-7","source":"Crossref","is-referenced-by-count":18,"title":["Audio-based Recognition of Bipolar Disorder Utilising Capsule Networks"],"prefix":"10.1109","author":[{"given":"Shahin","family":"Amiriparian","sequence":"first","affiliation":[]},{"given":"Arsany","family":"Awad","sequence":"additional","affiliation":[]},{"given":"Maurice","family":"Gerczuk","sequence":"additional","affiliation":[]},{"given":"Lukas","family":"Stappen","sequence":"additional","affiliation":[]},{"given":"Alice","family":"Baird","sequence":"additional","affiliation":[]},{"given":"Sandra","family":"Ottl","sequence":"additional","affiliation":[]},{"given":"Bjorn","family":"Schuller","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","first-page":"1871","article-title":"LIBLINEAR: A library for large linear classification","volume":"9","author":"fan","year":"2008","journal-title":"Journal of Machine Learning Research"},{"key":"ref38","first-page":"1929","article-title":"Dropout: A simple way to prevent neural networks from overfitting","volume":"15","author":"srivastava","year":"2014","journal-title":"Journal of Machine Learning Research"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123371"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ACII.2017.8273622"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2018.8489416"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ACIIW.2017.8272618"},{"key":"ref37","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"2014","journal-title":"Proceedings of the 3rd International Conference on Learning Representations"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.50"},{"key":"ref35","first-page":"3371","article-title":"Stacked denoising autoencoders: Learning useful representations in a deep network with a local denoising criterion","volume":"11","author":"vincent","year":"2010","journal-title":"Journal of Machine Learning Research"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-35289-8_32"},{"key":"ref28","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-730"},{"key":"ref2","article-title":"Mental disorders affect one in four people","year":"2001"},{"key":"ref1","first-page":"168","article-title":"Lifetime prevalence and age-of-onset distributions of mental disorders in the world health organization&#x2019;s world mental health survey initiative","volume":"6","author":"kessler","year":"2007","journal-title":"World Psychiatry"},{"key":"ref20","article-title":"Polyphonic sound event detection by using capsule neural network","author":"vesperini","year":"2018"},{"key":"ref22","first-page":"17","article-title":"Sequence to sequence autoencoders for unsupervised representation learning from audio","author":"amiriparian","year":"2017","journal-title":"Proceedings of the 2nd Detection and Classification of Acoustic Scenes and Events 2017 Workshop (DCASE 2017)"},{"key":"ref21","year":"2013","journal-title":"Diagnostic Criteria and Codes"},{"key":"ref24","first-page":"44","article-title":"Transforming auto- encoders","volume":"6791","author":"hinton","year":"2011","journal-title":"International Conference on Artificial Neural Networks"},{"key":"ref23","first-page":"1","article-title":"audeep: Unsupervised learning of representations from audio with deep recurrent neural networks","volume":"18","author":"freitag","year":"2018","journal-title":"Journal of Machine Learning Research"},{"key":"ref26","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in Neural Information Processing Systems 25"},{"key":"ref25","first-page":"807","article-title":"Rectified linear units improve restricted boltzmann machines","author":"nair","year":"2010","journal-title":"Proceedings of the 27th International Conference on Machine Learning (ICML-10)"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/EUSIPCO.2016.7760424"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1159\/000470803"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1111\/j.1399-5618.2007.00484.x"},{"key":"ref40","first-page":"2825","article-title":"Scikit-learn: Machine learning in Python","volume":"12","author":"pedregosa","year":"2011","journal-title":"Journal of Machine Learning Research"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1192\/bjp.bp.110.086983"},{"key":"ref13","first-page":"1","article-title":"The turkish audio-visual bipolar disorder corpus","author":"\u00e7ift\u00e7i","year":"2018","journal-title":"2018 First Asian Conference on Affective Computing and Intelligent Interaction (ACII Asia)"},{"key":"ref14","first-page":"3370","article-title":"Openxbow: introducing the passau open- source crossmodal bag-of-words toolkit","volume":"18","author":"schmitt","year":"2017","journal-title":"The Journal of Machine Learning Research"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2017-434"},{"key":"ref16","article-title":"Dynamic routing between capsules","author":"sabour","year":"2017","journal-title":"CoRR"},{"key":"ref17","article-title":"Introducing capsule networks","author":"g\u00e9ron","year":"0"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2018.8451379"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1013"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3266302.3266316"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1176\/ajp.155.5.646"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1176\/ps.39.6.652"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/S0006-3223(00)00909-4"},{"key":"ref8","article-title":"3: burden of disease in dalys by cause, sex and mortality stratum in who regions, estimates for 2002","author":"table","year":"2004","journal-title":"The World Health Report"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"1635","DOI":"10.1176\/ajp.152.11.1635","article-title":"Relapse and impairment in bipolar disorder","volume":"152","author":"gitlin","year":"1995","journal-title":"The American Journal of Psychiatry"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2017.7966293"},{"key":"ref9","first-page":"227","article-title":"Treatment-resistant bipolar disorder","volume":"11","author":"gitlin","year":"2007","journal-title":"FOCUS"},{"key":"ref46","first-page":"11","article-title":"are you playing a shooter again?!&#x201D; deep representation learning for audio-based video game genre recognition","author":"amiriparian","year":"2018","journal-title":"IEEE Transactions on Games"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-1772"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472669"},{"key":"ref47","article-title":"Matrix capsules with em routing","author":"hinton","year":"2018"},{"key":"ref42","article-title":"Recurrent neural network based language model","author":"mikolov","year":"2010","journal-title":"Eleventh Annual Conference of the International Speech Communication Association"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638947"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2018-51"},{"key":"ref43","article-title":"Long short-term memory recurrent neural network architectures for large scale acoustic modeling","author":"sak","year":"2014","journal-title":"Fifteenth Annual Conference of the International Speech Communication Association"}],"event":{"name":"2019 International Joint Conference on Neural Networks (IJCNN)","location":"Budapest, Hungary","start":{"date-parts":[[2019,7,14]]},"end":{"date-parts":[[2019,7,19]]}},"container-title":["2019 International Joint Conference on Neural Networks (IJCNN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8840768\/8851681\/08852330.pdf?arnumber=8852330","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,17]],"date-time":"2022-07-17T21:53:45Z","timestamp":1658094825000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8852330\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,7]]},"references-count":50,"URL":"https:\/\/doi.org\/10.1109\/ijcnn.2019.8852330","relation":{},"subject":[],"published":{"date-parts":[[2019,7]]}}}