{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,17]],"date-time":"2026-06-17T22:22:12Z","timestamp":1781734932736,"version":"3.54.5"},"reference-count":60,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,8,21]],"date-time":"2022-08-21T00:00:00Z","timestamp":1661040000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,8,21]],"date-time":"2022-08-21T00:00:00Z","timestamp":1661040000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,8,21]]},"DOI":"10.1109\/icpr56361.2022.9956027","type":"proceedings-article","created":{"date-parts":[[2022,11,29]],"date-time":"2022-11-29T19:34:13Z","timestamp":1669750453000},"page":"2605-2612","source":"Crossref","is-referenced-by-count":41,"title":["Transformer-Based Self-Supervised Learning for Emotion Recognition"],"prefix":"10.1109","author":[{"given":"Juan","family":"Vazquez-Rodriguez","sequence":"first","affiliation":[{"name":"Orange Labs,Grenoble,France"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Gregoire","family":"Lefebvre","sequence":"additional","affiliation":[{"name":"Orange Labs,Grenoble,France"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Julien","family":"Cumin","sequence":"additional","affiliation":[{"name":"Orange Labs,Grenoble,France"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"James L.","family":"Crowley","sequence":"additional","affiliation":[{"name":"Univ. Grenoble Alpes,CNRS, Inria, Grenoble INP, LIG,Grenoble,France"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/3475957.3484454"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053762"},{"key":"ref33","first-page":"1","article-title":"Utilizing Deep Learning Towards Multi-modal Bio-sensing and Vision-based Affective Computing","author":"siddharth","year":"2019","journal-title":"IEEE Transactions on Affective Computing"},{"key":"ref32","first-page":"1","article-title":"A Bayesian Deep Learning Framework for End-To-End Prediction of Emotion from Heartbeat","author":"harper","year":"2020","journal-title":"IEEE Transactions on Affective Computing"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.3390\/s20030718"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2017.2781732"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ACII.2019.8925497"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1656"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2005.12.126"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1121\/1.2133000"},{"key":"ref60","first-page":"1437","article-title":"BOHB: Robust and Efficient Hyperparameter Optimization at Scale","author":"falkner","year":"2018","journal-title":"Proceedings of the 35th International Conference on Machine Learning"},{"key":"ref28","article-title":"An Inter-domain Study for Arousal Recognition from Physiological Signals","volume":"42","author":"gjoreski","year":"2018","journal-title":"Informatica"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3462244.3479955"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/s40846-019-00505-7"},{"key":"ref2","article-title":"Attention is All you Need","volume":"30","author":"vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref1","article-title":"Neural machine translation by jointly learning to align and translate","author":"bahdanau","year":"0"},{"key":"ref20","first-page":"1597","article-title":"A Simple Framework for Contrastive Learning of Visual Representations","author":"chen","year":"2020","journal-title":"Proceedings of the 37th International Conference on Machine Learning"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/s12652-021-03462-9"},{"key":"ref21","article-title":"Visual Transformers: Token-based Image Representation and Processing for Computer Vision","author":"wu","year":"2020"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2021.3064601"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/SLT48900.2021.9383456"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01118"},{"key":"ref25","article-title":"Self-supervised learning of a facial attribute embedding from video","author":"wiles","year":"2018"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/3447548.3467401"},{"key":"ref51","first-page":"12449","article-title":"Wav2vec 2.0: A Framework for Self-Supervised Learning of Speech Representations","volume":"33","author":"baevski","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref59","article-title":"Tune: A Research Platform for Distributed Model Selection and Training","author":"liaw","year":"2018"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.3389\/fnins.2019.01131"},{"key":"ref57","article-title":"PsPM-VIS: SCR, ECG, respiration and eyetracker measurements in a delay fear conditioning task with visual CS and electrical US","author":"xia","year":"2020"},{"key":"ref56","article-title":"PsPM-RRM12: SCR, ECG, respiration and eye tracker measurements in response to electric stimulation or visual targets","author":"bach","year":"2019"},{"key":"ref55","article-title":"PsPM-HRM5: SCR, ECG and respiration measurements in response to positive\/negative IAPS pictures, and neutral\/aversive sounds","author":"paulus","year":"2020"},{"key":"ref54","article-title":"PsPM-FR: SCR, ECG and respiration measurements in a delay fear conditioning task with visual CS and electrical US","author":"tzovara","year":"2018"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/JBHI.2017.2688239"},{"key":"ref52","article-title":"Layer Normalization","author":"ba","year":"2016"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2018.2817622"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2017.2768030"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3461615.3485411"},{"key":"ref12","first-page":"1","article-title":"Feature Extraction and Selection for Emotion Recognition from Electrodermal Activity","author":"shukla","year":"2019","journal-title":"IEEE Transactions on Affective Computing"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.3390\/s21031018"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/s11760-021-01942-1"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/T-AFFC.2011.15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TAFFC.2016.2625250"},{"key":"ref17","first-page":"1","article-title":"AMIGOS: A Dataset for Affect, Personality and Mood Research on Individuals and Groups","author":"correa","year":"2018","journal-title":"IEEE Transactions on Affective Computing"},{"key":"ref18","doi-asserted-by":"crossref","first-page":"2227","DOI":"10.18653\/v1\/N18-1202","article-title":"Deep Contextualized Word Representations","author":"peters","year":"2018","journal-title":"Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics Human Language Technologies Volume 1 (Long Papers)"},{"key":"ref19","first-page":"4171","article-title":"BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding","author":"devlin","year":"2019","journal-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics Human Language Technologies Volume 1 (Long and Short Papers)"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/BIBM47256.2019.8983326"},{"key":"ref3","article-title":"Enhancing the Locality and Breaking the Memory Bottleneck of Transformer on Time Series Forecasting","volume":"32","author":"li","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3410531.3414306"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC44109.2020.9175730"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2883213"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.3390\/s18072074"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/SLT48900.2021.9383618"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053985"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-1827"},{"key":"ref45","first-page":"201","article-title":"Why Does Unsupervised Pre-training Help Deep Learning?","author":"erhan","year":"2010","journal-title":"Proceedings of the Thirteenth International Conference on Artificial Intelligence and Statistics JMLR Workshop and Conference Proceedings"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3026823"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.214"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC46164.2021.9629837"},{"key":"ref41","article-title":"Deep Transformer Models for Time Series Forecasting: The Influenza Prevalence Case","author":"wu","year":"2020"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1145\/3460421.3480427"},{"key":"ref43","article-title":"An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale","author":"dosovitskiy","year":"2020"}],"event":{"name":"2022 26th International Conference on Pattern Recognition (ICPR)","location":"Montreal, QC, Canada","start":{"date-parts":[[2022,8,21]]},"end":{"date-parts":[[2022,8,25]]}},"container-title":["2022 26th International Conference on Pattern Recognition (ICPR)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9956007\/9955631\/09956027.pdf?arnumber=9956027","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,19]],"date-time":"2022-12-19T20:03:24Z","timestamp":1671480204000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9956027\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,8,21]]},"references-count":60,"URL":"https:\/\/doi.org\/10.1109\/icpr56361.2022.9956027","relation":{},"subject":[],"published":{"date-parts":[[2022,8,21]]}}}