{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,3]],"date-time":"2025-07-03T04:22:04Z","timestamp":1751516524879,"version":"3.41.0"},"publisher-location":"Cham","reference-count":46,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030780913"},{"type":"electronic","value":"9783030780920"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-78092-0_43","type":"book-chapter","created":{"date-parts":[[2021,7,2]],"date-time":"2021-07-02T23:20:19Z","timestamp":1625268019000},"page":"617-629","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Supervised Contrastive Learning for\u00a0Game-Play Frustration Detection from Speech"],"prefix":"10.1007","author":[{"given":"Meishu","family":"Song","sequence":"first","affiliation":[]},{"given":"Emilia","family":"Parada-Cabaleiro","sequence":"additional","affiliation":[]},{"given":"Shuo","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Manuel","family":"Milling","sequence":"additional","affiliation":[]},{"given":"Alice","family":"Baird","sequence":"additional","affiliation":[]},{"given":"Zijiang","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Bj\u00f6rn W.","family":"Schuller","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,7,3]]},"reference":[{"issue":"6356","key":"43_CR1","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1038\/355161a0","volume":"355","author":"S Becker","year":"1992","unstructured":"Becker, S., Hinton, G.E.: Self-organizing neural network that discovers surfaces in random-dot stereograms. Nature 355(6356), 161\u2013163 (1992)","journal-title":"Nature"},{"key":"43_CR2","unstructured":"Bevan, N.: What is the difference between the purpose of usability and user experience evaluation methods. In: Proceedings of the Workshop UXEM, pp. 1\u20134. Uppsala, Sweden (2009)"},{"key":"43_CR3","unstructured":"Byrd, D., McLaughlin, M., Khurana, S., Landes, M., Ucar, T.: Chimp: Children interacting with machines project"},{"key":"43_CR4","unstructured":"Ceylan, C., Gutmann, M.U.: Conditional noise-contrastive estimation of unnormalised models. In: Proceedings of the International Conference on Machine Learning, pp. 726\u2013734. Vienna, Austria (2018)"},{"key":"43_CR5","unstructured":"Chen, T., Kornblith, S., Norouzi, M., Hinton, G.: A simple framework for contrastive learning of visual representations. In: Proceedings of the International Conference on Machine Learning, pp. 1597\u20131607. Virtual (2020)"},{"key":"43_CR6","doi-asserted-by":"crossref","unstructured":"Chopra, S., Hadsell, R., LeCun, Y.: Learning a similarity metric discriminatively, with application to face verification. In: Proceedings of the Computer Society Conference on Computer Vision and Pattern Recognition. vol. 1, pp. 539\u2013546. San Diego, USA (2005)","DOI":"10.1109\/CVPR.2005.202"},{"issue":"2","key":"43_CR7","doi-asserted-by":"publisher","first-page":"152","DOI":"10.1007\/s40593-017-0152-1","volume":"28","author":"JA DeFalco","year":"2018","unstructured":"DeFalco, J.A., Rowe, J.P., Paquette, L., Georgoulas-Sherry, V., Brawner, K., Mott, B.W., Baker, R.S., Lester, J.C.: Detecting and addressing frustration in a serious game for military training. Int. J. Artif. Intell. Educ. 28(2), 152\u2013193 (2018)","journal-title":"Int. J. Artif. Intell. Educ."},{"key":"43_CR8","unstructured":"Ekman, P., Keltner, D.: Universal facial expressions of emotion. In: Segerstrale U, P. Molnar, P., (eds.) Nonverbal communication: Where nature meets culture vol. 54 no. 2, pp. 27\u201346 (1997)"},{"key":"43_CR9","doi-asserted-by":"crossref","unstructured":"Franz, O., Drewitz, U., Ihme, K.: Facing driver frustration: towards real-time in-vehicle frustration estimation based on video streams of the face. In: Proceedings of the International Conference on Human-Computer Interaction, pp. 349\u2013356. Virtual (2020)","DOI":"10.1007\/978-3-030-50732-9_46"},{"key":"43_CR10","unstructured":"Goetsu, S., Sakai, T.: Different types of voice user interface failures may cause different degrees of frustration. arXiv preprint arXiv:2002.03582 (2020)"},{"key":"43_CR11","doi-asserted-by":"crossref","unstructured":"Grafsgaard, J.F., Wiggins, J.B., Boyer, K.E., Wiebe, E.N., Lester, J.C.: Automatically recognizing facial indicators of frustration: a learning-centric analysis. In: Proceedings of the Humaine Association Conference on Affective Computing and Intelligent Interaction, pp. 159\u2013165. Geneva, Switzerland (2013)","DOI":"10.1109\/ACII.2013.33"},{"key":"43_CR12","doi-asserted-by":"crossref","unstructured":"Grafsgaard, J.F., Wiggins, J.B., Vail, A.K., Boyer, K.E., Wiebe, E.N., Lester, J.C.: The additive value of multimodal features for predicting engagement, frustration, and learning during tutoring. In: Proc. International Conference on Multimodal Interaction, pp. 42\u201349. Istanbul, Turkey (2014)","DOI":"10.1145\/2663204.2663264"},{"key":"43_CR13","doi-asserted-by":"crossref","unstructured":"Grewe, L., Hu, C.: Ulearn: understanding and reacting to student frustration using deep learning, mobile vision and nlp. In: Proceedings of the Signal Processing, Sensor\/Information Fusion, and Target Recognition XXVIII. p. 110. Maryland, USA (2019)","DOI":"10.1117\/12.2518262"},{"key":"43_CR14","unstructured":"Gutmann, M., Hyv\u00e4rinen, A.: Noise-contrastive estimation: a new estimation principle for unnormalized statistical models. In: Proceedings of the International Conference on Artificial Intelligence and Statistics, pp. 297\u2013304. Sardinia, Italy (2010)"},{"key":"43_CR15","doi-asserted-by":"crossref","unstructured":"Hadsell, R., Chopra, S., LeCun, Y.: Dimensionality reduction by learning an invariant mapping. In: Proceedings of the Computer Society Conference on Computer Vision and Pattern Recognition, pp. 1735\u20131742. New York, USA (2006)","DOI":"10.1109\/CVPR.2006.100"},{"issue":"4","key":"43_CR16","doi-asserted-by":"publisher","first-page":"130","DOI":"10.1109\/MSP.2017.2699039","volume":"34","author":"JH Hansen","year":"2017","unstructured":"Hansen, J.H., Busso, C., Zheng, Y., Sathyanarayana, A.: Driver modeling for detection and assessment of driver distraction: examples from the utdrive test bed. IEEE Signal Process. Mag. 34(4), 130\u2013142 (2017)","journal-title":"IEEE Signal Process. Mag."},{"key":"43_CR17","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the Computer Vision and Pattern Recognition, pp. 770\u2013778. Las Vegas, USA (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"43_CR18","doi-asserted-by":"crossref","unstructured":"Henderson, N.L., Rowe, J.P., Mott, B.W., Brawner, K., Baker, R., Lester, J.C.: 4d affect detection: improving frustration detection in game-based learning with posture-based temporal data fusion. In: Proceedings of the Artificial Intelligence in Education, pp. 144\u2013156. Beijing, China (2019)","DOI":"10.1007\/978-3-030-23204-7_13"},{"key":"43_CR19","unstructured":"Hertzum, M.: Frustration: a common user experience. DHRS2010 p. 11 (2010)"},{"key":"43_CR20","unstructured":"Hjelm, R.D., Fedorov, A., Lavoie-Marchildon, S., Grewal, K., Bachman, P., Trischler, A., Bengio, Y.: Learning deep representations by mutual information estimation and maximization. arXiv preprint arXiv:1808.06670 (2018)"},{"key":"43_CR21","unstructured":"Inoue, N., Goto, K.: Semi-supervised contrastive learning with generalized contrastive loss and its application to speaker recognition. In: Proceedings of the Asia-Pacific Signal and Information Processing Association Annual Summit and Conference, pp. 1641\u20131646. Virtual (2020)"},{"issue":"1","key":"43_CR22","doi-asserted-by":"publisher","first-page":"2","DOI":"10.3390\/technologies9010002","volume":"9","author":"A Jaiswal","year":"2021","unstructured":"Jaiswal, A., Babu, A.R., Zadeh, M.Z., Banerjee, D., Makedon, F.: A survey on contrastive self-supervised learning. Technologies 9(1), 2 (2021)","journal-title":"Technologies"},{"key":"43_CR23","unstructured":"Khosla, P., et al.: Supervised contrastive learning. arXiv preprint arXiv:2004.11362 (2020)"},{"key":"43_CR24","doi-asserted-by":"crossref","unstructured":"Le-Khac, P.H., Healy, G., Smeaton, A.F.: Contrastive representation learning: a framework and review. IEEE Access (2020)","DOI":"10.1109\/ACCESS.2020.3031549"},{"key":"43_CR25","unstructured":"Macary, M., Tahon, M., Est\u00e8ve, Y., Rousseau, A.: Allosat: a new call center French corpus for satisfaction and frustration analysis. In: Proceedings of the Language Resources and Evaluation Conference, pp. 1590\u20131597. Virtual (2020)"},{"issue":"1","key":"43_CR26","doi-asserted-by":"publisher","first-page":"109","DOI":"10.1109\/TITS.2010.2070839","volume":"12","author":"L Malta","year":"2010","unstructured":"Malta, L., Miyajima, C., Kitaoka, N., Takeda, K.: Analysis of real-world driver\u2019s frustration. IEEE Trans. Intell. Transp. Syst. 12(1), 109\u2013118 (2010)","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"43_CR27","unstructured":"Mnih, A., Teh, Y.W.: A fast and simple algorithm for training neural probabilistic language models. arXiv preprint arXiv:1206.6426 (2012)"},{"key":"43_CR28","doi-asserted-by":"crossref","unstructured":"Oehl, M., Ihme, K., Drewitz, U., Pape, A.A., Cornelsen, S., Schramm, M.: Towards a frustration-aware assistant for increased in-vehicle UX: F-RELACS. In: Proceedings of the Automotive User Interfaces and Interactive Vehicular Applications, pp. 260\u2013264. Utrecht, Netherlands (2019)","DOI":"10.1145\/3349263.3351518"},{"key":"43_CR29","doi-asserted-by":"crossref","unstructured":"Oh Song, H., Xiang, Y., Jegelka, S., Savarese, S.: Deep metric learning via lifted structured feature embedding. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 4004\u20134012 (2016)","DOI":"10.1109\/CVPR.2016.434"},{"issue":"1","key":"43_CR30","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1007\/s10772-020-09675-1","volume":"23","author":"E Parada-Cabaleiro","year":"2020","unstructured":"Parada-Cabaleiro, E., Batliner, A., Baird, A., Schuller, B.: The perception of emotional cues by children in artificial background noise. Int. J. Speech Technol. 23(1), 169\u2013182 (2020). https:\/\/doi.org\/10.1007\/s10772-020-09675-1","journal-title":"Int. J. Speech Technol."},{"key":"43_CR31","doi-asserted-by":"publisher","first-page":"341","DOI":"10.1007\/s10579-019-09450-y","volume":"54","author":"E Parada-Cabaleiro","year":"2020","unstructured":"Parada-Cabaleiro, E., Costantini, G., Batliner, A., Schmitt, M., Schuller, B.W.: DEMoS: an Italian emotional speech corpus: elicitation methods, machine learning, and perception. Lang. Resour. Eval. 54, 341\u2013383 (2020)","journal-title":"Lang. Resour. Eval."},{"key":"43_CR32","unstructured":"Paszke, A., et al.: Automatic differentiation in PyTorch. In: NIPS-W (2017)"},{"key":"43_CR33","volume-title":"Computational paralinguistics: emotion, affect and personality in speech and language processing","author":"B Schuller","year":"2014","unstructured":"Schuller, B., Batliner, A.: Computational paralinguistics: emotion, affect and personality in speech and language processing. Wiley, Sussex, UK (2014)"},{"key":"43_CR34","doi-asserted-by":"crossref","unstructured":"Shoumy, N.J., Ang, L.M., Seng, K.P., Rahaman, D.M., Zia, T.: Multimodal big data affective analytics: a comprehensive survey using text, audio, visual and physiological signals. J. Netw. Comput. Appl. 149, 102447 (2020)","DOI":"10.1016\/j.jnca.2019.102447"},{"key":"43_CR35","unstructured":"Song, M., et al.: Frustration recognition from speech during game interaction using wide residual networks. Virtual Reality & Intelligent Hardware 10, (2020)"},{"key":"43_CR36","doi-asserted-by":"crossref","unstructured":"Song, M., et al.: Predicting group work performance from physical handwriting features in a smart English classroom. In: Proceedings of the International Conference on Digital Signal Processing (ICDSP). Chengdu, China (2021)","DOI":"10.1145\/3458380.3458404"},{"key":"43_CR37","doi-asserted-by":"crossref","unstructured":"Song, M., et al.: Audiovisual analysis for recognising frustration during game-play: introducing the multimodal game frustration database. In: Proceedings of the Affective Computing and Intelligent Interaction, pp. 517\u2013523. Cambridge, the UK (2019)","DOI":"10.1109\/ACII.2019.8925464"},{"key":"43_CR38","unstructured":"Tian, Y., Sun, C., Poole, B., Krishnan, D., Schmid, C., Isola, P.: What makes for good views for contrastive learning. arXiv preprint arXiv:2005.10243 (2020)"},{"key":"43_CR39","doi-asserted-by":"publisher","first-page":"1454","DOI":"10.3389\/fpsyg.2017.01454","volume":"8","author":"CM Tyng","year":"2017","unstructured":"Tyng, C.M., Amin, H.U., Saad, M.N., Malik, A.S.: The influences of emotion on learning and memory. Front. Psychol. 8, 1454 (2017)","journal-title":"Front. Psychol."},{"key":"43_CR40","doi-asserted-by":"crossref","unstructured":"Valdez, M.G., Hern\u00e1ndez-\u00c1guila, A., Guerv\u00f3s, J.J.M., Soto, A.M.: Enhancing student engagement via reduction of frustration with programming assignments using machine learning. In: Proceedings of the International Joint Conference on Computational Intelligence, pp. 297\u2013304. Funchal, Portugal (2017)","DOI":"10.5220\/0006502102970304"},{"issue":"4","key":"43_CR41","doi-asserted-by":"publisher","first-page":"625","DOI":"10.1037\/a0033413","volume":"60","author":"M Wei","year":"2013","unstructured":"Wei, M., Su, J.C., Carrera, S., Lin, S.P., Yi, F.: Suppression and interpersonal harmony: a cross-cultural comparison between chinese and european americans. J. Couns. Psychol. 60(4), 625 (2013)","journal-title":"J. Couns. Psychol."},{"key":"43_CR42","unstructured":"Xiao, T., Wang, X., Efros, A.A., Darrell, T.: What should not be contrastive in contrastive learning. arXiv preprint arXiv:2008.05659 (2020)"},{"key":"43_CR43","doi-asserted-by":"crossref","unstructured":"Zepf, S., Stracke, T., Schmitt, A., van de Camp, F., Beyerer, J.: Towards real-time detection and mitigation of driver frustration using SVM. In: Proceedings of the Machine Learning and Applications, pp. 202\u2013209. Florida, USA (2019)","DOI":"10.1109\/ICMLA.2019.00039"},{"key":"43_CR44","unstructured":"Zhang, M., Ihme, K., Drewitz, U.: Discriminating drivers\u2019 fear and frustration through the dimension of power. In: Proceedings of the Humanist Conference, p. 98. Hague, Netherlands (2018)"},{"key":"43_CR45","unstructured":"Zhang, Z., Sabuncu, M.R.: Generalized cross entropy loss for training deep neural networks with noisy labels. arXiv preprint arXiv:1805.07836 (2018)"},{"key":"43_CR46","unstructured":"Zweig, G., Burges, C.J.: The microsoft research sentence completion challenge. Microsoft Research, Redmond, WA, USA, Technical report. MSR-TR-2011-129 (2011)"}],"container-title":["Lecture Notes in Computer Science","Universal Access in Human-Computer Interaction. Design Methods and User Experience"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-78092-0_43","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,2]],"date-time":"2025-07-02T22:30:25Z","timestamp":1751495425000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-78092-0_43"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030780913","9783030780920"],"references-count":46,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-78092-0_43","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"3 July 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"HCII","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Human-Computer Interaction","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24 July 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 July 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"hcii2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/2021.hci.international\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}