{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T23:11:36Z","timestamp":1761174696404,"version":"3.40.3"},"publisher-location":"Cham","reference-count":31,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319674001"},{"type":"electronic","value":"9783319674018"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-67401-8_18","type":"book-chapter","created":{"date-parts":[[2017,8,25]],"date-time":"2017-08-25T07:13:01Z","timestamp":1503645181000},"page":"160-169","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":18,"title":["Predicting Head Pose in Dyadic Conversation"],"prefix":"10.1007","author":[{"given":"David","family":"Greenwood","sequence":"first","affiliation":[]},{"given":"Stephen","family":"Laycock","sequence":"additional","affiliation":[]},{"given":"Iain","family":"Matthews","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,8,26]]},"reference":[{"issue":"1","key":"18_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1093\/jos\/9.1.1","volume":"9","author":"J Allwood","year":"1992","unstructured":"Allwood, J., Nivre, J., Ahls\u00e9n, E.: On the semantics and pragmatics of linguistic feedback. Journal of Semantics 9(1), 1\u201326 (1992)","journal-title":"Journal of Semantics"},{"unstructured":"Bengio, Y., Laufer, E., Alain, G., Yosinski, J.: Deep generative stochastic networks trainable by backprop. In: Proceedings of The 31st International Conference on Machine Learning, pp. 226\u2013234 (2014)","key":"18_CR2"},{"issue":"1\u20132","key":"18_CR3","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1007\/s12193-012-0094-8","volume":"6","author":"E Bevacqua","year":"2012","unstructured":"Bevacqua, E., De Sevin, E., Hyniewska, S.J., Pelachaud, C.: A listener model: introducing personality traits. Journal on Multimodal User Interfaces 6(1\u20132), 27\u201338 (2012)","journal-title":"Journal on Multimodal User Interfaces"},{"doi-asserted-by":"crossref","unstructured":"Bowman, S.R., Vilnis, L., Vinyals, O., Dai, A.M., Jozefowicz, R., Bengio, S.: Generating sentences from a continuous space. In: CoNLL 2016, p. 10 (2016)","key":"18_CR4","DOI":"10.18653\/v1\/K16-1002"},{"issue":"3","key":"18_CR5","doi-asserted-by":"publisher","first-page":"1075","DOI":"10.1109\/TASL.2006.885910","volume":"15","author":"C Busso","year":"2007","unstructured":"Busso, C., Deng, Z., Grimm, M., Neumann, U., Narayanan, S.: Rigid head motion in expressive speech animation: Analysis and synthesis. IEEE Transactions on Audio, Speech, and Language Processing 15(3), 1075\u20131086 (2007)","journal-title":"IEEE Transactions on Audio, Speech, and Language Processing"},{"doi-asserted-by":"crossref","unstructured":"Cassell, J., Bickmore, T., Billinghurst, M., Campbell, L., Chang, K., Vilhj\u00e1lmsson, H., Yan, H.: Embodiment in conversational interfaces: Rea. In: Proceedings of the SIGCHI Conference on Human Factors in Computing Systems, pp. 520\u2013527. ACM (1999)","key":"18_CR6","DOI":"10.1145\/302979.303150"},{"issue":"1","key":"18_CR7","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1075\/pc.7.1.03cas","volume":"7","author":"J Cassell","year":"1999","unstructured":"Cassell, J., McNeill, D., McCullough, K.E.: Speech-gesture mismatches: Evidence for one underlying representation of linguistic and nonlinguistic information. Pragmatics & Cognition 7(1), 1\u201334 (1999)","journal-title":"Pragmatics & Cognition"},{"unstructured":"Chollet, F., et al.: Keras (2015). https:\/\/github.com\/fchollet\/keras","key":"18_CR8"},{"doi-asserted-by":"crossref","unstructured":"Deng, L., Hinton, G., Kingsbury, B.: New types of deep neural network learning for speech recognition and related applications: an overview. In: 2013 IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 8599\u20138603. IEEE (2013)","key":"18_CR9","DOI":"10.1109\/ICASSP.2013.6639344"},{"doi-asserted-by":"crossref","unstructured":"Deng, L., Li, J., Huang, J.T., Yao, K., Yu, D., Seide, F., Seltzer, M., Zweig, G., He, X., Williams, J., et al.: Recent advances in deep learning for speech research at Microsoft. In: 2013 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 8604\u20138608. IEEE (2013)","key":"18_CR10","DOI":"10.1109\/ICASSP.2013.6639345"},{"doi-asserted-by":"crossref","unstructured":"Deng, Z., Narayanan, S., Busso, C., Neumann, U.: Audio-based head motion synthesis for avatar-based telepresence systems. In: Proceedings of the 2004 ACM SIGMM Workshop on Effective Telepresence, pp. 24\u201330. ACM (2004)","key":"18_CR11","DOI":"10.1145\/1026776.1026784"},{"issue":"22","key":"18_CR12","doi-asserted-by":"publisher","first-page":"9871","DOI":"10.1007\/s11042-014-2156-2","volume":"74","author":"Chuang Ding","year":"2014","unstructured":"Ding, C., Xie, L., Zhu, P.: Head motion synthesis from speech using deep neural networks. In: Multimedia Tools and Applications, pp. 1\u201318 (2014)","journal-title":"Multimedia Tools and Applications"},{"doi-asserted-by":"crossref","unstructured":"Ding, C., Zhu, P., Xie, L.: Blstm neural networks for speech driven head motion synthesis. In: Sixteenth Annual Conference of the International Speech Communication Association (2015)","key":"18_CR13","DOI":"10.21437\/Interspeech.2015-137"},{"doi-asserted-by":"crossref","unstructured":"Gehring, J., Miao, Y., Metze, F., Waibel, A.: Extracting deep bottleneck features using stacked auto-encoders. In: 2013 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 3377\u20133381. IEEE (2013)","key":"18_CR14","DOI":"10.1109\/ICASSP.2013.6638284"},{"issue":"1","key":"18_CR15","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1007\/BF02291478","volume":"40","author":"JC Gower","year":"1975","unstructured":"Gower, J.C.: Generalized procrustes analysis. Psychometrika 40(1), 33\u201351 (1975)","journal-title":"Psychometrika"},{"unstructured":"Graves, A.: Generating sequences with recurrent neural networks. CoRR abs\/1308.0850 (2013), http:\/\/arxiv.org\/abs\/1308.0850","key":"18_CR16"},{"key":"18_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"198","DOI":"10.1007\/978-3-319-47665-0_18","volume-title":"Intelligent Virtual Agents","author":"K Haag","year":"2016","unstructured":"Haag, K., Shimodaira, H.: Bidirectional LSTM networks employing stacked bottleneck features for expressive speech-driven head motion synthesis. In: Traum, D., Swartout, W., Khooshabeh, P., Kopp, S., Scherer, S., Leuski, A. (eds.) IVA 2016. LNCS, vol. 10011, pp. 198\u2013207. Springer, Cham (2016). doi: 10.1007\/978-3-319-47665-0_18"},{"issue":"8","key":"18_CR18","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Computation 9(8), 1735\u20131780 (1997)","journal-title":"Neural Computation"},{"doi-asserted-by":"crossref","unstructured":"Huang, J.T., Li, J., Gong, Y.: An analysis of convolutional neural networks for speech recognition. In: 2015 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 4989\u20134993. IEEE (2015)","key":"18_CR19","DOI":"10.1109\/ICASSP.2015.7178920"},{"unstructured":"Kingma, D.P., Mohamed, S., Rezende, D.J., Welling, M.: Semi-supervised learning with deep generative models. In: Advances in Neural Information Processing Systems, pp. 3581\u20133589 (2014)","key":"18_CR20"},{"issue":"2","key":"18_CR21","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1023\/B:VISI.0000029666.37597.d3","volume":"60","author":"I Matthews","year":"2004","unstructured":"Matthews, I., Baker, S.: Active appearance models revisited. International Journal of Computer Vision 60(2), 135\u2013164 (2004)","journal-title":"International Journal of Computer Vision"},{"unstructured":"McNeill, D.: Hand and mind: What gestures reveal about thought. University of Chicago Press (1992)","key":"18_CR22"},{"key":"18_CR23","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"176","DOI":"10.1007\/978-3-540-85483-8_18","volume-title":"Intelligent Virtual Agents","author":"L-P Morency","year":"2008","unstructured":"Morency, L.-P., Kok, I., Gratch, J.: Predicting listener backchannels: a probabilistic multimodal approach. In: Prendinger, H., Lester, J., Ishizuka, M. (eds.) IVA 2008. LNCS, vol. 5208, pp. 176\u2013190. Springer, Heidelberg (2008). doi: 10.1007\/978-3-540-85483-8_18"},{"issue":"4","key":"18_CR24","first-page":"33","volume":"7","author":"M Mori","year":"1970","unstructured":"Mori, M.: The uncanny valley. Energy 7(4), 33\u201335 (1970)","journal-title":"Energy"},{"issue":"2","key":"18_CR25","doi-asserted-by":"publisher","first-page":"133","DOI":"10.1111\/j.0963-7214.2004.01502010.x","volume":"15","author":"KG Munhall","year":"2004","unstructured":"Munhall, K.G., Jones, J.A., Callan, D.E., Kuratate, T., Vatikiotis-Bateson, E.: Visual prosody and speech intelligibility: head movement improves auditory speech perception. Psychological Science: A Journal of the American Psychological Society \/ APS 15(2), 133\u2013137 (2004)","journal-title":"Psychological Science : A Journal of the American Psychological Society \/ APS"},{"key":"18_CR26","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"599","DOI":"10.1007\/978-3-540-74628-7_77","volume-title":"Text, Speech and Dialogue","author":"R Nishimura","year":"2007","unstructured":"Nishimura, R., Kitaoka, N., Nakagawa, S.: A spoken dialog system for chat-like conversations considering response timing. In: Matou\u0161ek, V., Mautner, P. (eds.) TSD 2007. LNCS, vol. 4629, pp. 599\u2013606. Springer, Heidelberg (2007). doi: 10.1007\/978-3-540-74628-7_77"},{"unstructured":"Rezende, D.J., Mohamed, S., Wierstra, D.: Stochastic backpropagation and approximate inference in deep generative models. In: Proceedings of The 31st International Conference on Machine Learning, pp. 1278\u20131286 (2014)","key":"18_CR27"},{"unstructured":"Sutskever, I., Vinyals, O., Le, Q.V.: Sequence to sequence learning with neural networks. In: Advances in Neural Information Processing Systems, pp. 3104\u20133112 (2014)","key":"18_CR28"},{"issue":"8","key":"18_CR29","doi-asserted-by":"publisher","first-page":"1177","DOI":"10.1016\/S0378-2166(99)00109-5","volume":"32","author":"N Ward","year":"2000","unstructured":"Ward, N., Tsukahara, W.: Prosodic features which cue back-channel responses in english and japanese. Journal of Pragmatics 32(8), 1177\u20131207 (2000)","journal-title":"Journal of Pragmatics"},{"issue":"1","key":"18_CR30","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1207\/s15327590ijhc1701_4","volume":"17","author":"T Watanabe","year":"2004","unstructured":"Watanabe, T., Okubo, M., Nakashige, M., Danbara, R.: Interactor: Speech-driven embodied interactive actor. International Journal of Human-Computer Interaction 17(1), 43\u201360 (2004)","journal-title":"International Journal of Human-Computer Interaction"},{"unstructured":"Yngve, V.H.: On getting a word in edgewise. In: Chicago Linguistics Society, 6th Meeting, pp. 567\u2013578 (1970)","key":"18_CR31"}],"container-title":["Lecture Notes in Computer Science","Intelligent Virtual Agents"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-67401-8_18","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,1]],"date-time":"2022-08-01T19:40:58Z","timestamp":1659382858000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-67401-8_18"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9783319674001","9783319674018"],"references-count":31,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-67401-8_18","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2017]]},"assertion":[{"value":"26 August 2017","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"IVA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Intelligent Virtual Agents","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Stockholm","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Sweden","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2017","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 August 2017","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"30 August 2017","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"iva2017","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.iva2017.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}