{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T16:43:57Z","timestamp":1770741837288,"version":"3.49.0"},"publisher-location":"Cham","reference-count":49,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030342548","type":"print"},{"value":"9783030342555","type":"electronic"}],"license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-3-030-34255-5_9","type":"book-chapter","created":{"date-parts":[[2019,11,6]],"date-time":"2019-11-06T00:11:49Z","timestamp":1572999109000},"page":"123-138","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Action Recognition Using Local Visual Descriptors and Inertial Data"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3673-5397","authenticated-orcid":false,"given":"Taha","family":"Alhersh","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2336-0490","authenticated-orcid":false,"given":"Samir","family":"Brahim Belhaouari","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0209-3859","authenticated-orcid":false,"given":"Heiner","family":"Stuckenschmidt","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2019,11,4]]},"reference":[{"key":"9_CR1","doi-asserted-by":"crossref","unstructured":"Abebe, G., Cavallaro, A.: Inertial-vision: cross-domain knowledge transfer for wearable sensors. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1392\u20131400 (2017)","DOI":"10.1109\/ICCVW.2017.165"},{"key":"9_CR2","doi-asserted-by":"crossref","unstructured":"Akpinar, S., Alpaslan, F.N.: Video action recognition using an optical flow based representation. In: IPCV, the Steering Committee of the World Congress in Computer Science, Computer Engineering and Applied Computing (WorldComp), p. 1 (2014)","DOI":"10.1016\/B978-0-12-802045-6.00021-1"},{"key":"9_CR3","doi-asserted-by":"crossref","unstructured":"Alhersh, T., Stuckenschmidt, H.: On the combination of IMU and optical flow for action recognition. In: 2019 IEEE International Conference on Pervasive Computing and Communications Workshops (PerCom Workshops). IEEE (2019)","DOI":"10.1109\/PERCOMW.2019.8730743"},{"key":"9_CR4","doi-asserted-by":"publisher","unstructured":"Alhersh, T., Stuckenschmidt, H.: Unsupervised fine-tuning of optical flow for better motion boundary estimation. In: Proceedings of the 14th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications, Prague, Czech Republic, 25\u201327 February 2019. VISAPP, vol. 5. pp. 776\u2013783. SciTePress, Set\u00fabal (2019). https:\/\/doi.org\/10.5220\/0007343707760783 . http:\/\/ub-madoc.bib.uni-mannheim.de\/49196\/ , online-Resource","DOI":"10.5220\/0007343707760783"},{"key":"9_CR5","unstructured":"Arabac\u0131, M.A., \u00d6zkan, F., Surer, E., Jan\u010dovi\u010d, P., Temizel, A.: Multi-modal egocentric activity recognition using audio-visual features. arXiv preprint arXiv:1807.00612 (2018)"},{"key":"9_CR6","doi-asserted-by":"crossref","unstructured":"Ashry, S., Elbasiony, R., Gomaa, W.: An LSTM-based descriptor for human activities recognition using IMU sensors. In: Proceedings of the 15th International Conference on Informatics in Control, Automation and Robotics, ICINCO, vol. 1, pp. 494\u2013501 (2018)","DOI":"10.5220\/0006902405040511"},{"issue":"12","key":"9_CR7","doi-asserted-by":"publisher","first-page":"31314","DOI":"10.3390\/s151229858","volume":"15","author":"F Attal","year":"2015","unstructured":"Attal, F., Mohammed, S., Dedabrishvili, M., Chamroukhi, F., Oukhellou, L., Amirat, Y.: Physical human activity recognition using wearable sensors. Sensors 15(12), 31314\u201331338 (2015)","journal-title":"Sensors"},{"issue":"5","key":"9_CR8","doi-asserted-by":"publisher","first-page":"744","DOI":"10.1109\/TCSVT.2015.2409731","volume":"25","author":"A Betancourt","year":"2015","unstructured":"Betancourt, A., Morerio, P., Regazzoni, C.S., Rauterberg, M.: The evolution of first person vision methods: a survey. IEEE Trans. Circuits Syst. Video Technol. 25(5), 744\u2013760 (2015)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"9_CR9","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"541","DOI":"10.1007\/978-3-030-10997-4_33","volume-title":"Machine Learning and Knowledge Discovery in Databases","author":"A Bevilacqua","year":"2019","unstructured":"Bevilacqua, A., MacDonald, K., Rangarej, A., Widjaya, V., Caulfield, B., Kechadi, T.: Human activity recognition with convolutional neural networks. In: Brefeld, U., et al. (eds.) ECML PKDD 2018. LNCS (LNAI), vol. 11053, pp. 541\u2013552. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-10997-4_33"},{"issue":"3","key":"9_CR10","doi-asserted-by":"publisher","first-page":"500","DOI":"10.1109\/TPAMI.2010.143","volume":"33","author":"T Brox","year":"2011","unstructured":"Brox, T., Malik, J.: Large displacement optical flow: descriptor matching in variational motion estimation. IEEE Trans. Pattern Anal. Mach. Intell. 33(3), 500\u2013513 (2011)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"3","key":"9_CR11","doi-asserted-by":"publisher","first-page":"4405","DOI":"10.1007\/s11042-015-3177-1","volume":"76","author":"C Chen","year":"2017","unstructured":"Chen, C., Jafari, R., Kehtarnavaz, N.: A survey of depth and inertial sensor fusion for human action recognition. Multimed. Tools Appl. 76(3), 4405\u20134425 (2017)","journal-title":"Multimed. Tools Appl."},{"issue":"3","key":"9_CR12","first-page":"273","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes, C., Vapnik, V.: Support-vector networks. Mach. Learn. 20(3), 273\u2013297 (1995)","journal-title":"Mach. Learn."},{"key":"9_CR13","doi-asserted-by":"crossref","unstructured":"Coskun, H., Tan, D.J., Conjeti, S., Navab, N., Tombari, F.: Human motion analysis with deep metric learning. arXiv preprint arXiv:1807.11176 (2018)","DOI":"10.1007\/978-3-030-01264-9_41"},{"key":"9_CR14","unstructured":"Dalal, N., Triggs, B.: Histograms of oriented gradients for human detection (2005)"},{"key":"9_CR15","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"428","DOI":"10.1007\/11744047_33","volume-title":"Computer Vision \u2013 ECCV 2006","author":"N Dalal","year":"2006","unstructured":"Dalal, N., Triggs, B., Schmid, C.: Human detection using oriented histograms of flow and appearance. In: Leonardis, A., Bischof, H., Pinz, A. (eds.) ECCV 2006. LNCS, vol. 3952, pp. 428\u2013441. Springer, Heidelberg (2006). https:\/\/doi.org\/10.1007\/11744047_33"},{"issue":"1","key":"9_CR16","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1109\/5.554206","volume":"85","author":"BV Dasarathy","year":"1997","unstructured":"Dasarathy, B.V.: Sensor fusion potential exploitation-innovative architectures and illustrative applications. Proc. IEEE 85(1), 24\u201338 (1997)","journal-title":"Proc. IEEE"},{"issue":"6","key":"9_CR17","doi-asserted-by":"publisher","first-page":"1287","DOI":"10.3390\/s17061287","volume":"17","author":"JC Davila","year":"2017","unstructured":"Davila, J.C., Cretu, A.M., Zaremba, M.: Wearable sensor data classification for human activity recognition based on an iterative learning framework. Sensors 17(6), 1287 (2017)","journal-title":"Sensors"},{"key":"9_CR18","doi-asserted-by":"crossref","unstructured":"Dosovitskiy, A., et al.: FlowNet: learning optical flow with convolutional networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2758\u20132766 (2015)","DOI":"10.1109\/ICCV.2015.316"},{"key":"9_CR19","unstructured":"Elmenreich, W.: An introduction to sensor fusion. Vienna University of Technology, Austria 502 (2002)"},{"key":"9_CR20","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.cviu.2015.02.008","volume":"134","author":"D Fortun","year":"2015","unstructured":"Fortun, D., Bouthemy, P., Kervrann, C.: Optical flow modeling and computation: a survey. Comput. Vis. Image Underst. 134, 1\u201321 (2015)","journal-title":"Comput. Vis. Image Underst."},{"issue":"1\u20133","key":"9_CR21","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1016\/0004-3702(81)90024-2","volume":"17","author":"BK Horn","year":"1981","unstructured":"Horn, B.K., Schunck, B.G.: Determining optical flow. Artif. Intell. 17(1\u20133), 185\u2013203 (1981)","journal-title":"Artif. Intell."},{"key":"9_CR22","doi-asserted-by":"publisher","first-page":"504","DOI":"10.1016\/j.patcog.2017.07.013","volume":"72","author":"EP Ijjina","year":"2017","unstructured":"Ijjina, E.P., Chalavadi, K.M.: Human action recognition in RGB-D videos using motion sequence information and deep learning. Pattern Recogn. 72, 504\u2013516 (2017)","journal-title":"Pattern Recogn."},{"issue":"4","key":"9_CR23","doi-asserted-by":"publisher","first-page":"989","DOI":"10.1109\/JBHI.2017.2762404","volume":"22","author":"N Jalloul","year":"2018","unstructured":"Jalloul, N., Por\u00e9e, F., Viardot, G., LHostis, P., Carrault, G.: Activity recognition using complex network analysis. IEEE J. Biomed. Health Inform. 22(4), 989\u20131000 (2018)","journal-title":"IEEE J. Biomed. Health Inform."},{"key":"9_CR24","doi-asserted-by":"crossref","unstructured":"Kumar, S.S., John, M.: Human activity recognition using optical flow based feature set. In: 2016 IEEE International Carnahan Conference on Security Technology (ICCST), pp. 1\u20135. IEEE (2016)","DOI":"10.1109\/CCST.2016.7815694"},{"key":"9_CR25","doi-asserted-by":"crossref","unstructured":"Lu, Y., Velipasalar, S.: Human activity classification incorporating egocentric video and inertial measurement unit data. In: 2018 IEEE Global Conference on Signal and Information Processing (GlobalSIP), pp. 429\u2013433. IEEE (2018)","DOI":"10.1109\/GlobalSIP.2018.8646367"},{"key":"9_CR26","unstructured":"Moutinho, N.M.B.: Video and image match searching, US Patent App. 15\/252,142, 2 March 2017"},{"key":"9_CR27","doi-asserted-by":"crossref","unstructured":"Moya Rueda, F., Grzeszick, R., Fink, G., Feldhorst, S., ten Hompel, M.: Convolutional neural networks for human activity recognition using body-worn sensors. In: Informatics, vol. 5, p. 26. Multidisciplinary Digital Publishing Institute (2018)","DOI":"10.3390\/informatics5020026"},{"issue":"1","key":"9_CR28","doi-asserted-by":"publisher","first-page":"72","DOI":"10.3390\/s16010072","volume":"16","author":"THC Nguyen","year":"2016","unstructured":"Nguyen, T.H.C., Nebel, J.C., Florez-Revuelta, F., et al.: Recognition of activities of daily living with egocentric vision: a review. Sensors 16(1), 72 (2016)","journal-title":"Sensors"},{"issue":"15","key":"9_CR29","doi-asserted-by":"publisher","first-page":"209","DOI":"10.3182\/20070903-3-FR-2921.00038","volume":"40","author":"H Romero","year":"2007","unstructured":"Romero, H., Salazar, S., Lozano, R., Benosman, R.: Fusion of optical flow and inertial sensors for four-rotor rotorcraft stabilization. IFAC Proc. Vol. 40(15), 209\u2013214 (2007)","journal-title":"IFAC Proc. Vol."},{"key":"9_CR30","unstructured":"Sabour, S., Frosst, N., Hinton, G.E.: Dynamic routing between capsules. In: Advances in Neural Information Processing Systems, pp. 3856\u20133866 (2017)"},{"key":"9_CR31","unstructured":"Sevilla-Lara, L., Liao, Y., Guney, F., Jampani, V., Geiger, A., Black, M.J.: On the integration of optical flow and action recognition. arXiv preprint arXiv:1712.08416 (2017)"},{"key":"9_CR32","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556 (2014)"},{"key":"9_CR33","doi-asserted-by":"crossref","unstructured":"Singh, S., Arora, C., Jawahar, C.: First person action recognition using deep learned descriptors. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2620\u20132628 (2016)","DOI":"10.1109\/CVPR.2016.287"},{"key":"9_CR34","doi-asserted-by":"publisher","first-page":"82","DOI":"10.1016\/j.cviu.2016.08.012","volume":"154","author":"S Stein","year":"2017","unstructured":"Stein, S., McKenna, S.J.: Recognising complex activities with histograms of relative tracklets. Comput. Vis. Image Underst. 154, 82\u201393 (2017)","journal-title":"Comput. Vis. Image Underst."},{"key":"9_CR35","doi-asserted-by":"crossref","unstructured":"Sudhakaran, S., Escalera, S., Lanz, O.: Hierarchical feature aggregation networks for video action recognition. arXiv preprint arXiv:1905.12462 (2019)","DOI":"10.1109\/CVPR42600.2020.00118"},{"key":"9_CR36","doi-asserted-by":"crossref","unstructured":"Sudhakaran, S., Escalera, S., Lanz, O.: LSTA: long short-term attention for egocentric action recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 9954\u20139963 (2019)","DOI":"10.1109\/CVPR.2019.01019"},{"key":"9_CR37","doi-asserted-by":"crossref","unstructured":"Sun, D., Yang, X., Liu, M.Y., Kautz, J.: PWC-NET: CNNs for optical flow using pyramid, warping, and cost volume. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8934\u20138943 (2018)","DOI":"10.1109\/CVPR.2018.00931"},{"key":"9_CR38","doi-asserted-by":"crossref","unstructured":"Sun, J., Fu, Y., Li, S., He, J., Xu, C., Tan, L.: Sequential human activity recognition based on deep convolutional network and extreme learning machine using wearable sensors. J. Sensors 2018 (2018)","DOI":"10.1155\/2018\/8580959"},{"key":"9_CR39","doi-asserted-by":"crossref","unstructured":"Sun, S., Kuang, Z., Sheng, L., Ouyang, W., Zhang, W.: Optical flow guided feature: a fast and robust motion representation for video action recognition. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00151"},{"key":"9_CR40","unstructured":"X-IO Technologies Limited: X-IO technologies limited. UK company (2019). http:\/\/x-io.co.uk\/"},{"key":"9_CR41","unstructured":"De la Torre, F., et al.: Guide to the Carnegie Mellon university multimodal activity (CMU-MMAC) database. Robotics Institute, p. 135 (2008)"},{"issue":"1","key":"9_CR42","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1007\/s13735-014-0069-5","volume":"4","author":"J Uijlings","year":"2015","unstructured":"Uijlings, J., Duta, I.C., Sangineto, E., Sebe, N.: Video classification with densely extracted HOG\/HOF\/MBH features: an evaluation of the accuracy\/computational efficiency trade-off. Int. J. Multimed. Inf. Retr. 4(1), 33\u201344 (2015)","journal-title":"Int. J. Multimed. Inf. Retr."},{"key":"9_CR43","doi-asserted-by":"crossref","unstructured":"Uijlings, J.R., Duta, I.C., Rostamzadeh, N., Sebe, N.: Realtime video classification using dense HOF\/HOG. In: Proceedings of International Conference on Multimedia Retrieval, p. 145. ACM (2014)","DOI":"10.1145\/2578726.2578744"},{"key":"9_CR44","doi-asserted-by":"crossref","unstructured":"Wang, H., Kl\u00e4ser, A., Schmid, C., Cheng-Lin, L.: Action recognition by dense trajectories. In: CVPR 2011-IEEE Conference on Computer Vision and Pattern Recognition, pp. 3169\u20133176. IEEE (2011)","DOI":"10.1109\/CVPR.2011.5995407"},{"key":"9_CR45","unstructured":"Wang, X., Wu, Y., Zhu, L., Yang, Y.: Baidu-UTS submission to the EPIC-kitchens action recognition challenge 2019. arXiv preprint arXiv:1906.09383 (2019)"},{"key":"9_CR46","doi-asserted-by":"crossref","unstructured":"Wannenwetsch, A.S., Keuper, M., Roth, S.: ProbFlow: joint optical flow and uncertainty estimation. In: 2017 IEEE International Conference on Computer Vision (ICCV), pp. 1182\u20131191. IEEE (2017)","DOI":"10.1109\/ICCV.2017.133"},{"key":"9_CR47","doi-asserted-by":"crossref","unstructured":"Wrzalik, M., Krechel, D.: Human action recognition using optical flow and convolutional neural networks. In: 2017 16th IEEE International Conference on Machine Learning and Applications (ICMLA), pp. 801\u2013805. IEEE (2017)","DOI":"10.1109\/ICMLA.2017.00-59"},{"key":"9_CR48","doi-asserted-by":"publisher","first-page":"9893","DOI":"10.1109\/ACCESS.2018.2890675","volume":"7","author":"C Xu","year":"2019","unstructured":"Xu, C., Chai, D., He, J., Zhang, X., Duan, S.: InnoHAR: a deep neural network for complex human activity recognition. IEEE Access 7, 9893\u20139902 (2019)","journal-title":"IEEE Access"},{"issue":"9","key":"9_CR49","doi-asserted-by":"publisher","first-page":"2778","DOI":"10.3390\/s18092778","volume":"18","author":"K Yordanova","year":"2018","unstructured":"Yordanova, K., Kr\u00fcger, F.: Creating and exploring semantic annotation for behaviour analysis. Sensors 18(9), 2778 (2018)","journal-title":"Sensors"}],"container-title":["Lecture Notes in Computer Science","Ambient Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-34255-5_9","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,1,27]],"date-time":"2021-01-27T10:45:48Z","timestamp":1611744348000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-34255-5_9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019]]},"ISBN":["9783030342548","9783030342555"],"references-count":49,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-34255-5_9","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019]]},"assertion":[{"value":"4 November 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AmI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Ambient Intelligence","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Rome","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2019","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13 November 2019","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15 November 2019","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ami2019","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/ami2019.diag.uniroma1.it\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}