{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T02:20:56Z","timestamp":1730254856524,"version":"3.28.0"},"reference-count":44,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,1,10]],"date-time":"2021-01-10T00:00:00Z","timestamp":1610236800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,1,10]],"date-time":"2021-01-10T00:00:00Z","timestamp":1610236800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,1,10]],"date-time":"2021-01-10T00:00:00Z","timestamp":1610236800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,1,10]]},"DOI":"10.1109\/icpr48806.2021.9412197","type":"proceedings-article","created":{"date-parts":[[2021,5,6]],"date-time":"2021-05-06T02:15:54Z","timestamp":1620267354000},"page":"4680-4687","source":"Crossref","is-referenced-by-count":1,"title":["Anticipating Activity from Multimodal Signals"],"prefix":"10.1109","author":[{"given":"Tiziana","family":"Rotondo","sequence":"first","affiliation":[]},{"given":"Giovanni Maria","family":"Farinella","sequence":"additional","affiliation":[]},{"given":"Davide","family":"Giacalone","sequence":"additional","affiliation":[]},{"given":"Sebastiano Mauro","family":"Strano","sequence":"additional","affiliation":[]},{"given":"Valeria","family":"Tomaselli","sequence":"additional","affiliation":[]},{"given":"Sebastiano","family":"Battiato","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123448"},{"key":"ref38","article-title":"Voice recognition algorithms using mel frequency cepstral coefficient (mfcc) and dynamic time warping (dtw) techniques","author":"muda","year":"2010","journal-title":"Journal of Computing"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/EMBC.2015.7318411"},{"key":"ref32","first-page":"1","article-title":"Activity recognition from user-annotated acceleration data","author":"bao","year":"2004","journal-title":"Pervasive Computing"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ROMAN.2012.6343802"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2014.6942983"},{"key":"ref37","article-title":"An efficient mfcc extraction method in speech recognition","author":"han","year":"0","journal-title":"IEEE International Symposium on Circuits and Systems"},{"key":"ref36","article-title":"Deep metric learning using triplet network","author":"hoffer","year":"0","journal-title":"Eighth International Conference on Learning Representations (ICLR) (Workshop)"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TMC.2018.2841905"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1088\/0967-3334\/35\/11\/2191"},{"key":"ref10","first-page":"689","article-title":"A hierarchical representation for future action prediction","author":"lan","year":"0","journal-title":"European Conference on Computer Vision ECCV"},{"key":"ref40","article-title":"Spectral basis functions from discriminant analysis","author":"hermansky","year":"0","journal-title":"International Conference on Spoken Language Processing"},{"key":"ref11","first-page":"453","author":"koppula","year":"2016","journal-title":"Anticipatory Planning for Human-Robot Teams"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2013.6696368"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2018.2861569"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2430335"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2017.10.004"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.319"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.5220\/0007379001540161"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472171"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.15"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.5244\/C.31.84"},{"key":"ref4","volume":"abs 1706 932","author":"aytar","year":"2017","journal-title":"See hear and read Deep aligned representations"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00635"},{"key":"ref3","first-page":"2949","article-title":"Multimodal learning with deep boltzmann machines","volume":"15","author":"srivastava","year":"2014","journal-title":"Journal of Machine Learning Research"},{"key":"ref6","first-page":"iii-1247","article-title":"Deep canonical correlation analysis","volume":"28","author":"andrew","year":"0","journal-title":"30th International Conference on International Conference on Machine Learning"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-37558-4_25"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1093\/biomet\/28.3-4.321"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/2733373.2806311"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1142\/S012906570000034X"},{"key":"ref2","first-page":"689","article-title":"Mul-timodal deep learning","author":"ngiam","year":"0","journal-title":"28th International Conference on Machine Learning"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"136","DOI":"10.1007\/978-3-319-54190-7_9","article-title":"Anticipating accidents in dashcam videos","author":"chan","year":"2017","journal-title":"Computer Vision ACCV 2016"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1115"},{"key":"ref20","article-title":"Detailed human data acquisition of kitchen activities: the CMU-Multimodal Activity Database (CMU-MMAC)","author":"de la torre","year":"0","journal-title":"CHI 2009 Workshop Developing Shared Home Behavior Datasets to Advance HCI and Ubiquitous Computing Research"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/INSS.2010.5573462"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.721"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/ICBNMT.2009.5348520"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/2733373.2806336"},{"key":"ref41","first-page":"291","author":"gonzalez","year":"2013","journal-title":"Better Than MFCC Audio Classification Features"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2015.7350781"},{"key":"ref44","first-page":"131","author":"hershey","year":"2017","journal-title":"Cnn architectures for large-scale audio classification"},{"key":"ref26","article-title":"Scaling egocentric vision: The epic-kitchens dataset","author":"damen","year":"0","journal-title":"European Conference on Computer Vision (ECCV)"},{"key":"ref43","doi-asserted-by":"crossref","DOI":"10.1023\/A:1026531017760","article-title":"The sound of pixels","author":"zhao","year":"0","journal-title":"the European Conference on Computer Vision (ECCV)"},{"key":"ref25","volume":"abs 1504 8023","author":"vondrick","year":"2015","journal-title":"Anticipating the future by watching unlabeled video"}],"event":{"name":"2020 25th International Conference on Pattern Recognition (ICPR)","start":{"date-parts":[[2021,1,10]]},"location":"Milan, Italy","end":{"date-parts":[[2021,1,15]]}},"container-title":["2020 25th International Conference on Pattern Recognition (ICPR)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9411940\/9411911\/09412197.pdf?arnumber=9412197","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T15:40:50Z","timestamp":1652197250000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9412197\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,10]]},"references-count":44,"URL":"https:\/\/doi.org\/10.1109\/icpr48806.2021.9412197","relation":{},"subject":[],"published":{"date-parts":[[2021,1,10]]}}}