{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T05:15:41Z","timestamp":1729660541753,"version":"3.28.0"},"reference-count":27,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,5]]},"DOI":"10.1109\/icassp.2014.6854473","type":"proceedings-article","created":{"date-parts":[[2014,7,29]],"date-time":"2014-07-29T19:23:23Z","timestamp":1406661803000},"page":"4598-4602","source":"Crossref","is-referenced-by-count":2,"title":["Late fusion and calibration for multimedia event detection using few examples"],"prefix":"10.1109","author":[{"given":"Julien","family":"van Hout","sequence":"first","affiliation":[]},{"given":"Eric","family":"Yeh","sequence":"additional","affiliation":[]},{"given":"Dennis C.","family":"Koelma","sequence":"additional","affiliation":[]},{"given":"Cees G.M.","family":"Snoek","sequence":"additional","affiliation":[]},{"given":"Chen","family":"Sun","sequence":"additional","affiliation":[]},{"given":"Ramakant","family":"Nevatia","sequence":"additional","affiliation":[]},{"given":"Julie","family":"Wong","sequence":"additional","affiliation":[]},{"given":"Gregory K.","family":"Myers","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"19","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2013.6474994"},{"key":"17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995407"},{"journal-title":"MoSIFT Recognizing human actions in surveillance videos","year":"2009","author":"chen","key":"18"},{"key":"15","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-013-0636-x"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.1145\/2461466.2461482"},{"key":"13","article-title":"The 2013 sesame multimedia event detection and recounting system","author":"myers","year":"2013","journal-title":"Proceedings of TRECVID"},{"key":"14","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2009.154"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6639277"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1016\/j.csl.2005.08.001"},{"key":"21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.453"},{"journal-title":"Ucf101 A Dataset of 101 Human Actions Classes from Videos in the Wild","year":"2012","author":"soomro","key":"20"},{"key":"22","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638340"},{"key":"23","doi-asserted-by":"crossref","first-page":"147","DOI":"10.1007\/s10032-004-0133-4","article-title":"Rectification and recognition of text in 3-d scenes","volume":"7","author":"myers","year":"2005","journal-title":"International Journal of Document Analysis and Recognition (IJDAR)"},{"key":"24","first-page":"627","article-title":"Trust region newton method for logistic regression","volume":"9","author":"lin","year":"2008","journal-title":"The Journal of Machine Learning Research"},{"key":"25","first-page":"2825","article-title":"Scikit-learn: Machine learning in Python","volume":"12","author":"pedregosa","year":"2011","journal-title":"Journal of Machine Learning Research"},{"key":"26","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2005.01.012"},{"journal-title":"Trecvid Multimedia Event Detection Evaluation Plan","year":"2013","key":"27"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1007\/s00138-013-0527-8"},{"key":"2","doi-asserted-by":"crossref","first-page":"173","DOI":"10.1007\/978-3-642-27355-1_18","article-title":"Double fusion for multimedia event detection","author":"lan","year":"2012","journal-title":"Advances in Multimedia Modeling"},{"key":"10","article-title":"A unified approach for audio characterization and its application to speaker recognition","author":"ferrer","year":"2012","journal-title":"Odyssey 2012 The Speaker and Language Recognition Workshop"},{"key":"1","doi-asserted-by":"publisher","DOI":"10.1145\/1101149.1101236"},{"key":"7","article-title":"Ibm research and columbia university trecvid-2012 multimedia event detection (med), multimedia event recounting (mer), and semantic indexing (sin) systems","author":"cao","year":"2012","journal-title":"Proc TRECVID 2012 Workshop"},{"journal-title":"Axes at Trecvid 2012 Kis Ins and Med","year":"2012","author":"oneata","key":"6"},{"journal-title":"TRECVID2011","year":"2011","author":"bao","key":"5"},{"key":"4","article-title":"Trecvid genie","author":"vahdat","year":"2012","journal-title":"Proceedings of TRECVID 2012 NIST"},{"key":"9","doi-asserted-by":"crossref","first-page":"395","DOI":"10.1007\/978-3-642-33885-4_40","article-title":"Explicit performance metric optimization for fusion-based video retrieval","author":"kim","year":"2012","journal-title":"Computer Vision-ECCV 2012 Workshops and Demonstrations"},{"key":"8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6247814"}],"event":{"name":"ICASSP 2014 - 2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2014,5,4]]},"location":"Florence, Italy","end":{"date-parts":[[2014,5,9]]}},"container-title":["2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6844297\/6853544\/06854473.pdf?arnumber=6854473","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,22]],"date-time":"2017-06-22T17:31:35Z","timestamp":1498152695000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6854473\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,5]]},"references-count":27,"URL":"https:\/\/doi.org\/10.1109\/icassp.2014.6854473","relation":{},"subject":[],"published":{"date-parts":[[2014,5]]}}}