{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,3]],"date-time":"2025-06-03T20:47:01Z","timestamp":1748983621612,"version":"3.28.0"},"reference-count":14,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,7]]},"DOI":"10.1109\/icmew.2014.6890609","type":"proceedings-article","created":{"date-parts":[[2014,9,10]],"date-time":"2014-09-10T11:50:12Z","timestamp":1410349812000},"page":"1-6","source":"Crossref","is-referenced-by-count":3,"title":["Challenge Huawei challenge: Fusing multimodal features with deep neural networks for Mobile Video Annotation"],"prefix":"10.1109","author":[{"family":"Jian Tu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Zuxuan Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Qi Dai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Yu-Gang Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Xiangyang Xue","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"13","article-title":"ImageNet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"NIPS"},{"key":"14","article-title":"The AXES submissions at TrecVid 2013","author":"aly","year":"2013","journal-title":"NIST TRECVID workshop"},{"key":"11","article-title":"Improving the fisher kernel for large-scale image classification","author":"perronnin","year":"2010","journal-title":"ECCV"},{"key":"12","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2012.2205597"},{"key":"3","article-title":"Deep Fisher networks for large-scale image classification","author":"simonyan","year":"2013","journal-title":"NIPS"},{"key":"2","article-title":"Robust late fusion with rank minimization","author":"ye","year":"2012","journal-title":"CVPR"},{"key":"1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.441"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1145\/1282280.1282352"},{"key":"7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5539970"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2010.2052027"},{"key":"5","doi-asserted-by":"crossref","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","article-title":"Distinctive image features from scale-invariant keypoints","volume":"60","author":"david","year":"2004","journal-title":"IJCV"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1145\/2324796.2324805"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2003.1238663"},{"key":"8","article-title":"Fudan at MediaEval 2013: Violent scenes detection using motion features and part-level attributes","author":"dai","year":"2013","journal-title":"MediaEval Workshop"}],"event":{"name":"2014 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)","start":{"date-parts":[[2014,7,14]]},"location":"Chengdu, China","end":{"date-parts":[[2014,7,18]]}},"container-title":["2014 IEEE International Conference on Multimedia and Expo Workshops (ICMEW)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6882610\/6890528\/06890609.pdf?arnumber=6890609","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,22]],"date-time":"2017-06-22T16:13:20Z","timestamp":1498148000000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6890609\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,7]]},"references-count":14,"URL":"https:\/\/doi.org\/10.1109\/icmew.2014.6890609","relation":{},"subject":[],"published":{"date-parts":[[2014,7]]}}}