{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:27:07Z","timestamp":1750220827257,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":11,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,10,15]],"date-time":"2019-10-15T00:00:00Z","timestamp":1571097600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,10,15]]},"DOI":"10.1145\/3343031.3356074","type":"proceedings-article","created":{"date-parts":[[2019,10,21]],"date-time":"2019-10-21T16:32:26Z","timestamp":1571675546000},"page":"2539-2542","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["A Hierarchical Framwork with Improved Loss for Large-scale Multi-modal Video Identification"],"prefix":"10.1145","author":[{"given":"Shichuan","family":"Zhang","sequence":"first","affiliation":[{"name":"Shanghai Advanced Research Institute, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zengming","family":"Tang","sequence":"additional","affiliation":[{"name":"Shanghai Advanced Research Institute, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hao","family":"Pan","sequence":"additional","affiliation":[{"name":"Shanghai Advanced Research Institute, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xinyu","family":"Wei","sequence":"additional","affiliation":[{"name":"Shanghai Advanced Research Institute, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jun","family":"Huang","sequence":"additional","affiliation":[{"name":"Shanghai Advanced Research Institute, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2019,10,15]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2019.iQIYI AI Competition Platform. http:\/\/challenge.ai.iqiyi.com\/data-cluster  2019.iQIYI AI Competition Platform. http:\/\/challenge.ai.iqiyi.com\/data-cluster"},{"key":"e_1_3_2_1_2_1","unstructured":"Sami Abu-El-Haija Nisarg Kothari Joonseok Lee Paul Natsev George Toderici Balakrishnan Varadarajan and Sudheendra Vijayanarasimhan. 2016. YouTube-8M: A Large-Scale Video Classification Benchmark. (2016).  Sami Abu-El-Haija Nisarg Kothari Joonseok Lee Paul Natsev George Toderici Balakrishnan Varadarajan and Sudheendra Vijayanarasimhan. 2016. YouTube-8M: A Large-Scale Video Classification Benchmark. (2016)."},{"volume-title":"Activity Net: A Large-Scale Video Benchmark for Human Activity Understanding. In Computer Vision Pattern Recognition.","year":"2015","author":"Caba Fabian","key":"e_1_3_2_1_3_1"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"crossref","unstructured":"Jiankang Deng Guo Jia and Stefanos Zafeiriou. 2018. ArcFace: Additive Angular Margin Loss for Deep Face Recognition. (2018).  Jiankang Deng Guo Jia and Stefanos Zafeiriou. 2018. ArcFace: Additive Angular Margin Loss for Deep Face Recognition. (2018).","DOI":"10.1109\/CVPR.2019.00482"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Jianfeng Dong Xirong Li Chaoxi Xu Gang Yang and Xun Wang. 2018. Feature Re-Learning with Data Augmentation for Content-based Video Recommendation. In ACM Multimedia. https:\/\/doi.org\/10.1145\/3240508.3266441  Jianfeng Dong Xirong Li Chaoxi Xu Gang Yang and Xun Wang. 2018. Feature Re-Learning with Data Augmentation for Content-based Video Recommendation. In ACM Multimedia. https:\/\/doi.org\/10.1145\/3240508.3266441","DOI":"10.1145\/3240508.3266441"},{"volume-title":"kNN based on probability density for fault detection in multimodal processes. Journal of Chemometrics1","year":"2018","author":"Guo Jinyu","key":"e_1_3_2_1_6_1"},{"key":"e_1_3_2_1_7_1","unstructured":"Kaiming He Xiangyu Zhang Shaoqing Ren and Sun Jian. 2015. Delving Deepinto Rectifiers: Surpassing Human-Level Performance on Image Net Classification.(2015).  Kaiming He Xiangyu Zhang Shaoqing Ren and Sun Jian. 2015. Delving Deepinto Rectifiers: Surpassing Human-Level Performance on Image Net Classification.(2015)."},{"volume-title":"Attention-Based Multimodal Fusion for Video Description. In IEEE International Conference on Computer Vision.","year":"2017","author":"Hori Chiori","key":"e_1_3_2_1_8_1"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1994.6.2.181"},{"key":"e_1_3_2_1_10_1","unstructured":"Will Kay Joao Carreira Karen Simonyan Brian Zhang and Andrew Zisserman. 2017. The Kinetics Human Action Video Dataset. (2017).  Will Kay Joao Carreira Karen Simonyan Brian Zhang and Andrew Zisserman. 2017. The Kinetics Human Action Video Dataset. (2017)."},{"key":"e_1_3_2_1_11_1","unstructured":"Yuanliu Liu Peipei Shi Bo Peng He Yan Yong Zhou Bing Han Yi Zheng Chao Lin Jianbin Jiang Yin Fan etal2018. iQIYI-VID: A Large Dataset for Multi-modal Person Identification. arXiv preprint arXiv:1811.07548(2018).  Yuanliu Liu Peipei Shi Bo Peng He Yan Yong Zhou Bing Han Yi Zheng Chao Lin Jianbin Jiang Yin Fan et al.2018. iQIYI-VID: A Large Dataset for Multi-modal Person Identification. arXiv preprint arXiv:1811.07548(2018)."}],"event":{"name":"MM '19: The 27th ACM International Conference on Multimedia","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Nice France","acronym":"MM '19"},"container-title":["Proceedings of the 27th ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3343031.3356074","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3343031.3356074","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T23:13:23Z","timestamp":1750202003000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3343031.3356074"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,10,15]]},"references-count":11,"alternative-id":["10.1145\/3343031.3356074","10.1145\/3343031"],"URL":"https:\/\/doi.org\/10.1145\/3343031.3356074","relation":{},"subject":[],"published":{"date-parts":[[2019,10,15]]},"assertion":[{"value":"2019-10-15","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}