{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:21:18Z","timestamp":1750220478264,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":27,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,10,17]],"date-time":"2021-10-17T00:00:00Z","timestamp":1634428800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,10,17]]},"DOI":"10.1145\/3474085.3479204","type":"proceedings-article","created":{"date-parts":[[2021,10,18]],"date-time":"2021-10-18T10:23:20Z","timestamp":1634552600000},"page":"4808-4812","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["A Solution to Multi-modal Ads Video Tagging Challenge"],"prefix":"10.1145","author":[{"given":"Hao","family":"Wu","sequence":"first","affiliation":[{"name":"Alibaba Group, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiajie","family":"Wang","sequence":"additional","affiliation":[{"name":"Alibaba Group, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuanzhe","family":"Gu","sequence":"additional","affiliation":[{"name":"Alibaba Group, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Peisen","family":"Zhao","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhonglin","family":"Zu","sequence":"additional","affiliation":[{"name":"Alibaba Group, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2021,10,17]]},"reference":[{"volume-title":"Youtube-8m: A large-scale video classification benchmark. arXiv preprint arXiv:1609.08675","year":"2016","author":"Abu-El-Haija Sami","key":"e_1_3_2_2_1_1"},{"volume-title":"Asymmetric loss for multi-label classification. arXiv preprint arXiv:2009.14119","year":"2020","author":"Ben-Baruch Emanuel","key":"e_1_3_2_2_2_1"},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"publisher","DOI":"10.5555\/645805.670013"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1155\/2018\/4940593"},{"volume-title":"Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805","year":"2018","author":"Devlin Jacob","key":"e_1_3_2_2_5_1"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01232"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"volume-title":"Jort F Gemmeke, Aren Jansen, R Channing Moore, Manoj Plakal, Devin Platt, Rif A Saurous, Bryan Seybold, et almbox.","year":"2017","author":"Hershey Shawn","key":"e_1_3_2_2_8_1"},{"volume-title":"Distilling the knowledge in a neural network. arXiv preprint arXiv:1503.02531","year":"2015","author":"Hinton Geoffrey","key":"e_1_3_2_2_9_1"},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00745"},{"volume-title":"International MICCAI Brainlesion Workshop. Springer, 287--297","year":"2017","author":"Isensee Fabian","key":"e_1_3_2_2_11_1"},{"volume-title":"International MICCAI Brainlesion Workshop. Springer, 234--244","year":"2018","author":"Isensee Fabian","key":"e_1_3_2_2_12_1"},{"volume-title":"Adaptive mixtures of local experts. Neural computation","year":"1991","author":"Jacobs Robert A","key":"e_1_3_2_2_13_1"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"crossref","unstructured":"Konstantinos Kamnitsas Wenjia Bai Enzo Ferrante Steven McDonagh Matthew Sinclair Nick Pawlowski Martin Rajchl Matthew Lee Bernhard Kainz Daniel Rueckert etal 2017. Ensembles of multiple models and architectures for robust brain tumour segmentation. In International MICCAI brainlesion workshop. Springer 450--462.  Konstantinos Kamnitsas Wenjia Bai Enzo Ferrante Steven McDonagh Matthew Sinclair Nick Pawlowski Martin Rajchl Matthew Lee Bernhard Kainz Daniel Rueckert et al. 2017. Ensembles of multiple models and architectures for robust brain tumour segmentation. In International MICCAI brainlesion workshop. Springer 450--462.","DOI":"10.1007\/978-3-319-75238-9_38"},{"volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","year":"2014","author":"Kingma Diederik P","key":"e_1_3_2_2_15_1"},{"volume-title":"Proceedings of the European Conference on Computer Vision (ECCV) Workshops. 0--0.","year":"2018","author":"Lin Rongcheng","key":"e_1_3_2_2_16_1"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"volume-title":"Maksims Volkovs, Ilya Stanevich, and Guangwei Yu.","year":"2019","author":"Ma Junwei","key":"e_1_3_2_2_18_1"},{"key":"e_1_3_2_2_19_1","unstructured":"Q. Meng. 2018. LightGBM: A Highly Efficient Gradient Boosting Decision Tree. (2018).  Q. Meng. 2018. LightGBM: A Highly Efficient Gradient Boosting Decision Tree. (2018)."},{"key":"e_1_3_2_2_20_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-011-5256-5"},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00565"},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2010.164"},{"volume-title":"Modality-Pairing Learning for Brain Tumor Segmentation. arXiv preprint arXiv:2010.09277","year":"2020","author":"Wang Yixin","key":"e_1_3_2_2_23_1"},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM.2019.00179"},{"volume-title":"Cooperative Learning for Noisy Supervision. In 2021 IEEE International Conference on Multimedia and Expo (ICME). https:\/\/doi.org\/10","year":"2021","author":"Wu Hao","key":"e_1_3_2_2_25_1"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01070"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2006.12.019"}],"event":{"name":"MM '21: ACM Multimedia Conference","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Virtual Event China","acronym":"MM '21"},"container-title":["Proceedings of the 29th ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474085.3479204","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3474085.3479204","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:48:48Z","timestamp":1750193328000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474085.3479204"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,10,17]]},"references-count":27,"alternative-id":["10.1145\/3474085.3479204","10.1145\/3474085"],"URL":"https:\/\/doi.org\/10.1145\/3474085.3479204","relation":{},"subject":[],"published":{"date-parts":[[2021,10,17]]},"assertion":[{"value":"2021-10-17","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}