{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T05:23:35Z","timestamp":1755926615973,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":44,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,10,26]],"date-time":"2021-10-26T00:00:00Z","timestamp":1635206400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,10,26]]},"DOI":"10.1145\/3459637.3482143","type":"proceedings-article","created":{"date-parts":[[2021,10,30]],"date-time":"2021-10-30T18:34:11Z","timestamp":1635618851000},"page":"3597-3602","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["MixBERT for Image-Ad Relevance Scoring in Advertising"],"prefix":"10.1145","author":[{"given":"Tan","family":"Yu","sequence":"first","affiliation":[{"name":"Baidu Research, Bellevue, WA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaokang","family":"Li","sequence":"additional","affiliation":[{"name":"Baidu Inc., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jianwen","family":"Xie","sequence":"additional","affiliation":[{"name":"Baidu Research, Bellevue, WA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ruiyang","family":"Yin","sequence":"additional","affiliation":[{"name":"Baidu Research, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qing","family":"Xu","sequence":"additional","affiliation":[{"name":"Baidu Inc., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ping","family":"Li","sequence":"additional","affiliation":[{"name":"Baidu Research, Bellevue, WA, USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2021,10,30]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58577-8_7"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.707"},{"volume-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (NAACL-HLT)","year":"2019","author":"Devlin Jacob","key":"e_1_3_2_1_3_1"},{"volume-title":"Proceedings of the British Machine Vision Conference (BMVC)","year":"2018","author":"Faghri Fartash","key":"e_1_3_2_1_4_1"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330651"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3340531.3412162"},{"volume-title":"Proceedings of the 2021 Conference of the North American","year":"2021","author":"Fei Hongliang","key":"e_1_3_2_1_7_1"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/3404835.3463116"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.5555\/2999792.2999849"},{"key":"e_1_3_2_1_10_1","unstructured":"Zhe Gan Yen-Chun Chen Linjie Li Chen Zhu Yu Cheng and Jingjing Liu. 2020. Large-Scale Adversarial Training for Vision-and-Language Representation Learning. In Advances in Neural Information Processing Systems (NeurIPS). virtual.  Zhe Gan Yen-Chun Chen Linjie Li Chen Zhu Yu Cheng and Jingjing Liu. 2020. Large-Scale Adversarial Training for Vision-and-Language Representation Learning. In Advances in Neural Information Processing Systems (NeurIPS). virtual."},{"volume-title":"Retrieve Fast","year":"1920","author":"Geigle Gregor","key":"e_1_3_2_1_11_1"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"volume-title":"Distilling the knowledge in a neural network. arXiv preprint arXiv:1503.02531","year":"2015","author":"Hinton Geoffrey","key":"e_1_3_2_1_13_1"},{"volume-title":"Proceedings of the 44th International ACM SIGIR Conference on Research and Development in Information Retrieval (SIGIR). Online.","year":"2021","author":"Hong Weixiang","key":"e_1_3_2_1_14_1"},{"volume-title":"TinyBERT: Distilling BERT for natural language understanding. arXiv preprint arXiv:1909.10351","year":"2019","author":"Jiao Xiaoqi","key":"e_1_3_2_1_15_1"},{"volume-title":"International Conference on Machine Learning (ICML).","year":"2021","author":"Kim Wonjae","key":"e_1_3_2_1_16_1"},{"volume-title":"Stacked Cross Attention for Image-Text Matching. In Computer Vision - ECCV 2018 Proceedings of the 15th European Conference on Computer Vision (ECCV), Part IV","year":"2018","author":"Lee Kuang-Huei","key":"e_1_3_2_1_17_1"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6795"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58577-8_8"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/2911451.2911493"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.5555\/3454287.3454289"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01045"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00970"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"crossref","unstructured":"Mayu Otani Yuta Nakashima Esa Rahtu Janne Heikkil\u00e4 and Naokazu Yokoya. 2016. Learning joint representations of videos and sentences with web image search. In ECCV.  Mayu Otani Yuta Nakashima Esa Rahtu Janne Heikkil\u00e4 and Naokazu Yokoya. 2016. Learning joint representations of videos and sentences with web image search. In ECCV.","DOI":"10.1007\/978-3-319-46604-0_46"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.5555\/2969239.2969250"},{"volume-title":"Proceedings of the 8th International Conference on Learning Representations (ICLR). Addis Ababa, Ethiopia.","year":"2020","author":"Su Weijie","key":"e_1_3_2_1_26_1"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00756"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.77"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1514"},{"key":"e_1_3_2_1_30_1","unstructured":"Mingxing Tan and Quoc Le. 2019. EfficientNet: Rethinking Model Scaling for Convolutional Neural Networks. In ICML.  Mingxing Tan and Quoc Le. 2019. EfficientNet: Rethinking Model Scaling for Convolutional Neural Networks. In ICML."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.5555\/3295222.3295349"},{"volume-title":"MiniVLM: A Smaller and Faster Vision-Language Model. arXiv preprint arXiv:2012.06946","year":"2020","author":"Wang Jianfeng","key":"e_1_3_2_1_32_1"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.14778\/2732296.2732301"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/3448016.3457236"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i4.16431"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDE51399.2021.00225"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1145\/3459637.3482233"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403297"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/3404835.3462924"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/3459637.3481937"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"crossref","unstructured":"Bowen Zhang Hexiang Hu Vihan Jain Eugene Ie and Fei Sha. 2020. Learning to Represent Image and Text with Denotation Graph. EMNLP.  Bowen Zhang Hexiang Hu Vihan Jain Eugene Ie and Fei Sha. 2020. Learning to Represent Image and Text with Denotation Graph. EMNLP.","DOI":"10.18653\/v1\/2020.emnlp-main.60"},{"volume-title":"Proceedings of the 3rd Conference on Machine Learning and Systems (MLSys)","year":"2020","author":"Zhao Weijie","key":"e_1_3_2_1_42_1"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3357384.3358045"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1145\/2600428.2609610"}],"event":{"name":"CIKM '21: The 30th ACM International Conference on Information and Knowledge Management","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Virtual Event Queensland Australia","acronym":"CIKM '21"},"container-title":["Proceedings of the 30th ACM International Conference on Information &amp; Knowledge Management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3459637.3482143","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3459637.3482143","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T19:30:13Z","timestamp":1750188613000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3459637.3482143"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,10,26]]},"references-count":44,"alternative-id":["10.1145\/3459637.3482143","10.1145\/3459637"],"URL":"https:\/\/doi.org\/10.1145\/3459637.3482143","relation":{},"subject":[],"published":{"date-parts":[[2021,10,26]]},"assertion":[{"value":"2021-10-30","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}