{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T10:42:48Z","timestamp":1770979368512,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":1,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,8,21]],"date-time":"2021-08-21T00:00:00Z","timestamp":1629504000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,8,21]]},"DOI":"10.1145\/3463945.3468170","type":"proceedings-article","created":{"date-parts":[[2021,8,27]],"date-time":"2021-08-27T14:29:53Z","timestamp":1630074593000},"page":"3-3","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["WenLan: Efficient Large-Scale Multi-Modal Pre-Training on Real World Data"],"prefix":"10.1145","author":[{"given":"Ruihua","family":"Song","sequence":"first","affiliation":[{"name":"Renmin University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2021,8,27]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"Yuqi Huo Manli Zhang Guangzhen Liu Haoyu Lu Yizhao Gao Guoxing Yang Jingyuan Wen Heng Zhang Baogui Xu Weihao Zheng Zongzheng Xi Yueqian Yang Anwen Hu Jinming Zhao Ruichen Li Yida Zhao Liang Zhang Yuqing Song Xin Hong Wanqing Cui Dan Yang Hou Yingyan Li Junyi Li Peiyu Liu Zheng Gong Chuhao Jin Yuchong Sun Shizhe Chen Zhiwu Lu Zhicheng Dou Qin Jin Yanyan Lan Wayne Xin Zhao Ruihua Song Ji-Rong Wen. WenLan: Bridging Vision and Language by Large-Scale Multi-Modal Pre-Training. CoRR abs\/2103.06561 (2021)  Yuqi Huo Manli Zhang Guangzhen Liu Haoyu Lu Yizhao Gao Guoxing Yang Jingyuan Wen Heng Zhang Baogui Xu Weihao Zheng Zongzheng Xi Yueqian Yang Anwen Hu Jinming Zhao Ruichen Li Yida Zhao Liang Zhang Yuqing Song Xin Hong Wanqing Cui Dan Yang Hou Yingyan Li Junyi Li Peiyu Liu Zheng Gong Chuhao Jin Yuchong Sun Shizhe Chen Zhiwu Lu Zhicheng Dou Qin Jin Yanyan Lan Wayne Xin Zhao Ruihua Song Ji-Rong Wen. WenLan: Bridging Vision and Language by Large-Scale Multi-Modal Pre-Training. CoRR abs\/2103.06561 (2021)"}],"event":{"name":"ICMR '21: International Conference on Multimedia Retrieval","location":"Taipei Taiwan","acronym":"ICMR '21","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 2021 Workshop on Multi-Modal Pre-Training for Multimedia Understanding"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3463945.3468170","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3463945.3468170","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:12:15Z","timestamp":1750191135000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3463945.3468170"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,8,21]]},"references-count":1,"alternative-id":["10.1145\/3463945.3468170","10.1145\/3463945"],"URL":"https:\/\/doi.org\/10.1145\/3463945.3468170","relation":{},"subject":[],"published":{"date-parts":[[2021,8,21]]},"assertion":[{"value":"2021-08-27","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}