{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T05:47:03Z","timestamp":1777873623998,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":30,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,8,3]]},"DOI":"10.1145\/3711896.3737178","type":"proceedings-article","created":{"date-parts":[[2025,8,3]],"date-time":"2025-08-03T21:07:39Z","timestamp":1754255259000},"page":"2186-2197","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Utilizing Strategic Pre-training to Reduce Overfitting: Baguan - A Pre-trained Weather Forecasting Model"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-7023-0900","authenticated-orcid":false,"given":"Peisong","family":"Niu","sequence":"first","affiliation":[{"name":"DAMO Academy, Alibaba Group, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1567-5054","authenticated-orcid":false,"given":"Ziqing","family":"Ma","sequence":"additional","affiliation":[{"name":"DAMO Academy, Alibaba Group, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1789-5413","authenticated-orcid":false,"given":"Tian","family":"Zhou","sequence":"additional","affiliation":[{"name":"DAMO Academy, Alibaba Group, hang zhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-9246-9402","authenticated-orcid":false,"given":"Weiqi","family":"Chen","sequence":"additional","affiliation":[{"name":"DAMO Academy, Alibaba Group, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-9203-9086","authenticated-orcid":false,"given":"Lefei","family":"Shen","sequence":"additional","affiliation":[{"name":"Computer Science and Technology, Zhejiang University, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8797-4646","authenticated-orcid":false,"given":"Rong","family":"Jin","sequence":"additional","affiliation":[{"name":"DAMO Academy, Alibaba Group, HangZhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-5835-7259","authenticated-orcid":false,"given":"Liang","family":"Sun","sequence":"additional","affiliation":[{"name":"DAMO Academy, Alibaba Group, Hangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,8,3]]},"reference":[{"key":"e_1_3_2_2_1_1","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2024\/1203"},{"key":"e_1_3_2_2_2_1","first-page":"533","volume-title":"Nature","volume":"619","author":"Bi Kaifeng","year":"2023","unstructured":"Kaifeng Bi, Lingxi Xie, Hengheng Zhang, Xin Chen, Xiaotao Gu, and Qi Tian. 2023. Accurate medium-range global weather forecasting with 3D neural networks. Nature, Vol. 619, 7970 (2023), 533-538."},{"key":"e_1_3_2_2_3_1","volume-title":"Aurora: A Foundation Model of the Atmosphere. ArXiv","author":"Bodnar Cristian","year":"2024","unstructured":"Cristian Bodnar, Wessel P. Bruinsma, Ana Lucic, Megan Stanley, Johannes Brandstetter, Patrick Garvan, Maik Riechert, Jonathan A. Weyn, Haiyu Dong, Anna Vaughan, Jayesh K. Gupta, Kit Thambiratnam, Alex Archibald, Elizabeth Heider, Max Welling, Richard E. Turner, and Paris Perdikaris. 2024. Aurora: A Foundation Model of the Atmosphere. ArXiv, Vol. abs\/2405.13063 (2024). https:\/\/api.semanticscholar.org\/CorpusID:269983273"},{"key":"e_1_3_2_2_4_1","volume-title":"FengWu: Pushing the Skillful Global Medium-range Weather Forecast beyond 10 Days Lead. ArXiv","author":"Chen Kan","year":"2023","unstructured":"Kan Chen, Tao Han, Junchao Gong, Lei Bai, Fenghua Ling, Jingyao Luo, Xi Chen, Lei Ma, Tianning Zhang, Rui Su, Yuanzheng Ci, Bin Li, Xiaokang Yang, and Wanli Ouyang. 2023a. FengWu: Pushing the Skillful Global Medium-range Weather Forecast beyond 10 Days Lead. ArXiv, Vol. abs\/2304.02948 (2023). https:\/\/api.semanticscholar.org\/CorpusID:257985330"},{"key":"e_1_3_2_2_5_1","volume-title":"Yuan Cheng, Yinghui Xu, Yuan Qi, and Hao Li.","author":"Chen Lei","year":"2023","unstructured":"Lei Chen, Xiaohui Zhong, Feng jun Zhang, Yuan Cheng, Yinghui Xu, Yuan Qi, and Hao Li. 2023b. FuXi: a cascade machine learning forecasting system for 15-day global weather forecast. npj Climate and Atmospheric Science, Vol. 6 (2023), 1-11. https:\/\/api.semanticscholar.org\/CorpusID:259224665"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41612-023-00512-1"},{"key":"e_1_3_2_2_7_1","first-page":"15745","volume-title":"Exploring Simple Siamese Representation Learning. 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)(2020)","author":"Chen Xinlei","year":"2020","unstructured":"Xinlei Chen and Kaiming He. 2020. Exploring Simple Siamese Representation Learning. 2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)(2020), 15745-15753. https:\/\/api.semanticscholar.org\/CorpusID:227118869"},{"key":"e_1_3_2_2_8_1","volume-title":"Karina: An efficient deep learning model for global weather forecast. arXiv preprint arXiv:2403.10555(2024).","author":"Cheon Minjong","year":"2024","unstructured":"Minjong Cheon, Yo-Hwan Choi, Seon-Yu Kang, Yumi Choi, Jeong-Gil Lee, and Daehyun Kang. 2024. Karina: An efficient deep learning model for global weather forecast. arXiv preprint arXiv:2403.10555(2024)."},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511734458"},{"key":"e_1_3_2_2_10_1","unstructured":"Yizhen Guo Tian Zhou Wanyi Jiang Bo Wu Liang Sun and Rong Jin. 2024. Maximizing the Impact of Deep Learning on Subseasonal-to-Seasonal Climate Forecasting: The Essential Role of Optimization. arXiv preprint arXiv:2411.16728(2024)."},{"key":"e_1_3_2_2_11_1","first-page":"40676","article-title":"Siamese masked autoencoders","volume":"36","author":"Gupta Agrim","year":"2023","unstructured":"Agrim Gupta, Jiajun Wu, Jia Deng, and Fei-Fei Li. 2023. Siamese masked autoencoders. Advances in Neural Information Processing Systems, Vol. 36 (2023), 40676-40693.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1002\/qj.3803"},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/3592979.3593412"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1126\/science.adi2336"},{"key":"e_1_3_2_2_17_1","volume-title":"Ana Prieto Nemesio, Peter D. Dueben, Andrew Brown, Florian Pappenberger, and Florence Rabier.","author":"Lang Simon","year":"2024","unstructured":"Simon Lang, Mihai Alexe, Matthew Chantry, Jesper Dramsch, Florian Pinault, Baudouin Raoult, Mariana C. A. Clare, Christian Lessig, Michael Maier-Gerber, Linus Magnusson, Zied Ben Bouall\u00e8gue, Ana Prieto Nemesio, Peter D. Dueben, Andrew Brown, Florian Pappenberger, and Florence Rabier. 2024. AIFS - ECMWF's data-driven forecasting system. arXiv:2406.01465 [physics.ao-ph] https:\/\/arxiv.org\/abs\/2406.01465"},{"key":"e_1_3_2_2_18_1","volume-title":"W-mae: Pre-trained weather model with masked autoencoder for multi-variable weather forecasting. arXiv preprint arXiv:2304.08754(2023).","author":"Man Xin","year":"2023","unstructured":"Xin Man, Chenghong Zhang, Jin Feng, Changyu Li, and Jie Shao. 2023. W-mae: Pre-trained weather model with masked autoencoder for multi-variable weather forecasting. arXiv preprint arXiv:2304.08754(2023)."},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2309.15214"},{"key":"e_1_3_2_2_20_1","volume-title":"Chaosbench: A multi-channel, physics-based benchmark for subseasonal-to-seasonal climate prediction. arXiv preprint arXiv:2402.00712(2024).","author":"Nathaniel Juan","year":"2024","unstructured":"Juan Nathaniel, Yongquan Qu, Tung Nguyen, Sungduk Yu, Julius Busecke, Aditya Grover, and Pierre Gentine. 2024. Chaosbench: A multi-channel, physics-based benchmark for subseasonal-to-seasonal climate prediction. arXiv preprint arXiv:2402.00712(2024)."},{"key":"e_1_3_2_2_21_1","volume-title":"International Conference on Machine Learning. https:\/\/api.semanticscholar.org\/CorpusID:256231457","author":"Nguyen Tung","year":"2023","unstructured":"Tung Nguyen, Johannes Brandstetter, Ashish Kapoor, Jayesh K. Gupta, and Aditya Grover. 2023a. ClimaX: A foundation model for weather and climate. In International Conference on Machine Learning. https:\/\/api.semanticscholar.org\/CorpusID:256231457"},{"key":"e_1_3_2_2_22_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2312.03876"},{"key":"e_1_3_2_2_23_1","first-page":"4172","volume-title":"Scalable Diffusion Models with Transformers. 2023 IEEE\/CVF International Conference on Computer Vision (ICCV)(2022)","author":"William","unstructured":"William S. Peebles and Saining Xie. 2022. Scalable Diffusion Models with Transformers. 2023 IEEE\/CVF International Conference on Computer Vision (ICCV)(2022), 4172-4182. https:\/\/api.semanticscholar.org\/CorpusID:254854389"},{"key":"e_1_3_2_2_24_1","volume-title":"Courville","author":"Perez Ethan","year":"2018","unstructured":"Ethan Perez, Florian Strub, Harm de Vries, Vincent Dumoulin, and Aaron C. Courville. 2018. FiLM: Visual Reasoning with a General Conditioning Layer. In AAAI."},{"key":"e_1_3_2_2_25_1","volume-title":"Peter Dueben, Carla Bromberg, Jared Sisk, Luke Barrington, Aaron Bell, and Fei Sha.","author":"Rasp Stephan","year":"2024","unstructured":"Stephan Rasp, Stephan Hoyer, Alexander Merose, Ian Langmore, Peter Battaglia, Tyler Russel, Alvaro Sanchez-Gonzalez, Vivian Yang, Rob Carver, Shreya Agrawal, Matthew Chantry, Zied Ben Bouallegue, Peter Dueben, Carla Bromberg, Jared Sisk, Luke Barrington, Aaron Bell, and Fei Sha. 2024. WeatherBench 2: A benchmark for the next generation of data-driven global weather models. arXiv:2308.15560 [physics.ao-ph] https:\/\/arxiv.org\/abs\/2308.15560"},{"key":"e_1_3_2_2_26_1","volume-title":"Shraddha Singh, Julian Kuehnert, Kumar Ankur, Aman Gupta, Christopher E Phillips, et al.","author":"Schmude Johannes","year":"2024","unstructured":"Johannes Schmude, Sujit Roy, Will Trojak, Johannes Jakubik, Daniel Salles Civitarese, Shraddha Singh, Julian Kuehnert, Kumar Ankur, Aman Gupta, Christopher E Phillips, et al., 2024. Prithvi wxc: Foundation model for weather and climate. arXiv preprint arXiv:2409.13598(2024). https:\/\/openreview.net\/forum?id=SyBPtQfAZ"},{"key":"e_1_3_2_2_27_1","unstructured":"Jimeng Shi Azam Shirali Bowen Jin Sizhe Zhou Wei Hu Rahuul Rangaraj Shaowen Wang Jiawei Han Zhaonan Wang Upmanu Lall Yanzhao Wu Leonardo Bobadilla and Giri Narasimhan. 2025. Deep Learning and Foundation Models for Weather Prediction: A Survey. arXiv:2501.06907 [cs.LG] https:\/\/arxiv.org\/abs\/2501.06907"},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1038\/s41612-018-0013-0"},{"key":"e_1_3_2_2_29_1","volume-title":"SimMIM: A Simple Framework for Masked Image Modeling. In International Conference on Computer Vision and Pattern Recognition (CVPR).","author":"Xie Zhenda","year":"2022","unstructured":"Zhenda Xie, Zheng Zhang, Yue Cao, Yutong Lin, Jianmin Bao, Zhuliang Yao, Qi Dai, and Han Hu. 2022. SimMIM: A Simple Framework for Masked Image Modeling. In International Conference on Computer Vision and Pattern Recognition (CVPR)."},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2409.07188"}],"event":{"name":"KDD '25: The 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Toronto ON Canada","acronym":"KDD '25","sponsor":["SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.2"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3711896.3737178","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T18:06:26Z","timestamp":1777572386000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3711896.3737178"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,3]]},"references-count":30,"alternative-id":["10.1145\/3711896.3737178","10.1145\/3711896"],"URL":"https:\/\/doi.org\/10.1145\/3711896.3737178","relation":{},"subject":[],"published":{"date-parts":[[2025,8,3]]},"assertion":[{"value":"2025-08-03","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}