{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T21:05:32Z","timestamp":1776891932705,"version":"3.51.2"},"reference-count":27,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100011785","name":"Guangxi Science and Technology Department","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100011785","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100020884","name":"CONICYT","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100020884","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002848","name":"Comisi\u00f3n Nacional de Investigaci\u00f3n Cient\u00edfica y Tecnol\u00f3gica","doi-asserted-by":"publisher","award":["1181809"],"award-info":[{"award-number":["1181809"]}],"id":[{"id":"10.13039\/501100002848","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002848","name":"Comisi\u00f3n Nacional de Investigaci\u00f3n Cient\u00edfica y Tecnol\u00f3gica","doi-asserted-by":"publisher","award":["ID16I10466"],"award-info":[{"award-number":["ID16I10466"]}],"id":[{"id":"10.13039\/501100002848","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100002850","name":"CONICYT FONDECYT","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100002850","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Neurocomputing"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1016\/j.neucom.2026.133279","type":"journal-article","created":{"date-parts":[[2026,3,12]],"date-time":"2026-03-12T07:52:28Z","timestamp":1773301948000},"page":"133279","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["Rethinking Adam for time series forecasting: A simple heuristic to improve optimization under distribution shifts"],"prefix":"10.1016","volume":"682","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-0597-6576","authenticated-orcid":false,"given":"Yuze","family":"Dong","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4720-5946","authenticated-orcid":false,"given":"Jinsong","family":"Wu","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/j.neucom.2026.133279_bib0005","doi-asserted-by":"crossref","first-page":"72284","DOI":"10.52202\/075280-3164","article-title":"Resetting the optimizer in deep rl: an empirical study","volume":"36","author":"Asadi","year":"2023","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.neucom.2026.133279_bib0010","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3533382","article-title":"Deep learning for time series forecasting: tutorial and literature survey","volume":"55","author":"Benidis","year":"2022","journal-title":"ACM Comput. Surv."},{"key":"10.1016\/j.neucom.2026.133279_bib0015","author":"Cheng"},{"key":"10.1016\/j.neucom.2026.133279_bib0020","author":"D\u00e9fossez"},{"key":"10.1016\/j.neucom.2026.133279_bib0025","doi-asserted-by":"crossref","first-page":"134567","DOI":"10.52202\/079017-4276","article-title":"Adam on local time: addressing nonstationarity in rl with relative adam timesteps","volume":"37","author":"Ellis","year":"2024","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.neucom.2026.133279_bib0030","author":"Fan"},{"key":"10.1016\/j.neucom.2026.133279_bib0035","author":"Hounie"},{"key":"10.1016\/j.neucom.2026.133279_bib0040","author":"Kingma"},{"key":"10.1016\/j.neucom.2026.133279_bib0045","first-page":"1","article-title":"Deep learning for time series forecasting: a survey","author":"Kong","year":"2025","journal-title":"Int. J. Mach. Learn. Cybern."},{"key":"10.1016\/j.neucom.2026.133279_bib0050","first-page":"52166","article-title":"Convergence of adam under relaxed assumptions","volume":"36","author":"Li","year":"2023","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.neucom.2026.133279_bib0055","doi-asserted-by":"crossref","DOI":"10.1098\/rsta.2020.0209","article-title":"Time-series forecasting with deep learning: a survey","volume":"379","author":"Lim","year":"2021","journal-title":"Philos. Trans. R. Soc. A"},{"key":"10.1016\/j.neucom.2026.133279_bib0060","author":"Lin"},{"key":"10.1016\/j.neucom.2026.133279_bib0065","author":"Liu"},{"key":"10.1016\/j.neucom.2026.133279_bib0070","author":"Loshchilov"},{"key":"10.1016\/j.neucom.2026.133279_bib0075","author":"Miller"},{"key":"10.1016\/j.neucom.2026.133279_bib0080","author":"Nie"},{"key":"10.1016\/j.neucom.2026.133279_bib0085","article-title":"Exploring progress in multivariate time series forecasting: comprehensive benchmarking and heterogeneity analysis","volume":"37","author":"Shao","year":"2024","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"10.1016\/j.neucom.2026.133279_bib0090","series-title":"The Eleventh International Conference on Learning Representations","article-title":"Micn: Multi-scale local and global context modeling for long-term series forecasting","author":"Wang","year":"2023"},{"key":"10.1016\/j.neucom.2026.133279_bib0095","author":"Wang"},{"key":"10.1016\/j.neucom.2026.133279_bib0100","author":"Wu"},{"key":"10.1016\/j.neucom.2026.133279_bib0105","first-page":"1","article-title":"Adam-family methods for nonsmooth optimization with convergence guarantees","volume":"25","author":"Xiao","year":"2024","journal-title":"J. Mach. Learn. Res."},{"key":"10.1016\/j.neucom.2026.133279_bib0110","author":"Ye"},{"key":"10.1016\/j.neucom.2026.133279_bib0115","doi-asserted-by":"crossref","DOI":"10.1109\/TKDE.2025.3569649","article-title":"Ginar+: a robust end-to-end framework for multivariate time series forecasting with missing values","volume":"37","author":"Yu","year":"2025","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"10.1016\/j.neucom.2026.133279_bib0120","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2024.102607","article-title":"Mgsfformer: a multi-granularity spatiotemporal fusion transformer for air quality prediction","volume":"113","author":"Yu","year":"2025","journal-title":"Inf. Fusion."},{"key":"10.1016\/j.neucom.2026.133279_bib0125","article-title":"Adaptive methods for nonconvex optimization","volume":"31","author":"Zaheer","year":"2018","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.neucom.2026.133279_bib0130","article-title":"Adaptive online learning in dynamic environments","volume":"31","author":"Zhang","year":"2018","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"10.1016\/j.neucom.2026.133279_bib0135","article-title":"Lookahead optimizer: k steps forward, 1 step back","volume":"32","author":"Zhang","year":"2019","journal-title":"Adv. Neural Inf. Process. Syst."}],"container-title":["Neurocomputing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0925231226006764?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0925231226006764?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T20:32:37Z","timestamp":1776889957000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0925231226006764"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6]]},"references-count":27,"alternative-id":["S0925231226006764"],"URL":"https:\/\/doi.org\/10.1016\/j.neucom.2026.133279","relation":{},"ISSN":["0925-2312"],"issn-type":[{"value":"0925-2312","type":"print"}],"subject":[],"published":{"date-parts":[[2026,6]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Rethinking Adam for time series forecasting: A simple heuristic to improve optimization under distribution shifts","name":"articletitle","label":"Article Title"},{"value":"Neurocomputing","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.neucom.2026.133279","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier B.V. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"133279"}}