{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,14]],"date-time":"2026-05-14T22:47:00Z","timestamp":1778798820434,"version":"3.51.4"},"reference-count":17,"publisher":"Elsevier BV","issue":"1","license":[{"start":{"date-parts":[[2003,1,1]],"date-time":"2003-01-01T00:00:00Z","timestamp":1041379200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Neural Networks"],"published-print":{"date-parts":[[2003,1]]},"DOI":"10.1016\/s0893-6080(02)00228-9","type":"journal-article","created":{"date-parts":[[2003,2,12]],"date-time":"2003-02-12T06:53:31Z","timestamp":1045032811000},"page":"5-9","source":"Crossref","is-referenced-by-count":213,"title":["Meta-learning in Reinforcement Learning"],"prefix":"10.1016","volume":"16","author":[{"given":"Nicolas","family":"Schweighofer","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kenji","family":"Doya","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"issue":"8","key":"10.1016\/S0893-6080(02)00228-9_BIB1","doi-asserted-by":"crossref","first-page":"876","DOI":"10.1523\/JNEUROSCI.01-08-00876.1981","article-title":"Activity of norepinephrine-containing locus coeruleus neurons in behaving rats anticipates fluctuations in the sleep\u2013waking cycle","volume":"1","author":"Aston-Jones","year":"1981","journal-title":"Journal of Neuroscience"},{"key":"10.1016\/S0893-6080(02)00228-9_BIB2","doi-asserted-by":"crossref","first-page":"603","DOI":"10.1016\/S0893-6080(02)00052-7","article-title":"Opponent interactions between serotonin and dopamine","volume":"15","author":"Daw","year":"2002","journal-title":"Neural Networks"},{"issue":"3","key":"10.1016\/S0893-6080(02)00228-9_BIB3","doi-asserted-by":"crossref","first-page":"643","DOI":"10.1016\/0306-4522(93)90235-8","article-title":"Dopaminergic regulation of cortical acetylcholine release: effects of dopamine receptor agonists","volume":"54","author":"Day","year":"1993","journal-title":"Neuroscience"},{"issue":"1","key":"10.1016\/S0893-6080(02)00228-9_BIB4","doi-asserted-by":"crossref","first-page":"219","DOI":"10.1162\/089976600300015961","article-title":"Reinforcement learning in continuous time and space","volume":"12","author":"Doya","year":"2000","journal-title":"Neural Computations"},{"key":"10.1016\/S0893-6080(02)00228-9_BIB5","doi-asserted-by":"crossref","first-page":"495","DOI":"10.1016\/S0893-6080(02)00044-8","article-title":"Metalearning and neuromodulation","volume":"15","author":"Doya","year":"2002","journal-title":"Neural Networks"},{"key":"10.1016\/S0893-6080(02)00228-9_BIB6","doi-asserted-by":"crossref","first-page":"671","DOI":"10.1016\/0893-6080(90)90056-Q","article-title":"A stochastic reinforcement learning algorithm for learning real-valued functions","volume":"3","author":"Gullapalli","year":"1990","journal-title":"Neural Networks"},{"issue":"1","key":"10.1016\/S0893-6080(02)00228-9_BIB7","doi-asserted-by":"crossref","first-page":"125","DOI":"10.1046\/j.0953-816x.2001.01616.x","article-title":"D2-like dopamine receptor activation excites rat dorsal raphe 5-HT neurons in vitro","volume":"14","author":"Haj-Dahmane","year":"2001","journal-title":"European Journal of Neuroscience"},{"key":"10.1016\/S0893-6080(02)00228-9_BIB8","doi-asserted-by":"crossref","first-page":"665","DOI":"10.1016\/S0893-6080(02)00056-4","article-title":"Control of exploitation\u2013exploration meta-parameters in reinforcement learning","volume":"15","author":"Ishii","year":"2002","journal-title":"Neural Networks"},{"issue":"9","key":"10.1016\/S0893-6080(02)00228-9_BIB9","doi-asserted-by":"crossref","first-page":"346","DOI":"10.1016\/0166-2236(93)90090-9","article-title":"5-HT and motor control: a hypothesis","volume":"16","author":"Jacobs","year":"1993","journal-title":"Trends in Neuroscience"},{"key":"10.1016\/S0893-6080(02)00228-9_BIB10","unstructured":"Littman, M. L., Dean, T. L., et al (1995). On the complexity of solving Markov decision problems. Eleventh International Conference on Uncertainty in Artificial Intelligence."},{"issue":"1","key":"10.1016\/S0893-6080(02)00228-9_BIB11","doi-asserted-by":"crossref","first-page":"193","DOI":"10.1016\/0742-8413(91)90195-Y","article-title":"Monoaminergic interaction in the central nervous system: a morphological analysis in the locus coeruleus of the rat","volume":"98","author":"Maeda","year":"1991","journal-title":"Compartative Biochemistry and Physiology C"},{"issue":"1","key":"10.1016\/S0893-6080(02)00228-9_BIB12","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1152\/jn.1998.80.1.1","article-title":"Predictive reward signal of dopamine neurons","volume":"80","author":"Schultz","year":"1998","journal-title":"Journal of Neurophysiology"},{"issue":"4","key":"10.1016\/S0893-6080(02)00228-9_BIB13","doi-asserted-by":"crossref","first-page":"421","DOI":"10.1101\/lm.4.5.421","article-title":"A model of cerebellar metaplasticity","author":"Schweighofer","year":"1998","journal-title":"Learning Memory"},{"key":"10.1016\/S0893-6080(02)00228-9_BIB14","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1037\/h0036128","article-title":"An opponent process theory of motivation. I. Temporal dynamics of affect","volume":"81","author":"Solomon","year":"1974","journal-title":"Psychological Review"},{"key":"10.1016\/S0893-6080(02)00228-9_BIB15","unstructured":"Sutton, R (1992). Adapting bias by gradient descent: an incremental version of the delta-bar-delta. Tenth National Conference on Artificial Intelligence. Cambridge, MA: MIT Press."},{"key":"10.1016\/S0893-6080(02)00228-9_BIB16","first-page":"1062","article-title":"Functional MRI study of short-term and long-term prediction of reward","author":"Tanaka","year":"2002","journal-title":"Proceedings of the Eighth International Conference on Functional Mapping of the Human Brain, Sendai, Japan"},{"key":"10.1016\/S0893-6080(02)00228-9_BIB17","series-title":"The role of exploration in learning control. Handbook of intelligent control: Neural, fuzzy, and adaptive approaches","author":"Thrun","year":"1992"}],"container-title":["Neural Networks"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0893608002002289?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0893608002002289?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2020,3,12]],"date-time":"2020-03-12T03:14:42Z","timestamp":1583982882000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0893608002002289"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2003,1]]},"references-count":17,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2003,1]]}},"alternative-id":["S0893608002002289"],"URL":"https:\/\/doi.org\/10.1016\/s0893-6080(02)00228-9","relation":{},"ISSN":["0893-6080"],"issn-type":[{"value":"0893-6080","type":"print"}],"subject":[],"published":{"date-parts":[[2003,1]]}}}