{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T02:03:13Z","timestamp":1771639393088,"version":"3.50.1"},"publisher-location":"Berlin, Heidelberg","reference-count":188,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783642276446","type":"print"},{"value":"9783642276453","type":"electronic"}],"license":[{"start":{"date-parts":[[2012,1,1]],"date-time":"2012-01-01T00:00:00Z","timestamp":1325376000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2012,1,1]],"date-time":"2012-01-01T00:00:00Z","timestamp":1325376000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-27645-3_16","type":"book-chapter","created":{"date-parts":[[2012,3,5]],"date-time":"2012-03-05T22:18:12Z","timestamp":1330985892000},"page":"507-537","source":"Crossref","is-referenced-by-count":5,"title":["Psychological and Neuroscientific Connections with Reinforcement Learning"],"prefix":"10.1007","author":[{"given":"Ashvin","family":"Shah","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"16_CR1","doi-asserted-by":"crossref","first-page":"2777","DOI":"10.1523\/JNEUROSCI.18-07-02777.1998","volume":"18","author":"J.W. Aldridge","year":"1998","unstructured":"Aldridge, J.W., Berridge, K.C.: Coding of serial order by neostriatal neurons: a \u201cnatural action\u201d approach to movement sequence. The Journal of Neuroscience\u00a018, 2777\u20132787 (1998)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR2","doi-asserted-by":"crossref","first-page":"357","DOI":"10.1146\/annurev.ne.09.030186.002041","volume":"9","author":"G.E. Alexander","year":"1986","unstructured":"Alexander, G.E., DeLong, M.R., Strick, P.L.: Parallel organization of functionally segregated circuits linking basal ganglia and cortex. Annual Review of Neuroscience\u00a09, 357\u2013381 (1986)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR3","doi-asserted-by":"crossref","first-page":"632","DOI":"10.1037\/0033-295X.114.3.632","volume":"114","author":"F.G. Ashby","year":"2007","unstructured":"Ashby, F.G., Ennis, J., Spiering, B.: A neurobiological theory of automaticity in perceptual categorization. Psychological Review\u00a0114, 632\u2013656 (2007)","journal-title":"Psychological Review"},{"key":"16_CR4","doi-asserted-by":"crossref","first-page":"208","DOI":"10.1016\/j.tics.2010.02.001","volume":"14","author":"F.G. Ashby","year":"2010","unstructured":"Ashby, F.G., Turner, B.O., Horvitz, J.C.: Cortical and basal ganglia contributions to habit learning and automaticity. Trends in Cognitive Sciences\u00a014, 208\u2013215 (2010)","journal-title":"Trends in Cognitive Sciences"},{"key":"16_CR5","doi-asserted-by":"crossref","first-page":"126","DOI":"10.1038\/nn1817","volume":"10","author":"H.E. Atallah","year":"2007","unstructured":"Atallah, H.E., Lopez-Paniagua, D., Rudy, J.W., O\u2019Reilly, R.C.: Separate neural substrates for skill learning and performance in ventral and dorsal striatum. Nature Neuroscience\u00a010, 126\u2013131 (2007)","journal-title":"Nature Neuroscience"},{"key":"16_CR6","doi-asserted-by":"crossref","first-page":"48","DOI":"10.1038\/npp.2009.131","volume":"35","author":"B.W. Balleine","year":"2010","unstructured":"Balleine, B.W., O\u2019Dohrety, J.P.: Human and rodent homologies in action control: Corticostriatal determinants of goal-directed and habitual action. Neuropsychopharmacology\u00a035, 48\u201369 (2010)","journal-title":"Neuropsychopharmacology"},{"key":"16_CR7","doi-asserted-by":"crossref","first-page":"8161","DOI":"10.1523\/JNEUROSCI.1554-07.2007","volume":"27","author":"B.W. Balleine","year":"2007","unstructured":"Balleine, B.W., Delgado, M.R., Hikosaka, O.: The role of the dorsal striatum in reward and decision-making. The Journal of Neuroscience\u00a027, 8161\u20138165 (2007)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR8","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1016\/j.bbr.2008.10.034","volume":"199","author":"B.W. Balleine","year":"2009","unstructured":"Balleine, B.W., Liljeholm, M., Ostlund, S.B.: The integrative function of the basal ganglia in instrumental conditioning. Behavioural Brain Research\u00a0199, 43\u201352 (2009)","journal-title":"Behavioural Brain Research"},{"key":"16_CR9","doi-asserted-by":"crossref","first-page":"439","DOI":"10.1016\/j.pneurobio.2003.12.001","volume":"71","author":"I. Bar-Gad","year":"2003","unstructured":"Bar-Gad, I., Morris, G., Bergman, H.: Information processing, dimensionality reduction, and reinforcement learning in the basal ganglia. Progress in Neurobiology\u00a071, 439\u2013473 (2003)","journal-title":"Progress in Neurobiology"},{"key":"16_CR10","doi-asserted-by":"crossref","first-page":"1158","DOI":"10.1038\/nature04053","volume":"437","author":"T.D. Barnes","year":"2005","unstructured":"Barnes, T.D., Kubota, Y., Hu, D., Jin, D.Z., Graybiel, A.M.: Activity of striatal neurons reflects dynamic encoding and recoding of procedural memories. Nature\u00a0437, 1158\u20131161 (2005)","journal-title":"Nature"},{"key":"16_CR11","first-page":"229","volume":"4","author":"A.G. Barto","year":"1985","unstructured":"Barto, A.G.: Learning by statistical cooperation of self-interested neuron-like computing elements. Human Neurobiology\u00a04, 229\u2013256 (1985)","journal-title":"Human Neurobiology"},{"key":"16_CR12","first-page":"215","volume-title":"Models of Information Processing in the Basal Ganglia, ch. 11","author":"A.G. Barto","year":"1995","unstructured":"Barto, A.G.: Adaptive critics and the basal ganglia. In: Houk, J.C., Davis, J.L., Beiser, D.G. (eds.) Models of Information Processing in the Basal Ganglia, ch. 11, pp. 215\u2013232. MIT Press, Cambridge (1995)"},{"key":"16_CR13","doi-asserted-by":"crossref","first-page":"341","DOI":"10.1023\/A:1025696116075","volume":"13","author":"A.G. Barto","year":"2003","unstructured":"Barto, A.G., Mahadevan, S.: Recent advances in hierarchical reinforcement learning. Discrete Event Dynamic Systems\u00a013, 341\u2013379 (2003)","journal-title":"Discrete Event Dynamic Systems"},{"key":"16_CR14","doi-asserted-by":"crossref","first-page":"221","DOI":"10.1016\/0166-4328(82)90001-8","volume":"4","author":"A.G. Barto","year":"1982","unstructured":"Barto, A.G., Sutton, R.S.: Simulation of anticipatory responses in classical conditioning by a neuron-like adaptive element. Behavioral Brain Research\u00a04, 221\u2013235 (1982)","journal-title":"Behavioral Brain Research"},{"key":"16_CR15","first-page":"835","volume":"13","author":"A.G. Barto","year":"1983","unstructured":"Barto, A.G., Sutton, R.S., Anderson, C.W.: Neuronlike elements that can solve difficult learning control problems. IEEE Transactions on Systems, Man, and Cybernectics\u00a013, 835\u2013846 (1983)","journal-title":"IEEE Transactions on Systems, Man, and Cybernectics"},{"key":"16_CR16","doi-asserted-by":"crossref","first-page":"129","DOI":"10.1016\/j.neuron.2005.05.020","volume":"47","author":"H.M. Bayer","year":"2005","unstructured":"Bayer, H.M., Glimcher, P.W.: Midbrain dopamine neurons encode a quantitative reward prediction error signal. Neuron\u00a047, 129\u2013141 (2005)","journal-title":"Neuron"},{"key":"16_CR17","doi-asserted-by":"crossref","first-page":"89","DOI":"10.1016\/j.bbr.2008.09.027","volume":"199","author":"D. Belin","year":"2009","unstructured":"Belin, D., Jonkman, S., Dickinson, A., Robbins, T.W., Everitt, B.J.: Parallel and interactive learning processes within the basal ganglia: relevance for the understanding of addiction. Behavioural Brain Research\u00a0199, 89\u2013102 (2009)","journal-title":"Behavioural Brain Research"},{"key":"16_CR18","doi-asserted-by":"crossref","first-page":"391","DOI":"10.1007\/s00213-006-0578-x","volume":"191","author":"K.C. Berridge","year":"2007","unstructured":"Berridge, K.C.: The debate over dopamine\u2019s role in reward: The case for incentive salience. Psychopharmacology\u00a0191, 391\u2013431 (2007)","journal-title":"Psychopharmacology"},{"key":"16_CR19","doi-asserted-by":"crossref","first-page":"309","DOI":"10.1016\/S0165-0173(98)00019-8","volume":"28","author":"K.C. Berridge","year":"1998","unstructured":"Berridge, K.C., Robinson, T.E.: What is the role of dopamine in reward: Hedonic impact, reward learning, or incentive salience? Brain Research Reviews\u00a028, 309\u2013369 (1998)","journal-title":"Brain Research Reviews"},{"key":"16_CR20","doi-asserted-by":"crossref","first-page":"65","DOI":"10.1016\/j.coph.2008.12.014","volume":"9","author":"K.C. Berridge","year":"2009","unstructured":"Berridge, K.C., Robinson, T.E., Aldridge, J.W.: Dissecting components of reward: \u2019Liking,\u2019 \u2019wanting,\u2019 and learning. Current Opinion in Pharamacology\u00a09, 65\u201373 (2009)","journal-title":"Current Opinion in Pharamacology"},{"key":"16_CR21","doi-asserted-by":"crossref","first-page":"194","DOI":"10.1016\/j.tins.2007.03.006","volume":"30","author":"A. Bj\u00f6rklund","year":"2007","unstructured":"Bj\u00f6rklund, A., Dunnett, S.B.: Dopamine neuron systems in the brain: an update. Trends in Neurosciences\u00a030, 194\u2013202 (2007)","journal-title":"Trends in Neurosciences"},{"key":"16_CR22","doi-asserted-by":"crossref","first-page":"442","DOI":"10.1162\/neco.2007.19.2.442","volume":"19","author":"R. Bogacz","year":"2007","unstructured":"Bogacz, R., Gurney, K.: The basal ganglia and cortex implement optimal decision making between alternative actions. Neural Computation\u00a019, 442\u2013477 (2007)","journal-title":"Neural Computation"},{"key":"16_CR23","doi-asserted-by":"crossref","first-page":"262","DOI":"10.1016\/j.cognition.2008.08.011","volume":"113","author":"M.M. Botvinick","year":"2009","unstructured":"Botvinick, M.M., Niv, Y., Barto, A.G.: Hierarchically organized behavior and its neural foundations: A reinforcement-learning perspective. Cognition\u00a0113, 262\u2013280 (2009)","journal-title":"Cognition"},{"key":"16_CR24","doi-asserted-by":"crossref","first-page":"232","DOI":"10.1007\/978-1-4419-8558-3_7","volume-title":"A Neuroscientist\u2019s Guide to Classical Conditioning","author":"S.E. Brandon","year":"2002","unstructured":"Brandon, S.E., Vogel, E.G., Wagner, A.R.: Computational theories of classical conditioning. In: Moore, J.W. (ed.) A Neuroscientist\u2019s Guide to Classical Conditioning,\u00a0ch. 7, pp. 232\u2013310. Springer, New York (2002)"},{"key":"16_CR25","doi-asserted-by":"crossref","first-page":"815","DOI":"10.1016\/j.neuron.2010.11.022","volume":"68","author":"E.S. Bromberg-Martin","year":"2010","unstructured":"Bromberg-Martin, E.S., Matsumoto, M., Hikosaka, O.: Dopamine in motivational control: Rewarding, aversive, and alerting. Neuron\u00a068, 815\u2013834 (2010)","journal-title":"Neuron"},{"key":"16_CR26","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1901\/jeab.1968.11-1","volume":"11","author":"P.L. Brown","year":"1968","unstructured":"Brown, P.L., Jenkins, H.M.: Auto-shaping of the pigeon\u2019s key-peck. Journal of the Experimental Analysis of Behavior\u00a011, 1\u20138 (1968)","journal-title":"Journal of the Experimental Analysis of Behavior"},{"key":"16_CR27","doi-asserted-by":"crossref","first-page":"211","DOI":"10.1016\/j.tins.2007.03.001","volume":"30","author":"P. Calabresi","year":"2007","unstructured":"Calabresi, P., Picconi, B., Tozzi, A., DiFilippo, M.: Dopamine-mediated regulation of corticostriatal synaptic plasticity. Trends in Neuroscience\u00a030, 211\u2013219 (2007)","journal-title":"Trends in Neuroscience"},{"key":"16_CR28","doi-asserted-by":"crossref","first-page":"827","DOI":"10.1523\/JNEUROSCI.23-34-10827.2003","volume":"23","author":"C.M. Cannon","year":"2003","unstructured":"Cannon, C.M., Palmiter, R.D.: Reward without dopamine. Journal of Neuroscience\u00a023, 10,827\u201310,831 (2003)","journal-title":"Journal of Neuroscience"},{"key":"16_CR29","doi-asserted-by":"crossref","first-page":"321","DOI":"10.1016\/S0149-7634(02)00007-6","volume":"26","author":"R.N. Cardinal","year":"2002","unstructured":"Cardinal, R.N., Parkinson, J.A., Hall, J., Everitt, B.J.: Emotion and motivation: The role of the amygdala, ventral striatum, and prefrontal cortex. Neuroscience and Biobehavioural Reviews\u00a026, 321\u2013352 (2002)","journal-title":"Neuroscience and Biobehavioural Reviews"},{"key":"16_CR30","doi-asserted-by":"crossref","first-page":"113","DOI":"10.3758\/CABN.8.2.113","volume":"8","author":"M.X. Cohen","year":"2008","unstructured":"Cohen, M.X.: Neurocomputational mechanisms of reinforcement-guided learning in humans: a review. Cognitive, Affective, and Behavioral Neuroscience\u00a08, 113\u2013125 (2008)","journal-title":"Cognitive, Affective, and Behavioral Neuroscience"},{"key":"16_CR31","doi-asserted-by":"crossref","first-page":"141","DOI":"10.1016\/j.bbr.2008.09.029","volume":"199","author":"M.X. Cohen","year":"2009","unstructured":"Cohen, M.X., Frank, M.J.: Neurocomputational models of the basal ganglia in learning, memory, and choice. Behavioural Brain Research\u00a0199, 141\u2013156 (2009)","journal-title":"Behavioural Brain Research"},{"key":"16_CR32","doi-asserted-by":"crossref","first-page":"8178","DOI":"10.1523\/JNEUROSCI.1590-07.2007","volume":"27","author":"G. Corrado","year":"2007","unstructured":"Corrado, G., Doya, K.: Understanding neural coding through the model-based analysis of decision-making. The Journal of Neuroscience\u00a027, 8178\u20138180 (2007)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR33","doi-asserted-by":"crossref","first-page":"199","DOI":"10.1016\/j.conb.2006.03.006","volume":"16","author":"N.D. Daw","year":"2006","unstructured":"Daw, N.D., Doya, K.: The computational neurobiology of learning and reward. Current Opinion in Neurobiology\u00a016, 199\u2013204 (2006)","journal-title":"Current Opinion in Neurobiology"},{"key":"16_CR34","doi-asserted-by":"crossref","first-page":"2567","DOI":"10.1162\/089976602760407973","volume":"14","author":"N.D. Daw","year":"2002","unstructured":"Daw, N.D., Touretzky, D.S.: Long-term reward prediction in TD models of the dopamine system. Neural Computation\u00a014, 2567\u20132583 (2002)","journal-title":"Neural Computation"},{"key":"16_CR35","doi-asserted-by":"crossref","first-page":"603","DOI":"10.1016\/S0893-6080(02)00052-7","volume":"15","author":"N.D. Daw","year":"2002","unstructured":"Daw, N.D., Kakade, S., Dayan, P.: Opponent interactions between serotonin and dopamine. Neural Networks\u00a015, 603\u2013616 (2002)","journal-title":"Neural Networks"},{"key":"16_CR36","doi-asserted-by":"crossref","first-page":"1704","DOI":"10.1038\/nn1560","volume":"8","author":"N.D. Daw","year":"2005","unstructured":"Daw, N.D., Niv, Y., Dayan, P.: Uncertainty-based competition between prefrontal and dorsolateral striatal systems for behavioral control. Nature Neuroscience\u00a08, 1704\u20131711 (2005)","journal-title":"Nature Neuroscience"},{"key":"16_CR37","doi-asserted-by":"crossref","first-page":"1637","DOI":"10.1162\/neco.2006.18.7.1637","volume":"18","author":"N.D. Daw","year":"2006","unstructured":"Daw, N.D., Courville, A.C., Tourtezky, D.S.: Representation and timing in theories of the dopamine system. Neural Computation\u00a018, 1637\u20131677 (2006a)","journal-title":"Neural Computation"},{"key":"16_CR38","doi-asserted-by":"crossref","first-page":"876","DOI":"10.1038\/nature04766","volume":"441","author":"N.D. Daw","year":"2006","unstructured":"Daw, N.D., O\u2019Doherty, J.P., Dayan, P., Seymour, B., Dolan, R.J.: Cortical substrates for exploratory decisions in humans. Nature\u00a0441, 876\u2013879 (2006b)","journal-title":"Nature"},{"key":"16_CR39","doi-asserted-by":"crossref","first-page":"429","DOI":"10.3758\/CABN.8.4.429","volume":"8","author":"P. Dayan","year":"2008","unstructured":"Dayan, P., Daw, N.D.: Connections between computational and neurobiological perspectives on decision making. Cognitive, Affective, and Behavioral Neuroscience\u00a08, 429\u2013453 (2008)","journal-title":"Cognitive, Affective, and Behavioral Neuroscience"},{"key":"16_CR40","doi-asserted-by":"crossref","first-page":"185","DOI":"10.1016\/j.conb.2008.08.003","volume":"18","author":"P. Dayan","year":"2008","unstructured":"Dayan, P., Niv, Y.: Reinforcement learning: the good, the bad, and the ugly. Current Opinion in Neurobiology\u00a018, 185\u2013196 (2008)","journal-title":"Current Opinion in Neurobiology"},{"key":"16_CR41","doi-asserted-by":"crossref","first-page":"1153","DOI":"10.1016\/j.neunet.2006.03.002","volume":"19","author":"P. Dayan","year":"2006","unstructured":"Dayan, P., Niv, Y., Seymour, B., Daw, N.D.: The misbehavior of value and the discipline of the will. Neural Networks\u00a019, 1153\u20131160 (2006)","journal-title":"Neural Networks"},{"key":"16_CR42","doi-asserted-by":"crossref","first-page":"67","DOI":"10.1098\/rstb.1985.0010","volume":"308","author":"A. Dickinson","year":"1985","unstructured":"Dickinson, A.: Actions and habits: the development of behavioural autonomy. Philosophical Transactions of the Royal Society of London B: Biological Sciences\u00a0308, 67\u201378 (1985)","journal-title":"Philosophical Transactions of the Royal Society of London B: Biological Sciences"},{"key":"16_CR43","doi-asserted-by":"crossref","first-page":"1","DOI":"10.3758\/BF03199951","volume":"22","author":"A. Dickinson","year":"1994","unstructured":"Dickinson, A., Balleine, B.W.: Motivational control of goal-directed action. Animal Learning and Behavior\u00a022, 1\u201318 (1994)","journal-title":"Animal Learning and Behavior"},{"key":"16_CR44","doi-asserted-by":"crossref","first-page":"399","DOI":"10.1016\/B978-0-12-374620-7.00019-4","volume-title":"Handbook of Reward and Decision Making, ch. 19","author":"B.B. Doll","year":"2009","unstructured":"Doll, B.B., Frank, M.J.: The basal ganglia in reward and decision making: computational models and empirical studies. In: Dreher, J., Tremblay, L. (eds.) Handbook of Reward and Decision Making, ch. 19, pp. 399\u2013425. Academic Press, Oxford (2009)"},{"key":"16_CR45","doi-asserted-by":"crossref","first-page":"1476","DOI":"10.1126\/science.1107026","volume":"307","author":"E. Dommett","year":"2005","unstructured":"Dommett, E., Coizet, V., Blaha, C.D., Martindale, J., Lefebvre, V., Mayhew, N.W.J.E., Overton, P.G., Redgrave, P.: How visual stimuli activate dopaminergic neurons at short latency. Science\u00a0307, 1476\u20131479 (2005)","journal-title":"Science"},{"key":"16_CR46","doi-asserted-by":"crossref","first-page":"961","DOI":"10.1016\/S0893-6080(99)00046-5","volume":"12","author":"K. Doya","year":"1999","unstructured":"Doya, K.: What are the computations of the cerebellum, the basal ganglia, and the cerebral cortex? Neural Networks\u00a012, 961\u2013974 (1999)","journal-title":"Neural Networks"},{"key":"16_CR47","doi-asserted-by":"crossref","first-page":"30","DOI":"10.2976\/1.2732246\/10.2976\/1","volume":"1","author":"K. Doya","year":"2007","unstructured":"Doya, K.: Reinforcement learning: Computational theory and biological mechanisms. HFSP Journal\u00a01, 30\u201340 (2007)","journal-title":"HFSP Journal"},{"key":"16_CR48","doi-asserted-by":"crossref","first-page":"410","DOI":"10.1038\/nn2077","volume":"11","author":"K. Doya","year":"2008","unstructured":"Doya, K.: Modulators of decision making. Nature Neuroscience\u00a011, 410\u2013416 (2008)","journal-title":"Nature Neuroscience"},{"key":"16_CR49","doi-asserted-by":"crossref","first-page":"61","DOI":"10.1016\/j.bbr.2008.11.012","volume":"199","author":"J. Doyon","year":"2009","unstructured":"Doyon, J., Bellec, P., Amsel, R., Penhune, V., Monchi, O., Carrier, J., Leh\u00e9ricy, S., Benali, H.: Contributions of the basal ganglia and functionally related brain structures to motor learning. Behavioural Brain Research\u00a0199, 61\u201375 (2009)","journal-title":"Behavioural Brain Research"},{"key":"16_CR50","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1901\/jeab.1980.33-299","volume":"33","author":"D.A. Eckerman","year":"1980","unstructured":"Eckerman, D.A., Hienz, R.D., Stern, S., Kowlowitz, V.: Shaping the location of a pigeon\u2019s peck: Effect of rate and size of shaping steps. Journal of the Experimental Analysis of Behavior\u00a033, 299\u2013310 (1980)","journal-title":"Journal of the Experimental Analysis of Behavior"},{"key":"16_CR51","doi-asserted-by":"crossref","DOI":"10.1037\/10627-000","volume-title":"Schedules of Reinforcement","author":"C.B. Ferster","year":"1957","unstructured":"Ferster, C.B., Skinner, B.F.: Schedules of Reinforcement. Appleton-Century-Crofts, New York (1957)"},{"key":"16_CR52","doi-asserted-by":"crossref","first-page":"1898","DOI":"10.1126\/science.1077349","volume":"299","author":"C.D. Fiorillo","year":"2003","unstructured":"Fiorillo, C.D., Tobler, P.N., Schultz, W.: Discrete coding of reward probability and uncertainty by dopamine neurons. Science\u00a0299, 1898\u20131902 (2003)","journal-title":"Science"},{"key":"16_CR53","doi-asserted-by":"crossref","first-page":"51","DOI":"10.1162\/0898929052880093","volume":"17","author":"M.J. Frank","year":"2005","unstructured":"Frank, M.J.: Dynamic dopamine modulation in the basal ganglia: a neurocomputational account of cognitive deficits in medicated and nonmedicated Parkinsonism. Journal of Cognitive Neuroscience\u00a017, 51\u201372 (2005)","journal-title":"Journal of Cognitive Neuroscience"},{"key":"16_CR54","doi-asserted-by":"crossref","first-page":"300","DOI":"10.1037\/0033-295X.113.2.300","volume":"113","author":"M.J. Frank","year":"2006","unstructured":"Frank, M.J., Claus, E.D.: Anatomy of a decision: Striato-orbitofrontal interactions in reinforcement learning, decision making, and reversal. Psychological Review\u00a0113, 300\u2013326 (2006)","journal-title":"Psychological Review"},{"key":"16_CR55","doi-asserted-by":"crossref","first-page":"1940","DOI":"10.1126\/science.1102941","volume":"306","author":"M.J. Frank","year":"2004","unstructured":"Frank, M.J., Seeberger, L.C., O\u2019Reilly, R.C.: By carrot or by stick: Cognitive reinforcement learning in parkinsonism. Science\u00a0306, 1940\u20131943 (2004)","journal-title":"Science"},{"key":"16_CR56","doi-asserted-by":"crossref","first-page":"710","DOI":"10.2307\/1420328","volume":"71","author":"R. Gardner","year":"1958","unstructured":"Gardner, R.: Multiple-choice decision behavior. American Journal of Psychology\u00a071, 710\u2013717 (1958)","journal-title":"American Journal of Psychology"},{"key":"16_CR57","first-page":"501","volume":"1","author":"J.P. Gl\u00e4scher","year":"2010","unstructured":"Gl\u00e4scher, J.P., O\u2019Doherty, J.P.: Model-based approaches to neuroimaging combining reinforcement learning theory with fMRI data. Wiley Interdisciplinary Reviews: Cognitive Science\u00a01, 501\u2013510 (2010)","journal-title":"Wiley Interdisciplinary Reviews: Cognitive Science"},{"key":"16_CR58","doi-asserted-by":"crossref","first-page":"585","DOI":"10.1016\/j.neuron.2010.04.016","volume":"66","author":"J.P. Gl\u00e4scher","year":"2010","unstructured":"Gl\u00e4scher, J.P., Daw, N.D., Dayan, P., O\u2019Doherty, J.P.: States versus rewards: Dissociable neural prediction error signals underlying model-based and model-free reinforcement learning. Neuron\u00a066, 585\u2013595 (2010)","journal-title":"Neuron"},{"key":"16_CR59","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/2302.001.0001","volume-title":"Decisions, Uncertainty, and the Brain: The Science of Neuroeconomics","author":"P.W. Glimcher","year":"2003","unstructured":"Glimcher, P.W.: Decisions, Uncertainty, and the Brain: The Science of Neuroeconomics. MIT Press, Cambridge (2003)"},{"key":"16_CR60","doi-asserted-by":"crossref","first-page":"447","DOI":"10.1126\/science.1102566","volume":"306","author":"P.W. Glimcher","year":"2004","unstructured":"Glimcher, P.W., Rustichini, A.: Neuroeconomics: The consilience of brain and decision. Science\u00a0306, 447\u2013452 (2004)","journal-title":"Science"},{"key":"16_CR61","first-page":"281","volume-title":"Memory and Mind: A Festschrift for Gordon H. Bower","author":"M.A. Gluck","year":"2008","unstructured":"Gluck, M.A.: Behavioral and neural correlates of error correction in classical conditioning and human category learning. In: Gluck, M.A., Anderson, J.R., Kosslyn, S.M. (eds.) Memory and Mind: A Festschrift for Gordon H. Bower,\u00a0ch. 18, pp. 281\u2013305. Lawrence Earlbaum Associates, New York (2008)"},{"key":"16_CR62","doi-asserted-by":"crossref","first-page":"535","DOI":"10.1146\/annurev.neuro.29.051605.113038","volume":"30","author":"J.I. Gold","year":"2007","unstructured":"Gold, J.I., Shadlen, M.N.: The neural basis of decision making. Annual Review of Neuroscience\u00a030, 535\u2013574 (2007)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR63","doi-asserted-by":"crossref","first-page":"447","DOI":"10.1016\/0896-6273(95)90300-3","volume":"14","author":"P.S. Goldman-Rakic","year":"1995","unstructured":"Goldman-Rakic, P.S.: Cellular basis of working memory. Neuron\u00a014, 447\u2013485 (1995)","journal-title":"Neuron"},{"key":"16_CR64","doi-asserted-by":"crossref","first-page":"106","DOI":"10.2307\/1418393","volume":"68","author":"J.T. Goodnow","year":"1955","unstructured":"Goodnow, J.T.: Determinants of choice-distribution in two-choice situations. The American Journal of Psychology\u00a068, 106\u2013116 (1955)","journal-title":"The American Journal of Psychology"},{"key":"16_CR65","doi-asserted-by":"crossref","first-page":"33","DOI":"10.1126\/science.138.3536.33","volume":"138","author":"I. Gormezano","year":"1962","unstructured":"Gormezano, I., Schneiderman, N., Deaux, E.G., Fuentes, I.: Nictitating membrane: Classical conditioning and extinction in the albino rabbit. Science\u00a0138, 33\u201334 (1962)","journal-title":"Science"},{"key":"16_CR66","doi-asserted-by":"crossref","first-page":"590","DOI":"10.1016\/j.humov.2007.05.009","volume":"26","author":"S.T. Grafton","year":"2007","unstructured":"Grafton, S.T., Hamilton, A.F.: Evidence for a distributed hierarchy of action representation in the brain. Human Movement Science\u00a026, 590\u2013616 (2007)","journal-title":"Human Movement Science"},{"key":"16_CR67","doi-asserted-by":"crossref","first-page":"638","DOI":"10.1016\/j.conb.2005.10.006","volume":"15","author":"A.M. Graybiel","year":"2005","unstructured":"Graybiel, A.M.: The basal ganglia: learning new tricks and loving it. Current Opinion in Neurobiology\u00a015, 638\u2013644 (2005)","journal-title":"Current Opinion in Neurobiology"},{"key":"16_CR68","doi-asserted-by":"crossref","first-page":"359","DOI":"10.1146\/annurev.neuro.29.051605.112851","volume":"31","author":"A.M. Graybiel","year":"2008","unstructured":"Graybiel, A.M.: Habits, rituals, and the evaluative brain. Annual Review of Neuroscience\u00a031, 359\u2013387 (2008)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR69","doi-asserted-by":"crossref","first-page":"1826","DOI":"10.1126\/science.8091209","volume":"265","author":"A.M. Graybiel","year":"1994","unstructured":"Graybiel, A.M., Aosaki, T., Flahrety, A.W., Kimura, M.: The basal ganglia and adaptive motor control. Science\u00a0265, 1826\u20131831 (1994)","journal-title":"Science"},{"key":"16_CR70","doi-asserted-by":"crossref","first-page":"769","DOI":"10.1037\/0033-2909.130.5.769","volume":"130","author":"L. Green","year":"2004","unstructured":"Green, L., Myerson, J.: A discounting framework for choice with delayed and probabilistic rewards. Psychological Bulletin\u00a0130, 769\u2013792 (2004)","journal-title":"Psychological Bulletin"},{"key":"16_CR71","volume-title":"2005 AAAI Spring Symposium Series: Developmental Robotics","author":"R. Grupen","year":"2005","unstructured":"Grupen, R., Huber, M.: A framework for the development of robot behavior. In: 2005 AAAI Spring Symposium Series: Developmental Robotics. American Association for the Advancement of Artificial Intelligence, Palo Alta (2005)"},{"key":"16_CR72","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1007\/s12559-009-9010-2","volume":"1","author":"K. Gurney","year":"2009","unstructured":"Gurney, K.: Reverse engineering the vertebrate brain: Methodological principles for a biologically grounded programme of cognitive modelling. Cognitive Computation\u00a01, 29\u201341 (2009)","journal-title":"Cognitive Computation"},{"key":"16_CR73","doi-asserted-by":"crossref","first-page":"401","DOI":"10.1007\/PL00007984","volume":"84","author":"K. Gurney","year":"2001","unstructured":"Gurney, K., Prescott, T.J., Redgrave, P.: A computational model of action selection in the basal ganglia. I. A new functional anatomy. Biological Cybernetics\u00a084, 401\u2013410 (2001)","journal-title":"Biological Cybernetics"},{"key":"16_CR74","doi-asserted-by":"crossref","first-page":"453","DOI":"10.1016\/j.tins.2004.06.003","volume":"27","author":"K. Gurney","year":"2004","unstructured":"Gurney, K., Prescott, T.J., Wickens, J.R., Redgrave, P.: Computational models of the basal ganglia: From robots to membranes. Trends in Neuroscience\u00a027, 453\u2013459 (2004)","journal-title":"Trends in Neuroscience"},{"key":"16_CR75","doi-asserted-by":"crossref","first-page":"317","DOI":"10.1016\/j.jchemneu.2003.10.003","volume":"26","author":"S.N. Haber","year":"2003","unstructured":"Haber, S.N.: The primate basal ganglia: Parallel and integrative networks. Journal of Chemical Neuroanatomy\u00a026, 317\u2013330 (2003)","journal-title":"Journal of Chemical Neuroanatomy"},{"key":"16_CR76","doi-asserted-by":"crossref","first-page":"8368","DOI":"10.1523\/JNEUROSCI.0271-06.2006","volume":"26","author":"S.N. Haber","year":"2006","unstructured":"Haber, S.N., Kim, K.S., Mailly, P., Calzavara, R.: Reward-related cortical inputs define a large striatal region in primates that interface with associative cortical inputs, providing a substrate for incentive-based learning. The Journal of Neuroscience\u00a026, 8368\u20138376 (2006)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR77","doi-asserted-by":"crossref","first-page":"1242","DOI":"10.1016\/j.neunet.2006.06.007","volume":"19","author":"M. Haruno","year":"2006","unstructured":"Haruno, M., Kawato, M.: Heterarchical reinforcement-learning model for integration of multiple cortico-striatal loops: fMRI examination in stimulus-action-reward association learning. Neural Networks\u00a019, 1242\u20131254 (2006)","journal-title":"Neural Networks"},{"key":"16_CR78","doi-asserted-by":"crossref","first-page":"701","DOI":"10.1016\/j.neubiorev.2009.11.019","volume":"34","author":"T.E. Hazy","year":"2010","unstructured":"Hazy, T.E., Frank, M.J., O\u2019Reilly, R.C.: Neural mechanisms of acquired phasic dopamine repsonses in learning. Neuroscience and Biobehavioral Reviews\u00a034, 701\u2013720 (2010)","journal-title":"Neuroscience and Biobehavioral Reviews"},{"key":"16_CR79","doi-asserted-by":"crossref","first-page":"267","DOI":"10.1901\/jeab.1961.4-267","volume":"4","author":"R.J. Herrnstein","year":"1961","unstructured":"Herrnstein, R.J.: Relative and absolute strength of response as a function of frequency of reinforcement. Journal of the Experimental Analysis of Behavior\u00a04, 267\u2013272 (1961)","journal-title":"Journal of the Experimental Analysis of Behavior"},{"key":"16_CR80","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1196\/annals.1390.012","volume":"1104","author":"O. Hikosaka","year":"2007","unstructured":"Hikosaka, O.: Basal ganglia mechanisms of reward-oriented eye movement. Annals of the New York Academy of Science\u00a01104, 229\u2013249 (2007)","journal-title":"Annals of the New York Academy of Science"},{"key":"16_CR81","doi-asserted-by":"crossref","first-page":"304","DOI":"10.1038\/1124","volume":"1","author":"J.R. Hollerman","year":"1998","unstructured":"Hollerman, J.R., Schultz, W.: Dopamine neurons report an error in the temporal prediction of reward during learning. Nature Neuroscience\u00a01, 304\u2013309 (1998)","journal-title":"Nature Neuroscience"},{"key":"16_CR82","doi-asserted-by":"crossref","first-page":"651","DOI":"10.1016\/S0306-4522(00)00019-1","volume":"96","author":"J.C. Horvitz","year":"2000","unstructured":"Horvitz, J.C.: Mesolimbocortical and nigrostriatal dopamine responses to salient non-reward events. Neuroscience\u00a096, 651\u2013656 (2000)","journal-title":"Neuroscience"},{"key":"16_CR83","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1093\/cercor\/5.2.95","volume":"5","author":"J.C. Houk","year":"1995","unstructured":"Houk, J.C., Wise, S.P.: Distributed modular architectures linking basal ganglia, cerebellum, and cerebral cortex: Their role in planning and controlling action. Cerebral Cortex\u00a05, 95\u2013110 (1995)","journal-title":"Cerebral Cortex"},{"key":"16_CR84","first-page":"249","volume-title":"Models of Information Processing in the Basal Ganglia, ch. 13","author":"J.C. Houk","year":"1995","unstructured":"Houk, J.C., Adams, J.L., Barto, A.G.: A model of how the basal ganglia generate and use neural signals that predict reinforcement. In: Houk, J.C., Davis, J.L., Beiser, D.G. (eds.) Models of Information Processing in the Basal Ganglia, ch. 13, pp. 249\u2013270. MIT Press, Cambridge (1995)"},{"key":"16_CR85","doi-asserted-by":"crossref","first-page":"1573","DOI":"10.1098\/rstb.2007.2063","volume":"362","author":"J.C. Houk","year":"2007","unstructured":"Houk, J.C., Bastianen, C., Fansler, D., Fishbach, A., Fraser, D., Reber, P.J., Roy, S.A., Simo, L.S.: Action selection and refinement in subcortical loops through basal ganglia and cerebellum. Philosophical Transactions of the Royal Society of London B: Biological Sciences\u00a0362, 1573\u20131583 (2007)","journal-title":"Philosophical Transactions of the Royal Society of London B: Biological Sciences"},{"key":"16_CR86","volume-title":"Principles of Behavior","author":"C.L. Hull","year":"1943","unstructured":"Hull, C.L.: Principles of Behavior. Appleton-Century-Crofts, New York (1943)"},{"key":"16_CR87","doi-asserted-by":"crossref","first-page":"385","DOI":"10.1016\/j.pneurobio.2009.11.003","volume":"90","author":"M.D. Humphries","year":"2010","unstructured":"Humphries, M.D., Prescott, T.J.: The ventral basal ganglia, a selection mechanism at the crossroads of space, strategy, and reward. Progress in Neurobiology\u00a090, 385\u2013417 (2010)","journal-title":"Progress in Neurobiology"},{"key":"16_CR88","doi-asserted-by":"crossref","first-page":"9861","DOI":"10.1523\/JNEUROSCI.6157-08.2009","volume":"29","author":"M. Ito","year":"2009","unstructured":"Ito, M., Doya, K.: Validation of decision-making models and analysis of decision variables in the rat basal ganglia. The Journal of Neuroscience\u00a029, 9861\u20139874 (2009)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR89","doi-asserted-by":"crossref","first-page":"363","DOI":"10.1016\/0306-4522(94)90536-3","volume":"63","author":"D. Joel","year":"1994","unstructured":"Joel, D., Weiner, I.: The organization of the basal ganglia-thalamocortical circuits: Open interconnected rather than closed segregated. Neuroscience\u00a063, 363\u2013379 (1994)","journal-title":"Neuroscience"},{"key":"16_CR90","doi-asserted-by":"crossref","first-page":"535","DOI":"10.1016\/S0893-6080(02)00047-3","volume":"15","author":"D. Joel","year":"2002","unstructured":"Joel, D., Niv, Y., Ruppin, E.: Actor-critic models of the basal ganglia: New anatomical and computational perspectives. Neural Networks\u00a015, 535\u2013547 (2002)","journal-title":"Neural Networks"},{"key":"16_CR91","doi-asserted-by":"crossref","first-page":"615","DOI":"10.1016\/j.conb.2009.10.001","volume":"19","author":"M. Joshua","year":"2009","unstructured":"Joshua, M., Adler, A., Bergman, H.: The dynamics of dopamine in control of motor behavior. Current Opinion in Neurobiology\u00a019, 615\u2013620 (2009)","journal-title":"Current Opinion in Neurobiology"},{"key":"16_CR92","first-page":"279","volume-title":"Punishment and Aversive Behavior","author":"L.J. Kamin","year":"1969","unstructured":"Kamin, L.J.: Predictability, surprise, attention, and conditioning. In: Campbell, B.A., Church, R.M. (eds.) Punishment and Aversive Behavior, pp. 279\u2013296. Appleton-Century-Crofts, New York (1969)"},{"key":"16_CR93","doi-asserted-by":"crossref","first-page":"455","DOI":"10.3758\/BF03205056","volume":"15","author":"E.J. Kehoe","year":"1987","unstructured":"Kehoe, E.J., Schreurs, B.G., Graham, P.: Temporal primacy overrides prior training in serial compound conditioning of the rabbit\u2019s nictitating membrane response. Animal Learning and Behavior\u00a015, 455\u2013464 (1987)","journal-title":"Animal Learning and Behavior"},{"key":"16_CR94","first-page":"701","volume":"29","author":"H. Kim","year":"2009","unstructured":"Kim, H., Sul, J.H., Huh, N., Lee, D., Jung, M.W.: Role of striatum in updating values of chosen actions. The Journal of Neuroscience\u00a029, 14,701\u201314,712 (2009)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR95","doi-asserted-by":"crossref","first-page":"543","DOI":"10.1016\/j.neuron.2010.07.021","volume":"67","author":"K.T. Kishida","year":"2010","unstructured":"Kishida, K.T., King-Casas, B., Montague, P.R.: Neuroeconomic approaches to mental disorders. Neuron\u00a067, 543\u2013554 (2010)","journal-title":"Neuron"},{"key":"16_CR96","volume-title":"The Hedonistic Neuron: A Theory of Memory, Learning and Intelligence","author":"A.H. Klopf","year":"1982","unstructured":"Klopf, A.H.: The Hedonistic Neuron: A Theory of Memory, Learning and Intelligence. Hemisphere Publishing Corporation, Washington DC (1982)"},{"key":"16_CR97","doi-asserted-by":"crossref","first-page":"7837","DOI":"10.1523\/JNEUROSCI.1600-08.2008","volume":"28","author":"S. Kobayashi","year":"2008","unstructured":"Kobayashi, S., Schultz, W.: Influence of reward delays on responses of dopamine neurons. The Journal of Neuroscience\u00a028, 7837\u20137846 (2008)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR98","first-page":"1015","volume-title":"Advances in Neural Information Processing Systems (NIPS)","author":"G.D. Konidaris","year":"2009","unstructured":"Konidaris, G.D., Barto, A.G.: Skill discovery in continuous reinforcement learning domains using skill chaining. In: Bengio, Y., Schuurmans, D., Lafferty, J., Williams, C.K.I., Culotta, A. (eds.) Advances in Neural Information Processing Systems (NIPS), vol.\u00a022, pp. 1015\u20131023. MIT Press, Cambridge (2009)"},{"key":"16_CR99","doi-asserted-by":"crossref","first-page":"451","DOI":"10.1016\/j.neuron.2008.02.021","volume":"58","author":"B. Lau","year":"2008","unstructured":"Lau, B., Glimcher, P.W.: Value representations in the primate striatum during matching behavior. Neuron\u00a058, 451\u2013463 (2008)","journal-title":"Neuron"},{"key":"16_CR100","doi-asserted-by":"crossref","first-page":"145","DOI":"10.1152\/jn.1992.67.1.145","volume":"67","author":"T. Ljungberg","year":"1992","unstructured":"Ljungberg, T., Apicella, P., Schultz, W.: Responses of monkey dopamine neurons during learning of behavioral reactions. Journal of Neurophysiology\u00a067, 145\u2013163 (1992)","journal-title":"Journal of Neurophysiology"},{"key":"16_CR101","doi-asserted-by":"crossref","first-page":"3034","DOI":"10.1162\/neco.2008.11-07-654","volume":"20","author":"E.A. Ludvig","year":"2008","unstructured":"Ludvig, E.A., Sutton, R.S., Kehoe, E.J.: Stimulus representation and the timing of reward-prediction errors in models of the dopamine system. Neural Computation\u00a020, 3034\u20133054 (2008)","journal-title":"Neural Computation"},{"key":"16_CR102","doi-asserted-by":"crossref","first-page":"343","DOI":"10.3758\/CABN.9.4.343","volume":"9","author":"T.V. Maia","year":"2009","unstructured":"Maia, T.V.: Reinforcement learning, conditioning, and the brain: Successes and challenges. Cognitive, Affective, and Behavioral Neuroscience\u00a09, 343\u2013364 (2009)","journal-title":"Cognitive, Affective, and Behavioral Neuroscience"},{"key":"16_CR103","doi-asserted-by":"crossref","first-page":"154","DOI":"10.1038\/nn.2723","volume":"14","author":"T.V. Maia","year":"2011","unstructured":"Maia, T.V., Frank, M.J.: From reinforcement learning models to psychiatric and neurobiological disorders. Nature Neuroscience\u00a014, 154\u2013162 (2011)","journal-title":"Nature Neuroscience"},{"key":"16_CR104","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1126\/science.1084204","volume":"301","author":"K. Matsumoto","year":"2003","unstructured":"Matsumoto, K., Suzuki, W., Tanaka, K.: Neuronal correlates of goal-based motor selection in the prefrontal cortex. Science\u00a0301, 229\u2013232 (2003)","journal-title":"Science"},{"key":"16_CR105","doi-asserted-by":"crossref","first-page":"1819","DOI":"10.1152\/jn.00784.2006","volume":"97","author":"Y. Matsuzaka","year":"2007","unstructured":"Matsuzaka, Y., Picard, N., Strick, P.: Skill representation in the primary motor cortex after long-term practice. Journal of Neurophysiology\u00a097, 1819\u20131832 (2007)","journal-title":"Journal of Neurophysiology"},{"key":"16_CR106","doi-asserted-by":"crossref","first-page":"401","DOI":"10.1016\/j.tins.2005.06.006","volume":"28","author":"J.G. McHaffie","year":"2005","unstructured":"McHaffie, J.G., Stanford, T.R., Stein, B.E., Coizet, V., Redgrave, P.: Subcortical loops through the basal ganglia. Trends in Neurosciences\u00a028, 401\u2013407 (2005)","journal-title":"Trends in Neurosciences"},{"key":"16_CR107","doi-asserted-by":"crossref","first-page":"926","DOI":"10.1093\/cercor\/12.9.926","volume":"12","author":"F.A. Middleton","year":"2002","unstructured":"Middleton, F.A., Strick, P.L.: Basal-ganglia\u201cprojections\u201d to the prefrontal cortex of the primate. Cerebral Cortex\u00a012, 926\u2013935 (2002)","journal-title":"Cerebral Cortex"},{"key":"16_CR108","doi-asserted-by":"crossref","first-page":"167","DOI":"10.1146\/annurev.neuro.24.1.167","volume":"24","author":"E.K. Miller","year":"2001","unstructured":"Miller, E.K., Cohen, J.D.: An integrative theory of prefrontal cortex function. Annual Review of Neuroscience\u00a024, 167\u2013202 (2001)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR109","doi-asserted-by":"crossref","first-page":"1255","DOI":"10.1016\/0024-3205(81)90231-9","volume":"29","author":"J.D. Miller","year":"1981","unstructured":"Miller, J.D., Sanghera, M.K., German, D.C.: Mesencephalic dopaminergic unit activity in the behaviorally conditioned rat. Life Sciences\u00a029, 1255\u20131263 (1981)","journal-title":"Life Sciences"},{"key":"16_CR110","doi-asserted-by":"crossref","first-page":"381","DOI":"10.1016\/S0301-0082(96)00042-1","volume":"50","author":"J.W. Mink","year":"1996","unstructured":"Mink, J.W.: The basal ganglia: Focused selection and inhibition of competing motor programs. Progress in Neurobiology\u00a050, 381\u2013425 (1996)","journal-title":"Progress in Neurobiology"},{"key":"16_CR111","doi-asserted-by":"crossref","first-page":"215","DOI":"10.1080\/09540091003682553","volume":"22","author":"M. Mirolli","year":"2010","unstructured":"Mirolli, M., Mannella, F., Baldassarre, G.: The roles of the amygdala in the affective regulation of body, brain, and behaviour. Connection Science\u00a022, 215\u2013245 (2010)","journal-title":"Connection Science"},{"key":"16_CR112","doi-asserted-by":"crossref","first-page":"1936","DOI":"10.1523\/JNEUROSCI.16-05-01936.1996","volume":"16","author":"P.R. Montague","year":"1996","unstructured":"Montague, P.R., Dayan, P., Sejnowski, T.J.: A framework for mesencephalic dopamine systems based on predictive Hebbian learning. Journal of Neuroscience\u00a016, 1936\u20131947 (1996)","journal-title":"Journal of Neuroscience"},{"key":"16_CR113","doi-asserted-by":"crossref","first-page":"760","DOI":"10.1038\/nature03015","volume":"431","author":"P.R. Montague","year":"2004","unstructured":"Montague, P.R., Hyman, S.E., Cohen, J.D.: Computational roles for dopamine in behavioural control. Nature\u00a0431, 760\u2013767 (2004)","journal-title":"Nature"},{"key":"16_CR114","doi-asserted-by":"crossref","first-page":"417","DOI":"10.1146\/annurev.neuro.29.051605.112903","volume":"29","author":"P.R. Montague","year":"2006","unstructured":"Montague, P.R., King-Casas, B., Cohen, J.D.: Imaging valuation models in human choice. Annual Review of Neuroscience\u00a029, 417\u2013448 (2006)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR115","doi-asserted-by":"crossref","first-page":"116","DOI":"10.1101\/lm.4.1.116","volume":"4","author":"J.W. Moore","year":"1997","unstructured":"Moore, J.W., Choi, J.S.: Conditioned response timing and integration in the cerebellum. Learning and Memory\u00a04, 116\u2013129 (1997)","journal-title":"Learning and Memory"},{"key":"16_CR116","doi-asserted-by":"crossref","first-page":"1057","DOI":"10.1038\/nn1743","volume":"9","author":"G. Morris","year":"2006","unstructured":"Morris, G., Nevet, A., Arkadir, D., Vaadia, E., Bergman, H.: Midbrain dopamine neurons encode decisions for future action. Nature Neuroscience\u00a09, 1057\u20131063 (2006)","journal-title":"Nature Neuroscience"},{"key":"16_CR117","doi-asserted-by":"crossref","first-page":"631","DOI":"10.1016\/j.neuron.2006.03.045","volume":"50","author":"H. Mushiake","year":"2006","unstructured":"Mushiake, H., Saito, N., Sakamoto, K., Itoyama, Y., Tanji, J.: Activity in the lateral prefrontal cortex reflects multiple steps of future events in action plans. Neuron\u00a050, 631\u2013641 (2006)","journal-title":"Neuron"},{"key":"16_CR118","doi-asserted-by":"crossref","first-page":"269","DOI":"10.1016\/S0896-6273(03)00869-9","volume":"41","author":"H. Nakahara","year":"2004","unstructured":"Nakahara, H., Itoh, H., Kawagoe, R., Takikawa, Y., Hikosaka, O.: Dopamine neurons can represent context-dependent prediction error. Neuron\u00a041, 269\u2013280 (2004)","journal-title":"Neuron"},{"key":"16_CR119","unstructured":"Ng, A., Harada, D., Russell, S.: Policy invariance under reward transformations: theory and applications to reward shaping. In: Proceedings of the Sixteenth International Conference on Machine Learning, pp. 278\u2013287 (1999)"},{"key":"16_CR120","doi-asserted-by":"crossref","first-page":"521","DOI":"10.1007\/s00213-006-0510-4","volume":"191","author":"S.M. Nicola","year":"2007","unstructured":"Nicola, S.M.: The nucleus accumbens as part of a basal ganglia action selection circuit. Psychopharmacology\u00a0191, 521\u2013550 (2007)","journal-title":"Psychopharmacology"},{"key":"16_CR121","doi-asserted-by":"crossref","first-page":"139","DOI":"10.1016\/j.jmp.2008.12.005","volume":"53","author":"Y. Niv","year":"2009","unstructured":"Niv, Y.: Reinforcement learning in the brain. Journal of Mathematical Psychology\u00a053, 139\u2013154 (2009)","journal-title":"Journal of Mathematical Psychology"},{"key":"16_CR122","doi-asserted-by":"crossref","first-page":"6","DOI":"10.1186\/1744-9081-1-6","volume":"1","author":"Y. Niv","year":"2005","unstructured":"Niv, Y., Duff, M.O., Dayan, P.: Dopamine, uncertainty, and TD learning. Behavioral and Brain Functions\u00a01, 6 (2005)","journal-title":"Behavioral and Brain Functions"},{"key":"16_CR123","doi-asserted-by":"crossref","first-page":"987","DOI":"10.1038\/nn0806-987","volume":"9","author":"Y. Niv","year":"2006","unstructured":"Niv, Y., Daw, N.D., Dayan, P.: Choice values. Nature Neuroscience\u00a09, 987\u2013988 (2006a)","journal-title":"Nature Neuroscience"},{"key":"16_CR124","doi-asserted-by":"crossref","first-page":"375","DOI":"10.1016\/j.tics.2006.06.010","volume":"10","author":"Y. Niv","year":"2006","unstructured":"Niv, Y., Joel, D., Dayan, P.: A normative perspective on motivation. Trends in Cognitive Sciences\u00a010, 375\u2013381 (2006b)","journal-title":"Trends in Cognitive Sciences"},{"key":"16_CR125","doi-asserted-by":"crossref","first-page":"692","DOI":"10.1523\/JNEUROSCI.4828-09.2010","volume":"30","author":"K. Nomoto","year":"2010","unstructured":"Nomoto, K., Schultz, W., Watanabe, T., Sakagami, M.: Temporally extended dopamine responses to perceptually demanding reward-predictive stimuli. The Journal of Neuroscience\u00a030, 10,692\u201310,702 (2010)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR126","doi-asserted-by":"crossref","first-page":"452","DOI":"10.1126\/science.1094285","volume":"304","author":"J.P. O\u2019Doherty","year":"2004","unstructured":"O\u2019Doherty, J.P., Dayan, P., Schultz, J., Deichmann, R., Friston, K., Dolan, R.J.: Dissociable roles of ventral and dorsal striatum in instrumental conditioning. Science\u00a0304, 452\u2013454 (2004)","journal-title":"Science"},{"key":"16_CR127","doi-asserted-by":"crossref","first-page":"419","DOI":"10.1037\/h0058775","volume":"47","author":"J. Olds","year":"1954","unstructured":"Olds, J., Milner, P.: Positive reinforcement produced by electrical stimulation of septal area and other regions of rat brain. Journal of Comparative and Physiological Psychology\u00a047, 419\u2013427 (1954)","journal-title":"Journal of Comparative and Physiological Psychology"},{"key":"16_CR128","doi-asserted-by":"crossref","first-page":"283","DOI":"10.1162\/089976606775093909","volume":"18","author":"R.C. O\u2019Reilly","year":"2006","unstructured":"O\u2019Reilly, R.C., Frank, M.J.: Making working memory work: a computational model of learning in the prefrontal cortex and basal ganglia. Neural Computation\u00a018, 283\u2013328 (2006)","journal-title":"Neural Computation"},{"key":"16_CR129","doi-asserted-by":"crossref","first-page":"563","DOI":"10.1146\/annurev.neuro.25.112701.142937","volume":"25","author":"M.G. Packard","year":"2002","unstructured":"Packard, M.G., Knowlton, B.J.: Learning and memory functions of the basal ganglia. Annual Review of Neuroscience\u00a025, 563\u2013593 (2002)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR130","doi-asserted-by":"crossref","first-page":"873","DOI":"10.1038\/nature03287","volume":"433","author":"A. Pasupathy","year":"2005","unstructured":"Pasupathy, A., Miller, E.K.: Different time courses of learning-related activity in the prefrontal cortex and striatum. Nature\u00a0433, 873\u2013876 (2005)","journal-title":"Nature"},{"key":"16_CR131","volume-title":"Conditioned Reflexes: An Investigation of the Physiological Activity of the Cerebral Cortex","author":"I.P. Pavlov","year":"1927","unstructured":"Pavlov, I.P.: Conditioned Reflexes: An Investigation of the Physiological Activity of the Cerebral Cortex. Oxford University Press, Toronto (1927)"},{"key":"16_CR132","doi-asserted-by":"crossref","first-page":"831","DOI":"10.1523\/JNEUROSCI.3177-09.2009","volume":"29","author":"C.M. Pennartz","year":"2009","unstructured":"Pennartz, C.M., Berke, J.D., Graybiel, A.M., Ito, R., Lansink, C.S., van der Meer, M., Redish, A.D., Smith, K.S., Voorn, P.: Corticostriatal interactions during learning, memory processing, and decision making. The Journal of Neuroscience\u00a029, 12,831\u201312,838 (2009)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR133","doi-asserted-by":"crossref","first-page":"1042","DOI":"10.1038\/nature05051","volume":"442","author":"M. Pessiglione","year":"2006","unstructured":"Pessiglione, M., Seymour, B., Flandin, G., Dolan, R.J., Frith, C.D.: Dopamine-dependent prediction errors underpin reward-seeking behaviour in humans. Nature\u00a0442, 1042\u20131045 (2006)","journal-title":"Nature"},{"key":"16_CR134","doi-asserted-by":"crossref","first-page":"175","DOI":"10.1016\/j.neuron.2005.09.025","volume":"48","author":"E.A. Phelps","year":"2005","unstructured":"Phelps, E.A., LeDoux, J.E.: Contributions of the amygdala to emotion processing: From animal models to human behavior. Neuron\u00a048, 175\u2013187 (2005)","journal-title":"Neuron"},{"key":"16_CR135","doi-asserted-by":"crossref","first-page":"5356","DOI":"10.1523\/JNEUROSCI.3880-04.2005","volume":"25","author":"R.A. Poldrack","year":"2005","unstructured":"Poldrack, R.A., Sabb, F.W., Foerde, K., Tom, S.M., Asarnow, R.F., Bookheimer, S.Y., Knowlton, B.J.: The neural correlates of motor skill automaticity. The Journal of Neuroscience\u00a025, 5356\u20135364 (2005)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR136","doi-asserted-by":"crossref","first-page":"571","DOI":"10.1016\/j.anbehav.2004.12.009","volume":"70","author":"L. Pompilio","year":"2005","unstructured":"Pompilio, L., Kacelnik, A.: State-dependent learning and suboptimal choice: when starlings prefer long over short delays to food. Animal Behaviour\u00a070, 571\u2013578 (2005)","journal-title":"Animal Behaviour"},{"key":"16_CR137","doi-asserted-by":"crossref","first-page":"967","DOI":"10.1038\/nrn2022","volume":"7","author":"P. Redgrave","year":"2006","unstructured":"Redgrave, P., Gurney, K.: The short-latency dopamine signal: a role in discovering novel actions? Nature Reviews Neuroscience\u00a07, 967\u2013975 (2006)","journal-title":"Nature Reviews Neuroscience"},{"key":"16_CR138","doi-asserted-by":"crossref","first-page":"322","DOI":"10.1016\/j.brainresrev.2007.10.007","volume":"58","author":"P. Redgrave","year":"2008","unstructured":"Redgrave, P., Gurney, K., Reynolds, J.: What is reinforced by phasic dopamine signals? Brain Research Reviews\u00a058, 322\u2013339 (2008)","journal-title":"Brain Research Reviews"},{"key":"16_CR139","doi-asserted-by":"crossref","first-page":"760","DOI":"10.1038\/nrn2915","volume":"11","author":"P. Redgrave","year":"2010","unstructured":"Redgrave, P., Rodriguez, M., Smith, Y., Rodriguez-Oroz, M.C., Lehericy, S., Bergman, H., Agid, Y., DeLong, M.R., Obeso, J.A.: Goal-directed and habitual control in the basal ganglia: implications for Parkinson\u2019s disease. Nature Reviews Neuroscience\u00a011, 760\u2013772 (2010)","journal-title":"Nature Reviews Neuroscience"},{"key":"16_CR140","doi-asserted-by":"crossref","first-page":"415","DOI":"10.1017\/S0140525X0800472X","volume":"31","author":"A.D. Redish","year":"2008","unstructured":"Redish, A.D., Jensen, S., Johnson, A.: A unified framework for addiction: Vulnerabilities in the decision process. Behavioral and Brain Sciences\u00a031, 415\u2013487 (2008)","journal-title":"Behavioral and Brain Sciences"},{"key":"16_CR141","first-page":"64","volume-title":"Classical Conditioning II: Current Research and Theory","author":"R.A. Rescorla","year":"1972","unstructured":"Rescorla, R.A., Wagner, A.R.: A theory of pavlovian conditioning: Variations in the effectiveness of reinforcement and nonreinforcement. In: Black, A.H., Prokasy, W.F. (eds.) Classical Conditioning II: Current Research and Theory, pp. 64\u201399. Appleton-Century-Crofts, New York (1972)"},{"key":"16_CR142","doi-asserted-by":"crossref","first-page":"267","DOI":"10.1901\/jeab.1981.36-267","volume":"36","author":"W.K. Richardson","year":"1981","unstructured":"Richardson, W.K., Warzak, W.J.: Stimulus stringing by pigeons. Journal of the Experimental Analysis of Behavior\u00a036, 267\u2013276 (1981)","journal-title":"Journal of the Experimental Analysis of Behavior"},{"key":"16_CR143","doi-asserted-by":"crossref","first-page":"1615","DOI":"10.1038\/nn2013","volume":"10","author":"M.R. Roesch","year":"2007","unstructured":"Roesch, M.R., Calu, D.J., Schoenbaum, G.: Dopamine neurons encode the better option in rats deciding between differently delayed or sized rewards. Nature Neuroscience\u00a010, 1615\u20131624 (2007)","journal-title":"Nature Neuroscience"},{"key":"16_CR144","doi-asserted-by":"crossref","first-page":"365","DOI":"10.1523\/JNEUROSCI.2572-09.2009","volume":"29","author":"M.R. Roesch","year":"2009","unstructured":"Roesch, M.R., Singh, T., Brown, P.L., Mullins, S.E., Schoenbaum, G.: Ventral striatal neurons encode the value of the chosen action in rats deciding between differently delayed or sized rewards. The Journal of Neuroscience\u00a029, 13,365\u201313,376 (2009)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR145","doi-asserted-by":"crossref","first-page":"213","DOI":"10.1196\/annals.1390.024","volume":"1104","author":"K. Samejima","year":"2007","unstructured":"Samejima, K., Doya, K.: Multiple representations of belief states and action values in corticobasal ganglia loops. Annals of the New York Academy of Sciences\u00a01104, 213\u2013228 (2007)","journal-title":"Annals of the New York Academy of Sciences"},{"key":"16_CR146","doi-asserted-by":"crossref","first-page":"1337","DOI":"10.1126\/science.1115270","volume":"310","author":"K. Samejima","year":"2005","unstructured":"Samejima, K., Ueda, Y., Doya, K., Kimura, M.: Representation of action-specific reward values in the striatum. Science\u00a0310, 1337\u20131340 (2005)","journal-title":"Science"},{"key":"16_CR147","doi-asserted-by":"crossref","first-page":"9913","DOI":"10.1523\/JNEUROSCI.23-30-09913.2003","volume":"23","author":"T. Satoh","year":"2003","unstructured":"Satoh, T., Nakai, S., Sato, T., Kimura, M.: Correlated coding of motivation and outcome of decision by dopamine neurons. The Journal of Neuroscience\u00a023, 9913\u20139923 (2003)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR148","doi-asserted-by":"crossref","first-page":"1439","DOI":"10.1152\/jn.1986.56.5.1439","volume":"56","author":"W. Schultz","year":"1986","unstructured":"Schultz, W.: Responses of midbrain dopamine neurons to behavioral trigger stimuli in the monkey. Journal of Neurophysiology\u00a056, 1439\u20131461 (1986)","journal-title":"Journal of Neurophysiology"},{"key":"16_CR149","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1152\/jn.1998.80.1.1","volume":"80","author":"W. Schultz","year":"1998","unstructured":"Schultz, W.: Predictive reward signal of dopamine neurons. Journal of Neurophysiology\u00a080, 1\u201327 (1998)","journal-title":"Journal of Neurophysiology"},{"key":"16_CR150","doi-asserted-by":"crossref","first-page":"8","DOI":"10.1146\/annurev.psych.56.091103.070229","volume":"57","author":"W. Schultz","year":"2006","unstructured":"Schultz, W.: Behavioral theories and the neurophysiology of reward. Annual Review of Psychology\u00a057, 8\u2013115 (2006)","journal-title":"Annual Review of Psychology"},{"key":"16_CR151","doi-asserted-by":"crossref","first-page":"259","DOI":"10.1146\/annurev.neuro.28.061604.135722","volume":"30","author":"W. Schultz","year":"2007","unstructured":"Schultz, W.: Multiple dopamine functions at different time courses. Annual Review of Neuroscience\u00a030, 259\u2013288 (2007)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR152","doi-asserted-by":"crossref","first-page":"24","DOI":"10.1186\/1744-9081-6-24","volume":"6","author":"W. Schultz","year":"2010","unstructured":"Schultz, W.: Dopamine signals for reward value and risk: basic and recent data. Behavioral and Brain Functions\u00a06, 24 (2010)","journal-title":"Behavioral and Brain Functions"},{"key":"16_CR153","doi-asserted-by":"crossref","first-page":"900","DOI":"10.1523\/JNEUROSCI.13-03-00900.1993","volume":"13","author":"W. Schultz","year":"1993","unstructured":"Schultz, W., Apicella, P., Ljungberg, T.: Responses of monkey dopamine neurons to reward and conditioned stimuli during successive steps of learning a delayed response task. The Journal of Neuroscience\u00a013, 900\u2013913 (1993)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR154","doi-asserted-by":"crossref","first-page":"1593","DOI":"10.1126\/science.275.5306.1593","volume":"275","author":"W. Schultz","year":"1997","unstructured":"Schultz, W., Dayan, P., Montague, P.R.: A neural substrate of prediction and reward. Science\u00a0275, 1593\u20131599 (1997)","journal-title":"Science"},{"key":"16_CR155","doi-asserted-by":"crossref","first-page":"321","DOI":"10.1016\/S0166-2236(03)00122-X","volume":"26","author":"W. Schultz","year":"2003","unstructured":"Schultz, W., Tremblay, L., Hollerman, J.R.: Changes in behavior-related neuronal activity in the striatum during learning. Trends in Neuroscience\u00a026, 321\u2013328 (2003)","journal-title":"Trends in Neuroscience"},{"key":"16_CR156","doi-asserted-by":"crossref","first-page":"203","DOI":"10.1146\/annurev.neuro.051508.135546","volume":"33","author":"C.A. Seger","year":"2010","unstructured":"Seger, C.A., Miller, E.K.: Category learning in the brain. Annual Review of Neuroscience\u00a033, 203\u2013219 (2010)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR157","first-page":"670","volume-title":"Proceedings of the Ninth International Joint Conference on Artificial Intelligence","author":"O.J. Selfridge","year":"1985","unstructured":"Selfridge, O.J., Sutton, R.S., Barto, A.G.: Training and tracking in robotics. In: Joshi, A. (ed.) Proceedings of the Ninth International Joint Conference on Artificial Intelligence, pp. 670\u2013672. Morgan Kaufmann, San Mateo (1985)"},{"key":"16_CR158","doi-asserted-by":"crossref","unstructured":"Shah, A.: Biologically-based functional mechanisms of motor skill acquisition. PhD thesis, University of Massachusetts Amherst (2008)","DOI":"10.1186\/1471-2202-8-S2-P203"},{"key":"16_CR159","doi-asserted-by":"crossref","first-page":"55","DOI":"10.1016\/j.brainres.2009.07.006","volume":"1299","author":"A. Shah","year":"2009","unstructured":"Shah, A., Barto, A.G.: Effect on movement selection of an evolving sensory representation: A multiple controller model of skill acquisition. Brain Research\u00a01299, 55\u201373 (2009)","journal-title":"Brain Research"},{"key":"16_CR160","doi-asserted-by":"crossref","first-page":"233","DOI":"10.1002\/bdm.413","volume":"15","author":"D.R. Shanks","year":"2002","unstructured":"Shanks, D.R., Tunney, R.J., McCarthy, J.D.: A re-examination of probability matching and rational choice. Journal of Behavioral Decision Making\u00a015, 233\u2013250 (2002)","journal-title":"Journal of Behavioral Decision Making"},{"key":"16_CR161","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1037\/h0045959","volume":"57","author":"S. Siegel","year":"1959","unstructured":"Siegel, S., Goldstein, D.A.: Decision making behaviour in a two-choice uncertain outcome situation. Journal of Experimental Psychology\u00a057, 37\u201342 (1959)","journal-title":"Journal of Experimental Psychology"},{"key":"16_CR162","volume-title":"The Behavior of Organisms","author":"B.F. Skinner","year":"1938","unstructured":"Skinner, B.F.: The Behavior of Organisms. Appleton-Century-Crofts, New York (1938)"},{"key":"16_CR163","doi-asserted-by":"crossref","first-page":"115","DOI":"10.1146\/annurev.psych.54.101601.145124","volume":"54","author":"J.E.R. Staddon","year":"2003","unstructured":"Staddon, J.E.R., Cerutti, D.T.: Operant behavior. Annual Review of Psychology\u00a054, 115\u2013144 (2003)","journal-title":"Annual Review of Psychology"},{"key":"16_CR164","first-page":"9","volume":"3","author":"R.S. Sutton","year":"1988","unstructured":"Sutton, R.S.: Learning to predict by methods of temporal differences. Machine Learning\u00a03, 9\u201344 (1988)","journal-title":"Machine Learning"},{"key":"16_CR165","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1037\/0033-295X.88.2.135","volume":"88","author":"R.S. Sutton","year":"1981","unstructured":"Sutton, R.S., Barto, A.G.: Toward a modern theory of adaptive networks: Expectation and prediction. Psychological Review\u00a088, 135\u2013170 (1981)","journal-title":"Psychological Review"},{"key":"16_CR166","unstructured":"Sutton, R.S., Barto, A.G.: A temporal-difference model of classical conditioning. In: Proceedings of the Ninth Annual Conference of the Cognitive Science Society, pp. 355\u2013378 (1987)"},{"key":"16_CR167","volume-title":"Reinforcement Learning: An Introduction","author":"R.S. Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement Learning: An Introduction. MIT Press, Cambridge (1998)"},{"key":"16_CR168","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1152\/physrev.00014.2007","volume":"88","author":"J. Tanji","year":"2008","unstructured":"Tanji, J., Hoshi, E.: Role of the lateral prefrontal cortex in executive behavioral control. Physiological Reviews\u00a088, 37\u201357 (2008)","journal-title":"Physiological Reviews"},{"key":"16_CR169","doi-asserted-by":"crossref","DOI":"10.5962\/bhl.title.55072","volume-title":"Animal Intelligence: Experimental Studies","author":"E.L. Thorndike","year":"1911","unstructured":"Thorndike, E.L.: Animal Intelligence: Experimental Studies. Macmillan, New York (1911)"},{"key":"16_CR170","doi-asserted-by":"crossref","first-page":"2617","DOI":"10.1111\/j.1460-9568.2005.04411.x","volume":"22","author":"A.J. Tindell","year":"2005","unstructured":"Tindell, A.J., Berridge, K.C., Zhang, J., Pecina, S., Aldridge, J.W.: Ventral pallidal neurons code incentive motivation: Amplification by mesolimbic sensitization and amphetamine. European Journal of Neuroscience\u00a022, 2617\u20132634 (2005)","journal-title":"European Journal of Neuroscience"},{"key":"16_CR171","doi-asserted-by":"crossref","first-page":"402","DOI":"10.1523\/JNEUROSCI.23-32-10402.2003","volume":"23","author":"P.N. Tobler","year":"2003","unstructured":"Tobler, P.N., Dickinson, A., Schultz, W.: Coding of predicted reward omission by dopamine neurons in a conditioned inhibition paradigm. The Journal of Neuroscience\u00a023, 10,402\u201310,410 (2003)","journal-title":"The Journal of Neuroscience"},{"key":"16_CR172","doi-asserted-by":"crossref","first-page":"1642","DOI":"10.1126\/science.1105370","volume":"307","author":"P.N. Tobler","year":"2005","unstructured":"Tobler, P.N., Fiorillo, C.D., Schultz, W.: Adaptive coding of reward value by dopamine neurons. Science\u00a0307, 1642\u20131645 (2005)","journal-title":"Science"},{"key":"16_CR173","doi-asserted-by":"crossref","first-page":"189","DOI":"10.1037\/h0061626","volume":"55","author":"E.C. Tolman","year":"1948","unstructured":"Tolman, E.C.: Cognitive maps in rats and men. The Psychological Review\u00a055, 189\u2013208 (1948)","journal-title":"The Psychological Review"},{"key":"16_CR174","first-page":"44","volume":"56","author":"E.C. Tolman","year":"1949","unstructured":"Tolman, E.C.: There is more than one kind of learning. Psychological Review\u00a056, 44\u201355 (1949)","journal-title":"Psychological Review"},{"key":"16_CR175","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1038\/35083500","volume":"412","author":"P. Waelti","year":"2001","unstructured":"Waelti, P., Dickinson, A., Schultz, W.: Dopamine responses comply with basic assumptions of formal learning theory. Nature\u00a0412, 43\u201348 (2001)","journal-title":"Nature"},{"key":"16_CR176","doi-asserted-by":"crossref","first-page":"31","DOI":"10.1146\/annurev.neuro.30.051606.094334","volume":"30","author":"J.D. Wallis","year":"2007","unstructured":"Wallis, J.D.: Orbitofrontal cortex and its contribution to decision-making. Annual Review of Neuroscience\u00a030, 31\u201356 (2007)","journal-title":"Annual Review of Neuroscience"},{"key":"16_CR177","doi-asserted-by":"crossref","DOI":"10.1037\/10868-000","volume-title":"Behavior: An Introduction to Comparative Psychology","author":"J.B. Watson","year":"1914","unstructured":"Watson, J.B.: Behavior: An Introduction to Comparative Psychology. Holt, New York (1914)"},{"key":"16_CR178","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1016\/j.bbr.2008.10.030","volume":"199","author":"J.R. Wickens","year":"2009","unstructured":"Wickens, J.R.: Synaptic plasticity in the basal ganglia. Behavioural Brain Research\u00a0199, 119\u2013128 (2009)","journal-title":"Behavioural Brain Research"},{"key":"16_CR179","doi-asserted-by":"crossref","first-page":"192","DOI":"10.1196\/annals.1390.016","volume":"1104","author":"J.R. Wickens","year":"2007","unstructured":"Wickens, J.R., Budd, C.S., Hyland, B.I., Arbuthnott, G.W.: Striatal contributions to reward and decision making. Making sense of regional variations in a reiterated processing matrix. Annals of the New York Academy of Sciences\u00a01104, 192\u2013212 (2007)","journal-title":"Annals of the New York Academy of Sciences"},{"key":"16_CR180","first-page":"96","volume-title":"1960 WESCON Convention Record Part IV","author":"B. Widrow","year":"1960","unstructured":"Widrow, B., Hoff, M.E.: Adaptive switching circuits. In: 1960 WESCON Convention Record Part IV, pp. 96\u2013104. Institute of Radio Engineers, New York (1960)"},{"key":"16_CR181","doi-asserted-by":"crossref","first-page":"361","DOI":"10.1093\/acprof:oso\/9780195159561.003.0009","volume-title":"The Synaptic Organization of the Brain, ch. 9","author":"C.J. Wilson","year":"2004","unstructured":"Wilson, C.J.: Basal ganglia. In: Shepherd, G.M. (ed.) The Synaptic Organization of the Brain, ch. 9, 5th edn., pp. 361\u2013414. Oxford University Press, Oxford (2004)","edition":"5"},{"key":"16_CR182","doi-asserted-by":"crossref","first-page":"483","DOI":"10.1038\/nrn1406","volume":"5","author":"R.A. Wise","year":"2004","unstructured":"Wise, R.A.: Dopamine, learning and motivation. Nature Reviews Neuroscience\u00a05, 483\u2013494 (2004)","journal-title":"Nature Reviews Neuroscience"},{"key":"16_CR183","doi-asserted-by":"crossref","first-page":"511","DOI":"10.1016\/j.humov.2007.05.005","volume":"27","author":"D. Wolpert","year":"2007","unstructured":"Wolpert, D.: Probabilistic models in human sensorimotor control. Human Movement Science\u00a027, 511\u2013524 (2007)","journal-title":"Human Movement Science"},{"key":"16_CR184","doi-asserted-by":"crossref","first-page":"245","DOI":"10.1162\/0899766053011555","volume":"17","author":"F. W\u00f6rg\u00f6tter","year":"2005","unstructured":"W\u00f6rg\u00f6tter, F., Porr, B.: Temporal sequence learning, prediction, and control: A review of different models and their relation to biological mechanisms. Neural Computation\u00a017, 245\u2013319 (2005)","journal-title":"Neural Computation"},{"key":"16_CR185","doi-asserted-by":"crossref","first-page":"1253","DOI":"10.1016\/j.neuroimage.2007.04.001","volume":"36","author":"J. Wrase","year":"2007","unstructured":"Wrase, J., Kahnt, T., Schlagenhauf, F., Beck, A., Cohen, M.X., Knutson, B., Heinz, A.: Different neural systems adjust motor behavior in response to reward and punishment. NeuroImage\u00a036, 1253\u20131262 (2007)","journal-title":"NeuroImage"},{"key":"16_CR186","doi-asserted-by":"crossref","first-page":"8122","DOI":"10.1523\/JNEUROSCI.20-21-08122.2000","volume":"20","author":"C.L. Wyvell","year":"2000","unstructured":"Wyvell, C.L., Berridge, K.C.: Intra-accumbens amphetamine increases the conditioned incentive salience of sucrose reward: Enhancement of reward \u201cwanting\u201d without enhanced \u201cliking\u201d or response reinforcement. Journal of Neuroscience\u00a020, 8122\u20138130 (2000)","journal-title":"Journal of Neuroscience"},{"key":"16_CR187","doi-asserted-by":"crossref","first-page":"1437","DOI":"10.1111\/j.1460-9568.2008.06422.x","volume":"28","author":"H.H. Yin","year":"2008","unstructured":"Yin, H.H., Ostlund, S.B., Balleine, B.W.: Reward-guided learning beyond dopamine in the nucleus accumbens: the integrative functions of cortico-basal ganglia networks. European Journal of Neuroscience\u00a028, 1437\u20131448 (2008)","journal-title":"European Journal of Neuroscience"},{"key":"16_CR188","doi-asserted-by":"crossref","first-page":"681","DOI":"10.1016\/j.neuron.2005.04.026","volume":"46","author":"A. Yu","year":"2005","unstructured":"Yu, A., Dayan, P.: Uncertainty, neuromodulation and attention. Neuron\u00a046, 681\u2013692 (2005)","journal-title":"Neuron"}],"container-title":["Adaptation, Learning, and Optimization","Reinforcement Learning"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-27645-3_16","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,2,11]],"date-time":"2023-02-11T16:15:13Z","timestamp":1676132113000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-642-27645-3_16"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642276446","9783642276453"],"references-count":188,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-27645-3_16","relation":{},"ISSN":["1867-4534","1867-4542"],"issn-type":[{"value":"1867-4534","type":"print"},{"value":"1867-4542","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012]]}}}