{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,2]],"date-time":"2026-01-02T07:44:26Z","timestamp":1767339866160},"reference-count":59,"publisher":"Public Library of Science (PLoS)","issue":"9","license":[{"start":{"date-parts":[[2010,9,9]],"date-time":"2010-09-09T00:00:00Z","timestamp":1283990400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1000903","type":"journal-article","created":{"date-parts":[[2010,9,9]],"date-time":"2010-09-09T19:16:22Z","timestamp":1284059782000},"page":"e1000903","update-policy":"http:\/\/dx.doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":36,"title":["Pavlovian-Instrumental Interaction in \u2018Observing Behavior\u2019"],"prefix":"10.1371","volume":"6","author":[{"given":"Ulrik R.","family":"Beierholm","sequence":"first","affiliation":[]},{"given":"Peter","family":"Dayan","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2010,9,9]]},"reference":[{"key":"ref1","doi-asserted-by":"crossref","first-page":"681","DOI":"10.1037\/h0040090","article-title":"The misbehavior of organisms.","volume":"16","author":"K Breland","year":"1961","journal-title":"Am Psychol"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"511","DOI":"10.1901\/jeab.1969.12-511","article-title":"Auto-maintenance in the pigeon: sustained pecking despite contingent non-reinforcement.","volume":"12","author":"DR Williams","year":"1969","journal-title":"J Exp Anal Behav"},{"key":"ref3","first-page":"302","article-title":"Relation between classical conditioning and instrumental learning.","author":"F Sheffield","year":"1965"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"1153","DOI":"10.1016\/j.neunet.2006.03.002","article-title":"The misbehavior of value and the discipline of the will.","volume":"19","author":"P Dayan","year":"2006","journal-title":"Neural Netw"},{"key":"ref5","doi-asserted-by":"crossref","first-page":"717","DOI":"10.1016\/j.physbeh.2005.08.061","article-title":"Neural bases of food-seeking: Affect arousal and reward in corticostriatolimbic circuits.","volume":"86","author":"B Balleine","year":"2005","journal-title":"Physiol Behav"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"1704","DOI":"10.1038\/nn1560","article-title":"Uncertainty-based competition between prefrontal and dorsolateral striatal systems for behavioral control.","volume":"8","author":"N Daw","year":"2005","journal-title":"Nat Neurosci"},{"key":"ref7","first-page":"51","article-title":"The role of value systems in decision-making.","author":"P Dayan","year":"2008"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"431","DOI":"10.1037\/h0053932","article-title":"The role of observing responses in discrimination learning. Part I.","volume":"59","author":"LB Wyckoff","year":"1952","journal-title":"Psychol Rev"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"693","DOI":"10.1017\/S0140525X00017969","article-title":"Observing and conditioned reinforcement.","volume":"6","author":"J Dinsmoor","year":"1983","journal-title":"Behav Brain Sci"},{"key":"ref10","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1016\/j.neuron.2009.06.009","article-title":"Midbrain dopamine neurons signal preference for advance information about upcoming rewards.","volume":"63","author":"ES Bromberg-Martin","year":"2009","journal-title":"Neuron"},{"key":"ref11","doi-asserted-by":"crossref","first-page":"131","DOI":"10.1037\/h0046740","article-title":"The acquisition of observing responses in the absence of differential external reinforcement.","volume":"49","author":"W Prokasy","year":"1956","journal-title":"J Comp Physiol Psychol"},{"key":"ref12","doi-asserted-by":"crossref","first-page":"201","DOI":"10.1006\/lmot.1999.1030","article-title":"Observing Behavior in Pigeons: The Effect of Reinforcement Probability and Response Cost Using a Symmetrical Choice Procedure.","volume":"220","author":"KL Roper","year":"1999","journal-title":"Learn Motiv"},{"key":"ref13","first-page":"81","article-title":"Preference for unpredictability is reversed when unpredictable nonreward is aversive.","author":"H Daly","year":"1992"},{"key":"ref14","doi-asserted-by":"crossref","first-page":"185","DOI":"10.2307\/1913656","article-title":"Temporal resolution of uncertainty and dynamic choice theory.","volume":"46","author":"D Kreps","year":"1978","journal-title":"Econometrica"},{"key":"ref15","doi-asserted-by":"crossref","first-page":"55","DOI":"10.1162\/003355301556347","article-title":"Psychological Expected Utility Theory and Anticipatory Feelings?","volume":"116","author":"A Caplin","year":"2001","journal-title":"Q J Econ"},{"key":"ref16","first-page":"666","article-title":"Anticipation and the valuation of delayed consumption.","volume":"97","author":"G Loewenstein","year":"1987","journal-title":"Econ J (London)"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"179","DOI":"10.1002\/(SICI)1099-0771(200004\/06)13:2<179::AID-BDM332>3.0.CO;2-J","article-title":"Living with uncertainty: attractiveness and resolution timing.","volume":"13","author":"D Lovallo","year":"2000","journal-title":"J Behav Decis Mak"},{"key":"ref18","article-title":"The mathematical theory of information, volume 97","author":"C Shannon","year":"1949"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"1936","DOI":"10.1523\/JNEUROSCI.16-05-01936.1996","article-title":"A framework for mesencephalic dopamine systems based on predictive hebbian learning.","volume":"16","author":"PR Montague","year":"1996","journal-title":"J Neurosci"},{"key":"ref20","doi-asserted-by":"crossref","first-page":"1593","DOI":"10.1126\/science.275.5306.1593","article-title":"A neural substrate of prediction and reward.","volume":"275","author":"W Schultz","year":"1997","journal-title":"Science"},{"key":"ref21","doi-asserted-by":"crossref","DOI":"10.1109\/TNN.1998.712192","article-title":"Reinforcement Learning: An Introduction","author":"RS Sutton","year":"1998"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1007\/BF00115009","article-title":"Learning to predict by the methods of temporal differences.","volume":"3","author":"RS Sutton","year":"1988","journal-title":"Mach Learn"},{"key":"ref23","first-page":"497","article-title":"Time-derivative models of Pavlovian reinforcement","author":"R Sutton","year":"1990"},{"key":"ref24","doi-asserted-by":"crossref","first-page":"92","DOI":"10.1016\/0023-9690(81)90026-6","article-title":"Blocking acquisition of the rabbit&apos;s nictitating membrane response to serial conditioned stimuli.","volume":"12","author":"E Kehoe","year":"1981","journal-title":"Learn Motiv"},{"key":"ref25","doi-asserted-by":"crossref","first-page":"871","DOI":"10.1016\/S0306-4522(98)00697-6","article-title":"A neural network model with dopamine-like reinforcement signal that learns a spatial delayed response task.","volume":"91","author":"RE Suri","year":"1999","journal-title":"Neuroscience"},{"key":"ref26","doi-asserted-by":"crossref","first-page":"98","DOI":"10.1016\/0893-6080(88)90137-2","article-title":"Neural dynamics of adaptive timing and temporal discrimination during associative learning.","volume":"1","author":"S Grossberg","year":"1988","journal-title":"Neural Netw"},{"key":"ref27","doi-asserted-by":"crossref","first-page":"3034","DOI":"10.1162\/neco.2008.11-07-654","article-title":"Stimulus representation and the timing of reward-prediction errors in models of the dopamine system.","volume":"20","author":"EA Ludvig","year":"2008","journal-title":"Neural Comput"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"307","DOI":"10.1146\/annurev.neuro.27.070203.144247","article-title":"The neural basis of temporal processing.","volume":"27","author":"MD Mauk","year":"2004","journal-title":"Annu Rev Neurosci"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"283","DOI":"10.1162\/089976606775093909","article-title":"Making working memory work: A computational model of learning in the prefrontal cortex and basal ganglia.","volume":"18","author":"R O'Reilly","year":"2006","journal-title":"Neural Comput"},{"key":"ref30","doi-asserted-by":"crossref","first-page":"137","DOI":"10.3758\/CABN.1.2.137","article-title":"Interactions between frontal cortex and basal ganglia in working memory: a computational model.","volume":"1","author":"M Frank","year":"2001","journal-title":"Cogn Affect Behav Neurosci"},{"key":"ref31","doi-asserted-by":"crossref","first-page":"572","DOI":"10.1038\/376572a0","article-title":"Modulation of memory fields by dopamine d1 receptors in prefrontal cortex.","volume":"376","author":"GV Williams","year":"1995","journal-title":"Nature"},{"key":"ref32","doi-asserted-by":"crossref","first-page":"10402","DOI":"10.1523\/JNEUROSCI.23-32-10402.2003","article-title":"Coding of predicted reward omission by dopamine neurons in a conditioned inhibition paradigm.","volume":"23","author":"PN Tobler","year":"2003","journal-title":"The Journal of neuroscience : the official journal of the Society for Neuroscience"},{"key":"ref33","doi-asserted-by":"crossref","first-page":"1898","DOI":"10.1126\/science.1077349","article-title":"Discrete coding of reward probability and uncertainty by dopamine neurons.","volume":"299","author":"CD Fiorillo","year":"2003","journal-title":"Science"},{"key":"ref34","doi-asserted-by":"crossref","first-page":"129","DOI":"10.1016\/j.neuron.2005.05.020","article-title":"Midbrain dopamine neurons encode a quantitative reward prediction error signal.","volume":"47","author":"HM Bayer","year":"2005","journal-title":"Neuron"},{"key":"ref35","doi-asserted-by":"crossref","first-page":"1107","DOI":"10.1037\/0033-2909.86.5.1107","article-title":"Choosing between predictable and unpredictable shock conditions: Data and theory.","volume":"86","author":"P Badia","year":"1979","journal-title":"Psychol Bull"},{"key":"ref36","doi-asserted-by":"crossref","first-page":"435","DOI":"10.1037\/h0022578","article-title":"Conditions affecting acquisition of observing responses in the absence of differential reward.","volume":"60","author":"KM Mitchell","year":"1965","journal-title":"J Comp Physiol Psychol"},{"key":"ref37","doi-asserted-by":"crossref","first-page":"114","DOI":"10.2466\/pr0.1965.16.1.114","article-title":"Acquisition of observing responses (RO) with water reward.","volume":"16","author":"DJ Levis","year":"1965","journal-title":"Psychol Rep"},{"key":"ref38","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1037\/0097-7403.15.1.3","article-title":"Preference for unpredictable food rewards occurs with high proportion of reinforced trials or alcohol if rewards are not delayed.","volume":"15","author":"HB Daly","year":"1989","journal-title":"J Exp Psychol Anim Behav Process"},{"key":"ref39","doi-asserted-by":"crossref","first-page":"1642","DOI":"10.1126\/science.1105370","article-title":"Adaptive coding of reward value by dopamine neurons.","volume":"307","author":"PN Tobler","year":"2005","journal-title":"Science"},{"key":"ref40","doi-asserted-by":"crossref","first-page":"2613","DOI":"10.1523\/JNEUROSCI.18-07-02613.1998","article-title":"Neuronal signals in the monkey ventral striatum related to progress through a predictable series of trials.","volume":"18","author":"M Shidara","year":"1998","journal-title":"J Neurosci"},{"key":"ref41","doi-asserted-by":"crossref","first-page":"276","DOI":"10.1037\/h0076778","article-title":"theory of attention: Variations in the associability of stimuli with reinforcement.","volume":"2","author":"NJA Mackintosh","year":"1975","journal-title":"Psychol Rev"},{"key":"ref42","first-page":"441","article-title":"A Mathematical Model of Reward and Aversive Nonreward: Its Application in Over 30 Appetitive Learning Situations.","volume":"11","author":"HB Daly","year":"1982","journal-title":"New York"},{"key":"ref43","article-title":"Variations in the Effectiveness of Reinforcement and Nonreinforcement","author":"R Rescorla","year":"1972"},{"key":"ref44","first-page":"96","article-title":"Adaptive switching circuits.","author":"B Widrow","year":"1960","journal-title":"IRE WESCON Convention Record"},{"key":"ref45","first-page":"355","article-title":"A temporal-difference model of classical conditioning.","author":"R Sutton","year":"1987","journal-title":"Proc Annu Conf Cogn Sci Soc"},{"key":"ref46","doi-asserted-by":"crossref","first-page":"329","DOI":"10.1037\/h0041135","article-title":"Uncertainty and conflict - a point of contact between information-theory and behavior-theory concepts.","volume":"64","author":"D Berlyne","year":"1957","journal-title":"Psychol Rev"},{"key":"ref47","doi-asserted-by":"crossref","first-page":"32","DOI":"10.1080\/09548980902759086","article-title":"Prospective and retrospective temporal difference learning.","volume":"20","author":"P Dayan","year":"2009","journal-title":"Network"},{"key":"ref48","doi-asserted-by":"crossref","first-page":"6","DOI":"10.1186\/1744-9081-1-6","article-title":"Dopamine, uncertainty and TD learning.","volume":"1","author":"Y Niv","year":"2005","journal-title":"Behavioral Brain Function"},{"key":"ref49","doi-asserted-by":"crossref","first-page":"375","DOI":"10.1016\/j.tics.2006.06.010","article-title":"A normative perspective on motivation.","volume":"10","author":"Y Niv","year":"2006","journal-title":"Trends Cogn Sci"},{"key":"ref50","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1016\/S0166-4328(02)00282-6","article-title":"Motivational views of reinforcement: implications for understanding the behavioral functions of nucleus accumbens dopamine.","volume":"137","author":"JD Salamone","year":"2002","journal-title":"Behav Brain Res"},{"key":"ref51","article-title":"A common mechanism for adaptive scaling of reward and novelty.","author":"N Bunzeck","year":"2010","journal-title":"Human Brain Mapping"},{"key":"ref52","doi-asserted-by":"crossref","first-page":"219","DOI":"10.1901\/jeab.1990.53-219","article-title":"Suboptimal choice in a percentage-reinforcement procedure: effects of signal condition and terminal-link length.","volume":"53","author":"ML Spetch","year":"1990","journal-title":"J Exp Anal Behav"},{"key":"ref53","doi-asserted-by":"crossref","first-page":"289","DOI":"10.3758\/LB.37.4.289","article-title":"Preference for 50% reinforcement over 75% reinforcement by pigeons.","volume":"37","author":"C Gipson","year":"2009","journal-title":"Learn Behav"},{"key":"ref54","doi-asserted-by":"crossref","first-page":"99","DOI":"10.1002\/cne.20723","article-title":"Adaptive gain and the role of the locus coeruleus-norepinephrine system in optimal performance.","volume":"493","author":"G Aston-Jones","year":"2005","journal-title":"J Comp Neurol"},{"key":"ref55","doi-asserted-by":"crossref","first-page":"20","DOI":"10.1006\/lmot.1997.0951","article-title":"The role of S- in human observing behavior: bad news is sometimes better than no news.","volume":"28","author":"DA Lieberman","year":"1997","journal-title":"Learn Motiv"},{"key":"ref56","doi-asserted-by":"crossref","first-page":"193","DOI":"10.1901\/jeab.1983.40-193","article-title":"Human observing:maintaned by stimuli correlated with reinforcement but not extinction.","volume":"40","author":"E Fantino","year":"1983","journal-title":"Journal of the experimental analysis of behavior"},{"key":"ref57","doi-asserted-by":"crossref","first-page":"68","DOI":"10.1037\/h0046882","article-title":"Toward a quantitative theory of secondary reinforcement.","volume":"66","author":"L Wyckoff","year":"1959","journal-title":"Psychol Rev"},{"key":"ref58","doi-asserted-by":"crossref","first-page":"239","DOI":"10.1901\/jeab.1980.34-239","article-title":"Reinforcement of human observing behavior by a stimulue correlated with extinction or increased effort.","volume":"34","author":"M Perone","year":"1980","journal-title":"J Exp Anal Behav"},{"key":"ref59","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1037\/h0043178","article-title":"On the possible psychophysical laws.","volume":"66","author":"RD Luce","year":"1959","journal-title":"Psychol Rev"}],"container-title":["PLoS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/dx.plos.org\/10.1371\/journal.pcbi.1000903","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,4]],"date-time":"2019-06-04T09:52:56Z","timestamp":1559641976000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1000903"}},"subtitle":[],"editor":[{"given":"Tim","family":"Behrens","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2010,9,9]]},"references-count":59,"journal-issue":{"issue":"9","published-online":{"date-parts":[[2010,9,9]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1000903","relation":{},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2010,9,9]]}}}