{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T09:43:48Z","timestamp":1774950228514,"version":"3.50.1"},"reference-count":47,"publisher":"Public Library of Science (PLoS)","issue":"8","license":[{"start":{"date-parts":[[2014,8,14]],"date-time":"2014-08-14T00:00:00Z","timestamp":1407974400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1003779","type":"journal-article","created":{"date-parts":[[2014,8,14]],"date-time":"2014-08-14T14:12:59Z","timestamp":1408025579000},"page":"e1003779","update-policy":"https:\/\/doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":113,"title":["Optimal Behavioral Hierarchy"],"prefix":"10.1371","volume":"10","author":[{"given":"Alec","family":"Solway","sequence":"first","affiliation":[]},{"given":"Carlos","family":"Diuk","sequence":"additional","affiliation":[]},{"given":"Natalia","family":"C\u00f3rdova","sequence":"additional","affiliation":[]},{"given":"Debbie","family":"Yee","sequence":"additional","affiliation":[]},{"given":"Andrew G.","family":"Barto","sequence":"additional","affiliation":[]},{"given":"Yael","family":"Niv","sequence":"additional","affiliation":[]},{"given":"Matthew M.","family":"Botvinick","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2014,8,14]]},"reference":[{"key":"ref1","unstructured":"Hebb DO (1949) The organization of behavior: A neuropsychological theory. New York, NY: John Wiley &amp; Sons."},{"key":"ref2","doi-asserted-by":"crossref","unstructured":"Miller GA, Galanter E, Pribram KH (1960) Plans and the structure of behavior. New York, NY: Holt, Rinehart &amp; Winston.","DOI":"10.1037\/10039-000"},{"key":"ref3","unstructured":"Tinbergen N (1951) The study of instinct. Oxford, England: Clarendon Press."},{"key":"ref4","unstructured":"Tolman EC (1932) Purposive behavior in animals and men. New York, NY: Century."},{"key":"ref5","doi-asserted-by":"crossref","first-page":"201","DOI":"10.1016\/j.tics.2008.02.009","article-title":"Hierarchical models of behavior and prefrontal function","volume":"12","author":"MM Botvinick","year":"2008","journal-title":"Trends in Cognitive Sciences"},{"key":"ref6","doi-asserted-by":"crossref","unstructured":"Shallice T, Cooper RP (2011) The organization of mind. Oxford, England: Oxford University Press.","DOI":"10.1093\/acprof:osobl\/9780199579242.001.0001"},{"key":"ref7","doi-asserted-by":"crossref","first-page":"574","DOI":"10.1111\/j.1467-7687.2006.00535.x","article-title":"Imitation of hierarchical action structure by young children","volume":"9","author":"A Whiten","year":"2006","journal-title":"Developmental Science"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"4057","DOI":"10.1162\/jocn_a_00078","article-title":"Prediction error associated with the perceptual segmentation of naturalistic events","volume":"23","author":"JM Zacks","year":"2011","journal-title":"Journal of Cognitive Neuroscience"},{"key":"ref9","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1006\/nlme.1998.3843","article-title":"The basal ganglia and chunking of action repertoires","volume":"70","author":"AM Graybiel","year":"1998","journal-title":"Neurobiology of Learning and Memory"},{"key":"ref10","unstructured":"Barto AG, Konidaris GD, Vigorito CM (2013) Behavioral Hierarchy: Exploration and Representation, Springer. pp. 13\u201346."},{"key":"ref11","doi-asserted-by":"crossref","first-page":"262","DOI":"10.1016\/j.cognition.2008.08.011","article-title":"Hierarchically organized behavior and its neural foundations: A reinforcement learning perspective","volume":"113","author":"MM Botvinick","year":"2009","journal-title":"Cognition"},{"key":"ref12","doi-asserted-by":"crossref","first-page":"325","DOI":"10.1023\/A:1017944732463","article-title":"Structure in the space of value functions","volume":"49","author":"D Foster","year":"2002","journal-title":"Machine Learning"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"1036","DOI":"10.1037\/0033-295X.111.4.1036","article-title":"An integrated theory of the mind","volume":"111","author":"JR Anderson","year":"2004","journal-title":"Psychological Review"},{"key":"ref14","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1613\/jair.575","article-title":"Decision-theoretic planning: structural assumptions and computational leverage","volume":"11","author":"C Boutilier","year":"1999","journal-title":"Journal of Artificial Intelligence Research"},{"key":"ref15","doi-asserted-by":"crossref","unstructured":"Laird JE (2012) The Soar cognitive architecture. Cambridge, MA: The MIT Press.","DOI":"10.7551\/mitpress\/7688.001.0001"},{"key":"ref16","unstructured":"Newell A, Simon HA (1972) Human problem solving. Englewood Cliffs, NJ: Prentice-Hall."},{"key":"ref17","doi-asserted-by":"crossref","unstructured":"Sutton RS, Barto AG (1998) Reinforcement learning: An introduction. The MIT Press.","DOI":"10.1016\/S1474-6670(17)38315-5"},{"key":"ref18","doi-asserted-by":"crossref","first-page":"181","DOI":"10.1016\/S0004-3702(99)00052-1","article-title":"Between MDPs and semi-MDPs: A framework for temporal abstraction in reinforcement learning","volume":"112","author":"RS Sutton","year":"1999","journal-title":"Artificial Intelligence"},{"key":"ref19","doi-asserted-by":"crossref","unstructured":"Sutton RS (1990) Integrated architectures for learning, planning, and reacting based on approximating dynamic programming. In: Proceedings of the 7th International Conference on Machine Learning. pp. 216\u2013224.","DOI":"10.1016\/B978-1-55860-141-3.50030-4"},{"key":"ref20","volume":"volume 21","unstructured":"Simsek \u00d6, Barto AG (2008) Skill characterization based on betweenness. In: Koller D, Schuurmans D, Bengio Y, Bottou L, editors, Advances in Neural Information Processing Systems. <volume>volume 21<\/volume> , pp. 1497\u20131504."},{"key":"ref21","doi-asserted-by":"crossref","unstructured":"van Dijk SG, Polani D (2011) Grounding subgoals in information transitions. In: IEEE Symposium on Adaptive Dynamic Programming And Reinforcement Learning (ADPRL). IEEE, pp. 105\u2013111.","DOI":"10.1109\/ADPRL.2011.5967384"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"132","DOI":"10.1109\/TAMD.2010.2050205","article-title":"Intrinsically motivated hierarchical skill learning in structured environments","volume":"2","author":"CM Vigorito","year":"2010","journal-title":"IEEE Transactions on Autonomous Mental Development"},{"key":"ref23","unstructured":"MacKay DJC (2003) Information theory, inference and learning algorithms. Cambridge University Press."},{"key":"ref24","unstructured":"Hauskrecht M, Meuleau N, Kaelbling LP, Dean T, Boutilier C (1998) Hierarchical solution of Markov decision processes using macro-actions. In: Proceedings of the Fourteenth Conference on Uncertainty in Artificial Intelligence. San Francisco, CA: Morgan Kaufmann, pp. 220\u2013229."},{"key":"ref25","doi-asserted-by":"crossref","first-page":"1118","DOI":"10.1073\/pnas.0706851105","article-title":"Maps of random walks on complex networks reveal community structure","volume":"105","author":"M Rosvall","year":"2008","journal-title":"Proceedings of the National Academy of Sciences"},{"key":"ref26","unstructured":"Cover TM, Thomas JA (2012) Elements of information theory. Hoboken, NJ: John Wiley &amp; Sons."},{"key":"ref27","doi-asserted-by":"crossref","first-page":"630","DOI":"10.1038\/35036586","article-title":"Minimization of boolean complexity in human concept learning","volume":"407","author":"J Feldman","year":"2000","journal-title":"Nature"},{"key":"ref28","doi-asserted-by":"crossref","first-page":"685","DOI":"10.1037\/a0029347","article-title":"Exploring the conceptual universe","volume":"119","author":"C Kemp","year":"2012","journal-title":"Psychological Review"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"234","DOI":"10.1162\/neco.1992.4.2.234","article-title":"Learning complex, extended sequences using the principle of history compression","volume":"4","author":"J Schmidhuber","year":"1992","journal-title":"Neural Computation"},{"key":"ref30","volume":"volume 7","unstructured":"Thrun S, Schwartz A (1995) Finding structure in reinforcement learning. In: Tesauro G, Touretzky DS, Leen TK, editors, Advances in Neural Information Processing Systems, <volume>volume 7<\/volume> . pp. 385\u2013392."},{"key":"ref31","doi-asserted-by":"crossref","unstructured":"van Dijk SG, Polani D, Nehaniv CL (2011) Hierarchical behaviours: getting the most bang for your bit. In: Kampis G, Karsai I, Szathm\u00e1ry E, editors, Advances in Artificial Life: Darwin Meets von Neumann, Springer. pp. 342\u2013349.","DOI":"10.1007\/978-3-642-21314-4_43"},{"key":"ref32","volume":"volume 5506","unstructured":"Kazemitabar SJ, Beigy H (2009) Automatic discovery of subgoals in reinforcement learning using strongly connected components. In: K\u00f6ppen M, Kasabov N, Coghill G, editors, Advances in Neuro-Information Processing. Springer, <volume>volume 5506<\/volume> , pp.829\u2013834."},{"key":"ref33","doi-asserted-by":"crossref","first-page":"113","DOI":"10.3233\/IDA-2011-0513","article-title":"Automatic skill acquisition in reinforcement learning using graph centrality measures","volume":"16","author":"P Moradi","year":"2012","journal-title":"Intelligent Data Analysis"},{"key":"ref34","doi-asserted-by":"crossref","first-page":"875","DOI":"10.1037\/a0017144","article-title":"Bayes and the simplicity principle in perception","volume":"116","author":"J Feldman","year":"2009","journal-title":"Psychological Review"},{"key":"ref35","doi-asserted-by":"crossref","first-page":"2745","DOI":"10.1073\/pnas.0708424105","article-title":"Bayesian learning of visual chunks by human observers","volume":"105","author":"G Orb\u00e1n","year":"2008","journal-title":"Proceedings of the National Academy of Sciences"},{"key":"ref36","doi-asserted-by":"crossref","first-page":"487","DOI":"10.1037\/a0016797","article-title":"Compression in visual working memory: Using statistical regularities to form more efficient memory representations","volume":"138","author":"TF Brady","year":"2009","journal-title":"Journal of Experimental Psychology: General"},{"key":"ref37","doi-asserted-by":"crossref","first-page":"346","DOI":"10.1016\/j.cognition.2011.11.003","article-title":"What&apos;s magic about magic numbers? Chunking and data compression in short-term memory","volume":"122","author":"F Mathy","year":"2012","journal-title":"Cognition"},{"key":"ref38","unstructured":"Finley S, Newport EL (2010) Morpheme segmentation from distributional information. In: Boston University Conference on Language Development (BUCLD) Online Proceedings Supplement."},{"key":"ref39","doi-asserted-by":"crossref","first-page":"19","DOI":"10.1016\/S1364-6613(02)00005-0","article-title":"Simplicity: A unifying principle in cognitive science?","volume":"7","author":"N Chater","year":"2003","journal-title":"Trends in Cognitive Sciences"},{"key":"ref40","doi-asserted-by":"crossref","first-page":"1352","DOI":"10.1111\/j.1551-6709.2011.01188.x","article-title":"MDLChunker: A MDL-based cognitive model of inductive learning","volume":"35","author":"V Robinet","year":"2011","journal-title":"Cognitive Science"},{"key":"ref41","doi-asserted-by":"crossref","first-page":"486","DOI":"10.1038\/nn.3331","article-title":"Neural representations of events arise from temporal community structure","volume":"16","author":"AC Schapiro","year":"2013","journal-title":"Nature Neuroscience"},{"key":"ref42","doi-asserted-by":"crossref","first-page":"331","DOI":"10.1207\/s15427633scc0304_5","article-title":"\u2018Fine-to-coarse\u2019 route planning and navigation in regionalized environments","volume":"3","author":"JM Wiener","year":"2003","journal-title":"Spatial Cognition & Computation"},{"key":"ref43","first-page":"1331","article-title":"Tower of Hanoi: Evidence for the cost of goal retrieval","volume":"27","author":"JR Anderson","year":"2001","journal-title":"Journal of Experimental Psychology: Learning, Memory, and Cognition"},{"key":"ref44","doi-asserted-by":"crossref","first-page":"341","DOI":"10.1023\/A:1025696116075","article-title":"Recent advances in hierarchical reinforcement learning","volume":"13","author":"AG Barto","year":"2003","journal-title":"Discrete Event Dynamic Systems"},{"key":"ref45","doi-asserted-by":"crossref","first-page":"1350016","DOI":"10.1142\/S0219525913500161","article-title":"Informational constraints-driven organization in goal-directed behavior","volume":"16","author":"SG van Dijk","year":"2013","journal-title":"Advances in Complex Systems"},{"key":"ref46","doi-asserted-by":"crossref","first-page":"172","DOI":"10.1109\/TKDE.2007.190689","article-title":"On modularity clustering","volume":"20","author":"U Brandes","year":"2008","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"key":"ref47","first-page":"1","article-title":"GA: a package for genetic algorithms in R. Journal of Statistical Software","volume":"53","author":"L Scrucca","year":"2013"}],"container-title":["PLoS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/dx.plos.org\/10.1371\/journal.pcbi.1003779","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,5,8]],"date-time":"2020-05-08T18:14:08Z","timestamp":1588961648000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1003779"}},"subtitle":[],"editor":[{"given":"Olaf","family":"Sporns","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2014,8,14]]},"references-count":47,"journal-issue":{"issue":"8","published-online":{"date-parts":[[2014,8,14]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1003779","relation":{},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,8,14]]}}}