{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,28]],"date-time":"2026-02-28T18:33:34Z","timestamp":1772303614605,"version":"3.50.1"},"reference-count":71,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2018,10,22]],"date-time":"2018-10-22T00:00:00Z","timestamp":1540166400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Biol Cybern"],"published-print":{"date-parts":[[2018,12]]},"DOI":"10.1007\/s00422-018-0785-7","type":"journal-article","created":{"date-parts":[[2018,10,22]],"date-time":"2018-10-22T09:44:59Z","timestamp":1540201499000},"page":"547-573","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":72,"title":["Deep active inference"],"prefix":"10.1007","volume":"112","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0507-7598","authenticated-orcid":false,"given":"Kai","family":"Ueltzh\u00f6ffer","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2018,10,22]]},"reference":[{"key":"785_CR1","doi-asserted-by":"publisher","first-page":"47","DOI":"10.3389\/fpsyt.2013.00047","volume":"4","author":"RA Adams","year":"2013","unstructured":"Adams RA, Stephan KE, Brown H, Frith CD, Friston KJ (2013) The computational anatomy of psychosis. Front Psychiatry 4:47","journal-title":"Front Psychiatry"},{"issue":"3","key":"785_CR2","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1016\/j.cub.2004.01.029","volume":"14","author":"D Alais","year":"2004","unstructured":"Alais D, Burr D (2004) The ventriloquist effect results from near-optimal bimodal integration. Curr Biol 14(3):257\u2013262","journal-title":"Curr Biol"},{"key":"785_CR3","unstructured":"Baez JC, Pollard BS (2015) Relative entropy in biological systems. \n                    arXiv:1512.02742"},{"key":"785_CR4","doi-asserted-by":"crossref","unstructured":"Baltieri M, Buckley CL (2017) An active inference implementation of phototaxis. \n                    arXiv:1707.01806","DOI":"10.7551\/ecal_a_011"},{"key":"785_CR5","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1126\/science.1195870","volume":"331","author":"P Berkes","year":"2011","unstructured":"Berkes P, Orb\u00e1n G, Lengyel M, Fiser J (2011) Spontaneous cortical activity reveals hallmarks of an optimal internal model of the environment. Science 331:83\u201387","journal-title":"Science"},{"key":"785_CR6","unstructured":"Brockman G, Cheung V, Pettersson L, Schneider J, Schulman J, Tang J, Zaremba W (2016) Openai gym. \n                    arXiv:1606.01540"},{"key":"785_CR7","first-page":"43","volume":"3","author":"H Brown","year":"2012","unstructured":"Brown H, Friston KJ (2012) Free-energy and illusions: the cornsweet effect. Front Psychol 3:43","journal-title":"Front Psychol"},{"key":"785_CR8","doi-asserted-by":"crossref","unstructured":"Campbell JO (2016) Universal Darwinism as a process of Bayesian inference. \n                    arXiv:1606.07937","DOI":"10.3389\/fnsys.2016.00049"},{"key":"785_CR9","doi-asserted-by":"crossref","unstructured":"Caticha A (2004) Relative entropy and inductive inference. In: AIP conference proceedings, 707","DOI":"10.1063\/1.1751358"},{"key":"785_CR10","unstructured":"Chung J, Kastner K, Dinh L, Goel K, Courville A, Bengio Y (2015) A recurrent latent variable model for sequential data. \n                    arXiv:1506.02216"},{"issue":"2","key":"785_CR11","doi-asserted-by":"publisher","first-page":"89","DOI":"10.1080\/00207727008920220","volume":"1","author":"R Conant","year":"1970","unstructured":"Conant R, Ashby W (1970) Every good regulator of a system must be a model of that system. Int J Syst Sci 1(2):89\u201397","journal-title":"Int J Syst Sci"},{"key":"785_CR12","doi-asserted-by":"publisher","first-page":"587","DOI":"10.1038\/nrn2457","volume":"9","author":"TB Crapse","year":"2008","unstructured":"Crapse TB, Sommer MA (2008) Corollary discharge across the animal kingdom. Nat Rev Neurosci 9:587\u2013600","journal-title":"Nat Rev Neurosci"},{"key":"785_CR13","unstructured":"Dosovitskiy A, Koltun V (2017) Learning to act by predicting the future. ICLR"},{"key":"785_CR14","first-page":"625","volume":"11","author":"D Erhan","year":"2010","unstructured":"Erhan D, Bengio Y, Courville A, Manzagol PA, Vincent P (2010) Why does unsupervised pre-training help deep learning? JMLR 11:625\u2013660","journal-title":"JMLR"},{"key":"785_CR15","doi-asserted-by":"publisher","first-page":"429","DOI":"10.1038\/415429a","volume":"415","author":"M Ernst","year":"2002","unstructured":"Ernst M, Banks M (2002) Humans integrate visual and haptic information in a statistically optimal fashion. Nature 415:429\u2013433","journal-title":"Nature"},{"key":"785_CR16","doi-asserted-by":"publisher","first-page":"815","DOI":"10.1098\/rstb.2005.1622","volume":"360","author":"KJ Friston","year":"2005","unstructured":"Friston KJ (2005) A theory of cortical responses. Phil Trans R Soc B 360:815\u2013836","journal-title":"Phil Trans R Soc B"},{"issue":"11","key":"785_CR17","doi-asserted-by":"publisher","first-page":"e1000211","DOI":"10.1371\/journal.pcbi.1000211","volume":"4","author":"KJ Friston","year":"2008","unstructured":"Friston KJ (2008) Hierarchical models in the brain. PLoS Comput Biol 4(11):e1000211","journal-title":"PLoS Comput Biol"},{"issue":"2","key":"785_CR18","doi-asserted-by":"publisher","first-page":"127","DOI":"10.1038\/nrn2787","volume":"11","author":"KJ Friston","year":"2010","unstructured":"Friston KJ (2010) The free-energy principle: a unified brain theory? Nat Rev Neurosci 11(2):127\u2013138","journal-title":"Nat Rev Neurosci"},{"key":"785_CR19","doi-asserted-by":"publisher","first-page":"2100","DOI":"10.3390\/e14112100","volume":"14","author":"KJ Friston","year":"2012","unstructured":"Friston KJ (2012) A free energy principle for biological systems. Entropy 14:2100\u20132121","journal-title":"Entropy"},{"key":"785_CR20","doi-asserted-by":"publisher","first-page":"20130475","DOI":"10.1098\/rsif.2013.0475","volume":"10","author":"KJ Friston","year":"2013","unstructured":"Friston KJ (2013) Life as we know it. J R Soc Interface 10:20130475","journal-title":"J R Soc Interface"},{"key":"785_CR21","doi-asserted-by":"publisher","first-page":"1211","DOI":"10.1098\/rstb.2008.0300","volume":"364","author":"KJ Friston","year":"2009","unstructured":"Friston KJ, Kiebel SJ (2009) Predictive coding under the free-energy principle. Philos Trans R Soc B 364:1211\u20131221","journal-title":"Philos Trans R Soc B"},{"key":"785_CR22","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1016\/j.jphysparis.2006.10.001","volume":"100","author":"KJ Friston","year":"2006","unstructured":"Friston KJ, Kilner J, Harrison L (2006) A free energy principle for the brain. J Physiol Paris 100:70\u201387","journal-title":"J Physiol Paris"},{"issue":"3","key":"785_CR23","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1007\/s00422-010-0364-z","volume":"192","author":"KJ Friston","year":"2010","unstructured":"Friston KJ, Daunizeau J, Kilner J, Kiebel SJ (2010) Action and behavior: a free-energy formulation. Biol Cybern 192(3):227\u2013260","journal-title":"Biol Cybern"},{"key":"785_CR24","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/s00422-011-0424-z","volume":"104","author":"KJ Friston","year":"2011","unstructured":"Friston KJ, Mattout J, Kilner J (2011) Action understanding and active inference. Biol Cybern 104:137\u2013160","journal-title":"Biol Cybern"},{"issue":"4","key":"785_CR25","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1080\/17588928.2015.1020053","volume":"6","author":"KJ Friston","year":"2015","unstructured":"Friston KJ, Rigoli F, Ognibene D, Mathys C, Fitzgerald T, Pezzulo G (2015) Active inference and epistemic value. Cogn Neurosci 6(4):187\u2013214","journal-title":"Cogn Neurosci"},{"key":"785_CR26","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1162\/NECO_a_00912","volume":"29","author":"KJ Friston","year":"2017","unstructured":"Friston KJ, Frith CD, Pezzulo G, Hobson JA, Ondobaka S (2017a) Active inference, curiosity and insight. Neural Comput 29:1\u201351","journal-title":"Neural Comput"},{"key":"785_CR27","doi-asserted-by":"publisher","first-page":"388","DOI":"10.1016\/j.neubiorev.2017.04.009","volume":"77","author":"KJ Friston","year":"2017","unstructured":"Friston KJ, Rosch R, Parr T, Price C, Bowman H (2017b) Deep temporal models and active inference. Neurosci Biobehav Rev 77:388\u2013402","journal-title":"Neurosci Biobehav Rev"},{"key":"785_CR28","unstructured":"Goodfellow I, Pouget-Abadie J, Mirza M, Xu B, Warde-Farley D, Ozair S, Courville A, Bengio Y (2014) Generative adversarial networks. \n                    arXiv:1406.2661"},{"key":"785_CR29","unstructured":"Goodfellow I, Bengio Y, Courville A (2016) Deep Learning. MIT Press, Cambridge. \n                    http:\/\/www.deeplearningbook.org"},{"key":"785_CR30","doi-asserted-by":"publisher","first-page":"471","DOI":"10.1038\/nature20101","volume":"538","author":"A Graves","year":"2016","unstructured":"Graves A, Wayne G, Reynolds M, Harley T, Danihelka I, Grabska-Barwinska A, G\u00f3mez Caolmenarejo S, Grefenstette E, Ramalho T, Agapiou J, Puigdomen\u00e8ch Badia A, Hermann KM, Zwols Y, Ostrovski G, Cain A, King H, Summerfield C, Blunsum P, Kavukcuoglu K, Hassabis D (2016) Hybrid computing using a neural network with dynamic external memory. Nature 538:471\u2013476","journal-title":"Nature"},{"key":"785_CR31","unstructured":"Ha D, Schmidhuber J (2018) World models. \n                    arXiv:1803.10122"},{"issue":"3","key":"785_CR32","doi-asserted-by":"publisher","first-page":"649","DOI":"10.1016\/j.neuron.2016.03.020","volume":"90","author":"R Haefner","year":"2016","unstructured":"Haefner R, Berkes P, Fiser J (2016) Perceptual decision-making as probabilistic inference by neural sampling. Neuron 90(3):649\u2013660","journal-title":"Neuron"},{"key":"785_CR33","unstructured":"Hansen N (2016) The CMA evolution strategy: a tutorial. \n                    arXiv:1604.00772"},{"key":"785_CR34","unstructured":"Harper M (2009) The replicator equation as an inference dynamic. \n                    arXiv:0911.1763"},{"key":"785_CR35","doi-asserted-by":"publisher","first-page":"504","DOI":"10.1126\/science.1127647","volume":"313","author":"GE Hinton","year":"2006","unstructured":"Hinton GE, Salakhutdinov RR (2006) Reducing the dimensionality of data with neural networks. Science 313:504\u2013507","journal-title":"Science"},{"key":"785_CR36","doi-asserted-by":"publisher","first-page":"359","DOI":"10.1016\/0893-6080(89)90020-8","volume":"2","author":"K Hornik","year":"1989","unstructured":"Hornik K, Stinchcombe M, White H (1989) Multilayer feedforward networks are universal approximators. Neural Netw 2:359\u2013366","journal-title":"Neural Netw"},{"key":"785_CR37","unstructured":"Husz\u00e1r F (2017) Variational inference using implicit distributions. \n                    arXiv:1702.08235"},{"key":"785_CR38","unstructured":"Karpathy A, Johnson J, Fei-Fei L (2015) Visualizing and understanding recurrent networks. \n                    arXiv:1506.02078"},{"key":"785_CR39","unstructured":"Karras T, Aila T, Laine S, Lehtinen J (2018) Progressive growing of gans for improved quality, stability, and variation. ICLR"},{"key":"785_CR40","doi-asserted-by":"crossref","unstructured":"Kempka M, Wydmuch M, Runc G, Toczek J, Ja\u015bkowski W (2016) Vizdoom: a doom-based AI research platform for visual reinforcement learning. \n                    arXiv:1605.02097","DOI":"10.1109\/CIG.2016.7860433"},{"key":"785_CR41","unstructured":"Kingma DP, Ba J (2014) Adam: a method for stochastic optimization. \n                    arXiv:1412.6980"},{"key":"785_CR42","unstructured":"Kingma DP, Welling M (2014) Auto-encoding variational bayes. ICLR"},{"key":"785_CR43","unstructured":"Kingma DP, Salimans T, Jozefowicz R, Chen X, Sutskever I, Welling M (2016) Improving variational inference with inverse autoregressive flow. \n                    arXiv:1606.04934"},{"issue":"12","key":"785_CR44","doi-asserted-by":"publisher","first-page":"712","DOI":"10.1016\/j.tins.2004.10.007","volume":"27","author":"D Knill","year":"2004","unstructured":"Knill D, Pouget A (2004) The bayesian brain: the role of uncertainty in neural coding and computation. Trends Neurosci 27(12):712\u2013719","journal-title":"Trends Neurosci"},{"key":"785_CR45","unstructured":"Le QV, Jaitly N, Hinton GE (2015) A simple way to initialize recurrent networks of rectified linear units. \n                    arXiv:1504.00941"},{"key":"785_CR46","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun Y, Bengio Y, Hinton GE (2015) Deep learning. Nature 521:436\u2013444","journal-title":"Nature"},{"key":"785_CR47","unstructured":"Ledig C, Theis L, Husz\u00e1r F, Caballero J, Cunningham A, Acosta A, Aitken A, Tejani A, Totz J, Wang Z, Shi W (2016) Photo-realistic single image super-resolution using a generative adversarial network. \n                    arXiv:1609.04802"},{"key":"785_CR48","unstructured":"Liu MY, Breuel T, Kautz J (2017) Unsupervised image-to-image translation networks. Neural Information Processing Systems (NIPS). \n                    arXiv:1703.00848"},{"key":"785_CR49","unstructured":"Maal\u00f8e L, S\u00f8nderby CK, S\u00f8nderby SK, Winther O (2016) Auxiliary deep generative models. \n                    arXiv:1602.05473"},{"key":"785_CR50","unstructured":"Maheswaranathan N, Metz L, Tucker G, Sohl-Dickenstein J (2018) Guided evolutionary strategies: escaping the curse of dimensionality in random search. \n                    arXiv:1806.10230"},{"key":"785_CR51","unstructured":"Mescheder L, Nowozin S, Geiger A (2017) Adversarial variational Bayes: unifying variational autoencoders and generative adversarial networks. \n                    arXiv:1701.04722"},{"key":"785_CR52","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/nature14236","volume":"518","author":"V Mnih","year":"2015","unstructured":"Mnih V, Kavukcuoglu K, Silver D, Rusu AA, Veness J, Bellemare MG, Graves A, Riedmiller M, Fidjeland AK, Ostrovski G, Petersen S, Beattie C, Sadik A, Antonoglou I, King H, Kumaran D, Wierstra D, Legg S, Hassabis D (2015) Human-level control through deep reinforcement learning. Nature 518:529\u2013533","journal-title":"Nature"},{"key":"785_CR53","doi-asserted-by":"crossref","unstructured":"Moore A (1991) Variable resolution dynamic programming: efficiently learning action maps in multivariate real-valued state-spaces. In: Proceedings of the eight international conference on machine learning. Morgan Kaufmann","DOI":"10.1016\/B978-1-55860-200-7.50069-6"},{"issue":"30","key":"785_CR54","doi-asserted-by":"publisher","first-page":"12491","DOI":"10.1073\/pnas.1101430108","volume":"108","author":"R Moreno-Bote","year":"2011","unstructured":"Moreno-Bote R, Knill D, Pouget A (2011) Bayesian sampling in visual perception. Proc Natl Acad Sci USA 108(30):12491\u201312496","journal-title":"Proc Natl Acad Sci USA"},{"key":"785_CR55","doi-asserted-by":"crossref","unstructured":"Pathak D, Pulkit A, Efros AA, Darrell T (2017) Curiosity-driven exploration by self-supervised prediction. \n                    arXiv:1705.05363","DOI":"10.1109\/CVPRW.2017.70"},{"key":"785_CR56","unstructured":"Platt JC, Barr AH (1988) Constrained differential optimization. In: Neural information processing systems. American Institute of Physics, New York, pp 612\u2013621"},{"key":"785_CR57","unstructured":"Radford A, Narasimhan K, Salimans T, Sutskever I (2018) Improving language understanding by generative pre-training. Technical report, OpenAI"},{"key":"785_CR58","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.plrev.2017.09.001","volume":"24","author":"MJD Ramstead","year":"2017","unstructured":"Ramstead MJD, Badcock PB, Friston KJ (2017) Answering schr\u00f6dinger\u2019s question: a free-energy formulation. Phys Life Rev 24:1\u201316","journal-title":"Phys Life Rev"},{"key":"785_CR59","unstructured":"Rezende DJ, Mohamed S (2015) Variational inference with normalizing flows. JMLR 37"},{"key":"785_CR60","unstructured":"Rezende DJ, Mohamed S, Wierstra D (2014) Stochastic backpropagation and approximate inference in deep generative models. ICML"},{"key":"785_CR61","unstructured":"Rezende DJ, Ali\u00a0Eslami SM, Mohamed S, Battaglia P, Jaderberg M, Heess N (2016) Unsupervised learning of 3d structure from images. \n                    arXiv:1607.00662"},{"key":"785_CR62","unstructured":"Salimans T, Ho J, Chen X, Sutskever I (2017) Evolution strategies as a scalable alternative to reinforcement learning. \n                    arXiv:1703.03864"},{"key":"785_CR63","doi-asserted-by":"publisher","first-page":"16575","DOI":"10.1038\/srep16575","volume":"5","author":"P Schwartenbeck","year":"2015","unstructured":"Schwartenbeck P, Fitzgerald T, Mathys C, Dolan R, Kronbichler M, Friston KJ (2015) Evidence for surprise minimization over value maximization in choice behavior. Sci Rep 5:16575","journal-title":"Sci Rep"},{"key":"785_CR64","doi-asserted-by":"publisher","first-page":"545","DOI":"10.1126\/science.268.5210.545","volume":"268","author":"HT Siegelmann","year":"1995","unstructured":"Siegelmann HT (1995) Computation beyond the turing limit. Science 268:545\u2013548","journal-title":"Science"},{"key":"785_CR65","unstructured":"Theano Development Team (2016) Theano: a Python framework for fast computation of mathematical expressions. \n                    arXiv:1605.02688"},{"key":"785_CR66","doi-asserted-by":"crossref","unstructured":"Todorov E, Erez T, Tassa Y (2012) Mujoco: A physics engine for model-based control. In: Proceedings of the IEEE\/RSJ international conference on intelligent robots and systems (IROS)","DOI":"10.1109\/IROS.2012.6386109"},{"key":"785_CR67","unstructured":"Tomczak JM, Welling M (2016) Improving variational auto-encoders using householder flow. \n                    arXiv:1611.09630"},{"key":"785_CR68","unstructured":"Tran D, Ranganath R, Blei D (2017) Hierarchical implicit models and likelihood-free variational inference. \n                    arXiv:1702.08896"},{"issue":"2","key":"785_CR69","doi-asserted-by":"publisher","first-page":"147","DOI":"10.1016\/j.tree.2015.11.009","volume":"31","author":"RA Watson","year":"2016","unstructured":"Watson RA, Szathm\u00e1ry E (2016) How can evolution learn? Trends Ecol Evol 31(2):147\u2013157","journal-title":"Trends Ecol Evol"},{"issue":"4","key":"785_CR70","doi-asserted-by":"publisher","first-page":"1314","DOI":"10.1523\/JNEUROSCI.3733-05.2006","volume":"26","author":"KF Wong","year":"2006","unstructured":"Wong KF, Wang XJ (2006) A recurrent network mechanism of time integration in perceptual decisions. J Neurosci 26(4):1314\u20131328","journal-title":"J Neurosci"},{"key":"785_CR71","doi-asserted-by":"crossref","unstructured":"Zhu JY, Park T, Isola P, Efros AA (2017) Unpaired image-to-image translation using cycle-consistent adversarial networks. \n                    arXiv:1703.10593","DOI":"10.1109\/ICCV.2017.244"}],"container-title":["Biological Cybernetics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00422-018-0785-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00422-018-0785-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00422-018-0785-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,10,21]],"date-time":"2019-10-21T20:42:27Z","timestamp":1571690547000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00422-018-0785-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,10,22]]},"references-count":71,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2018,12]]}},"alternative-id":["785"],"URL":"https:\/\/doi.org\/10.1007\/s00422-018-0785-7","relation":{},"ISSN":["0340-1200","1432-0770"],"issn-type":[{"value":"0340-1200","type":"print"},{"value":"1432-0770","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,10,22]]},"assertion":[{"value":"17 September 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 October 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 October 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}