{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T05:00:49Z","timestamp":1743051649362,"version":"3.40.3"},"publisher-location":"Cham","reference-count":51,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031287183"},{"type":"electronic","value":"9783031287190"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-28719-0_14","type":"book-chapter","created":{"date-parts":[[2023,3,21]],"date-time":"2023-03-21T18:03:51Z","timestamp":1679421831000},"page":"192-209","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Capsule Networks as\u00a0Generative Models"],"prefix":"10.1007","author":[{"given":"Alex B.","family":"Kiefer","sequence":"first","affiliation":[]},{"given":"Beren","family":"Millidge","sequence":"additional","affiliation":[]},{"given":"Alexander","family":"Tschantz","sequence":"additional","affiliation":[]},{"given":"Christopher L.","family":"Buckley","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,3,22]]},"reference":[{"key":"14_CR1","unstructured":"Bahdanau, D., Cho, K., Bengio, Y.: Neural machine translation by jointly learning to align and translate (2014). arXiv preprint arXiv:1409.0473"},{"key":"14_CR2","unstructured":"Beal, M.J.: Variational algorithms for approximate Bayesian inference. Technical report (2003)"},{"key":"14_CR3","doi-asserted-by":"publisher","first-page":"198","DOI":"10.1016\/j.jmp.2015.11.003","volume":"76","author":"R Bogacz","year":"2017","unstructured":"Bogacz, R.: A tutorial on the free-energy framework for modelling perception and learning. J. Math. Psychol. 76, 198\u2013211 (2017)","journal-title":"J. Math. Psychol."},{"key":"14_CR4","unstructured":"Bricken, T., Pehlevan, C.: Attention approximates sparse distributed memory. arXiv preprint arXiv:2111.05498 (2021)"},{"key":"14_CR5","unstructured":"Brown, T.B., et al.: Language models are few-shot learners. arXiv preprint arXiv:2005.14165 (2020)"},{"key":"14_CR6","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1016\/j.jmp.2017.09.004","volume":"81","author":"CL Buckley","year":"2017","unstructured":"Buckley, C.L., Kim, C.S., McGregor, S., Seth, A.K.: The free energy principle for action and perception: a mathematical review. J. Math. Psychol. 81, 55\u201379 (2017)","journal-title":"J. Math. Psychol."},{"issue":"4","key":"14_CR7","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1038\/nrn3687","volume":"15","author":"G Buzs\u00e1ki","year":"2014","unstructured":"Buzs\u00e1ki, G., Mizuseki, K.: The log-dynamic brain: how skewed distributions affect network operations. Nat. Rev. Neurosci. 15(4), 264\u2013278 (2014)","journal-title":"Nat. Rev. Neurosci."},{"key":"14_CR8","first-page":"15084","volume":"34","author":"L Chen","year":"2021","unstructured":"Chen, L., et al.: Decision transformer: reinforcement learning via sequence modeling. Adv. Neural. Inf. Process. Syst. 34, 15084\u201315097 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"issue":"6","key":"14_CR9","doi-asserted-by":"publisher","first-page":"327","DOI":"10.1038\/nrn3011","volume":"12","author":"CI De Zeeuw","year":"2011","unstructured":"De Zeeuw, C.I., Hoebeek, F.E., Bosman, L.W., Schonewille, M., Witter, L., Koekkoek, S.K.: Spatiotemporal firing patterns in the cerebellum. Nat. Rev. Neurosci. 12(6), 327\u2013344 (2011)","journal-title":"Nat. Rev. Neurosci."},{"issue":"2","key":"14_CR10","doi-asserted-by":"publisher","first-page":"288","DOI":"10.1007\/s10955-017-1806-y","volume":"168","author":"M Demircigil","year":"2017","unstructured":"Demircigil, M., Heusel, J., L\u00f6we, M., Upgang, S., Vermet, F.: On a model of associative memory with huge storage capacity. J. Stat. Phys. 168(2), 288\u2013299 (2017)","journal-title":"J. Stat. Phys."},{"key":"14_CR11","unstructured":"Dosovitskiy, A., et al.: An image is worth 16$$\\times $$16 words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"issue":"1456","key":"14_CR12","doi-asserted-by":"publisher","first-page":"815","DOI":"10.1098\/rstb.2005.1622","volume":"360","author":"K Friston","year":"2005","unstructured":"Friston, K.: A theory of cortical responses. Philos. Trans. Roy. Soc. B Biol. Sci. 360(1456), 815\u2013836 (2005)","journal-title":"Philos. Trans. Roy. Soc. B Biol. Sci."},{"key":"14_CR13","first-page":"181","volume":"3","author":"DJ Graham","year":"2006","unstructured":"Graham, D.J., Field, D.J.: Sparse coding in the neocortex. Evol. Nerv. Syst. 3, 181\u2013187 (2006)","journal-title":"Evol. Nerv. Syst."},{"key":"14_CR14","unstructured":"Greff, K., Srivastava, R.K., Schmidhuber, J.: Highway and residual networks learn unrolled iterative estimation. arXiv preprint arXiv:1612.07771 (2016)"},{"key":"14_CR15","unstructured":"Gregor, K., Danihelka, I., Graves, A., Rezende, D., Wierstra, D.: Draw: a recurrent neural network for image generation. In: International Conference on Machine Learning, pp. 1462\u20131471. PMLR (2015)"},{"key":"14_CR16","unstructured":"Hinton, G.: How to represent part-whole hierarchies in a neural network. arXiv preprint arXiv:2102.12627 (2021)"},{"key":"14_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1007\/978-3-642-21735-7_6","volume-title":"Artificial Neural Networks and Machine Learning \u2013 ICANN 2011","author":"GE Hinton","year":"2011","unstructured":"Hinton, G.E., Krizhevsky, A., Wang, S.D.: Transforming auto-encoders. In: Honkela, T., Duch, W., Girolami, M., Kaski, S. (eds.) ICANN 2011. LNCS, vol. 6791, pp. 44\u201351. Springer, Heidelberg (2011). https:\/\/doi.org\/10.1007\/978-3-642-21735-7_6"},{"key":"14_CR18","unstructured":"Hinton, G.E., Sabour, S., Frosst, N.: Matrix capsules with EM routing. In: International Conference on Learning Representations (2018)"},{"key":"14_CR19","unstructured":"Jastrzbski, S., Arpit, D., Ballas, N., Verma, V., Che, T., Bengio, Y.: Residual connections encourage iterative inference. arXiv preprint arXiv:1710.04773 (2017)"},{"key":"14_CR20","volume-title":"Sparse Distributed Memory","author":"P Kanerva","year":"1988","unstructured":"Kanerva, P.: Sparse Distributed Memory. MIT Press, Cambridge (1988)"},{"key":"14_CR21","unstructured":"Krotov, D., Hopfield, J.: Large associative memory problem in neurobiology and machine learning. arXiv preprint arXiv:2008.06996 (2020)"},{"key":"14_CR22","unstructured":"Krotov, D., Hopfield, J.J.: Dense associative memory for pattern recognition. Advance in Neural Information Processing System, vol. 29, pp. 1172\u20131180 (2016)"},{"issue":"11","key":"14_CR23","doi-asserted-by":"publisher","first-page":"571","DOI":"10.1016\/S0166-2236(00)01657-X","volume":"23","author":"VA Lamme","year":"2000","unstructured":"Lamme, V.A., Roelfsema, P.R.: The distinct modes of vision offered by feedforward and recurrent processing. Trends Neurosci. 23(11), 571\u2013579 (2000)","journal-title":"Trends Neurosci."},{"key":"14_CR24","unstructured":"Makhzani, A., Frey, B.J.: k-sparse autoencoders. CoRR abs\/1312.5663 (2014)"},{"issue":"12","key":"14_CR25","doi-asserted-by":"publisher","first-page":"2943","DOI":"10.1093\/cercor\/bhr384","volume":"22","author":"L Melloni","year":"2012","unstructured":"Melloni, L., van Leeuwen, S., Alink, A., M\u00fcller, N.G.: Interaction between bottom-up saliency and top-down control: how saliency maps are created in the human brain. Cereb. Cortex 22(12), 2943\u20132952 (2012)","journal-title":"Cereb. Cortex"},{"key":"14_CR26","unstructured":"Millidge, B., Salvatori, T., Song, Y., Lukasiewicz, T., Bogacz, R.: Universal hopfield networks: a general framework for single-shot associative memory models. arXiv preprint arXiv:2202.04557 (2022)"},{"key":"14_CR27","unstructured":"Millidge, B., Seth, A., Buckley, C.L.: Predictive coding: a theoretical and experimental review. arXiv preprint arXiv:2107.12979 (2021)"},{"key":"14_CR28","unstructured":"Naz\u00e1bal, A., Williams, C.K.I.: Inference for generative capsule models. CoRR abs\/2103.06676 (2021), https:\/\/arxiv.org\/abs\/2103.06676"},{"issue":"6583","key":"14_CR29","doi-asserted-by":"publisher","first-page":"607","DOI":"10.1038\/381607a0","volume":"381","author":"BA Olshausen","year":"1996","unstructured":"Olshausen, B.A., Field, D.J.: Emergence of simple-cell receptive field properties by learning a sparse code for natural images. Nature 381(6583), 607\u2013609 (1996)","journal-title":"Nature"},{"issue":"4","key":"14_CR30","doi-asserted-by":"publisher","first-page":"481","DOI":"10.1016\/j.conb.2004.07.007","volume":"14","author":"BA Olshausen","year":"2004","unstructured":"Olshausen, B.A., Field, D.J.: Sparse coding of sensory inputs. Curr. Opin. Neurobiol. 14(4), 481\u2013487 (2004)","journal-title":"Curr. Opin. Neurobiol."},{"key":"14_CR31","unstructured":"Paik, I., Kwak, T., Kim, I.: Capsule networks need an improved routing algorithm. ArXiv abs\/1907.13327 (2019)"},{"key":"14_CR32","unstructured":"Parmar, N., et al.: Image transformer. In: International Conference on Machine Learning, pp. 4055\u20134064. PMLR (2018)"},{"key":"14_CR33","doi-asserted-by":"crossref","unstructured":"Pearl, J.: Probabilistic Reasoning in Intelligent Systems: Networks of Plausible Inference. Morgan kaufmann, Burlington (1988)","DOI":"10.1016\/B978-0-08-051489-5.50008-4"},{"issue":"8","key":"14_CR34","first-page":"9","volume":"1","author":"A Radford","year":"2019","unstructured":"Radford, A., Wu, J., Child, R., Luan, D., Amodei, D., Sutskever, I., et al.: Language models are unsupervised multitask learners. OpenAI Blog 1(8), 9 (2019)","journal-title":"OpenAI Blog"},{"key":"14_CR35","unstructured":"Ramsauer, H., et al.: Hopfield networks is all you need. arXiv preprint arXiv:2008.02217 (2020)"},{"key":"14_CR36","unstructured":"Rawlinson, D., Ahmed, A., Kowadlo, G.: Sparse unsupervised capsules generalize better. ArXiv abs\/1804.06094 (2018)"},{"key":"14_CR37","unstructured":"Reed, S., Zolna, K., et al.: A generalist agent. arXiv preprint arXiv:2205.06175 (2022)"},{"key":"14_CR38","doi-asserted-by":"crossref","unstructured":"Ribeiro, F.D.S., Leontidis, G., Kollias, S.D.: Capsule routing via variational bayes. In: AAAI, pp. 3749\u20133756 (2020)","DOI":"10.1609\/aaai.v34i04.5785"},{"key":"14_CR39","unstructured":"Sabour, S., Frosst, N., Hinton, G.E.: Dynamic routing between capsules. In: Advances in Neural Information Processing Systems, vol. 30 (2017)"},{"issue":"1","key":"14_CR40","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1016\/S0306-4522(00)00548-0","volume":"103","author":"N Schweighofer","year":"2001","unstructured":"Schweighofer, N., Doya, K., Lay, F.: Unsupervised learning of granule cell sparse codes enhances cerebellar adaptive control. Neuroscience 103(1), 35\u201350 (2001)","journal-title":"Neuroscience"},{"key":"14_CR41","volume-title":"Handbook of Brain Microcircuits","author":"GM Shepherd","year":"2018","unstructured":"Shepherd, G.M., Grillner, S.: Handbook of Brain Microcircuits. Oxford University Press, Oxford (2018)"},{"key":"14_CR42","unstructured":"Smith, L., Schut, L., Gal, Y., van der Wilk, M.: Capsule networks - a probabilistic perspective. CoRR abs\/2004.03553 (2020). https:\/\/arxiv.org\/abs\/2004.03553"},{"key":"14_CR43","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/9780262028707.001.0001","volume-title":"Principles of Neural Design","author":"P Sterling","year":"2015","unstructured":"Sterling, P., Laughlin, S.: Principles of Neural Design. MIT Press, Cambridge (2015)"},{"issue":"2","key":"14_CR44","first-page":"77","volume":"135","author":"J Theeuwes","year":"2010","unstructured":"Theeuwes, J.: Top-down and bottom-up control of visual selection. Acta Physiol. (Oxf) 135(2), 77\u201399 (2010)","journal-title":"Acta Physiol. (Oxf)"},{"key":"14_CR45","doi-asserted-by":"crossref","unstructured":"Tschantz, A., Millidge, B., Seth, A.K., Buckley, C.L.: Hybrid predictive coding: Inferring, fast and slow. arXiv preprint arXiv:2204.02169 (2022)","DOI":"10.1371\/journal.pcbi.1011280"},{"issue":"1\u20132","key":"14_CR46","doi-asserted-by":"publisher","first-page":"167","DOI":"10.2478\/v10053-008-0022-3","volume":"3","author":"R VanRullen","year":"2007","unstructured":"VanRullen, R.: The power of the feed-forward sweep. Adv. Cogn. Psychol. 3(1\u20132), 167 (2007)","journal-title":"Adv. Cogn. Psychol."},{"key":"14_CR47","unstructured":"Vaswani, A., Shazeer, N., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems, pp. 5998\u20136008 (2017)"},{"key":"14_CR48","doi-asserted-by":"crossref","unstructured":"Wainwright, M.J., Jordan, M.I., et al.: Graphical models, exponential families, and variational inference. Found. Trends\u00ae Mach. Learn. 1(1\u20132), 1\u2013305 (2008)","DOI":"10.1561\/2200000001"},{"issue":"11","key":"14_CR49","doi-asserted-by":"publisher","first-page":"2100","DOI":"10.1162\/jocn.2008.21173","volume":"21","author":"R Weidner","year":"2009","unstructured":"Weidner, R., Krummenacher, J., Reimann, B., M\u00fcller, H.J., Fink, G.R.: Sources of top-down control in visual search. J. Cogn. Neurosci. 21(11), 2100\u20132113 (2009)","journal-title":"J. Cogn. Neurosci."},{"issue":"6","key":"14_CR50","doi-asserted-by":"publisher","first-page":"2907","DOI":"10.1152\/jn.00594.2010","volume":"105","author":"BD Willmore","year":"2011","unstructured":"Willmore, B.D., Mazer, J.A., Gallant, J.L.: Sparse coding in striate and extrastriate visual cortex. J. Neurophysiol. 105(6), 2907\u20132919 (2011)","journal-title":"J. Neurophysiol."},{"key":"14_CR51","unstructured":"Zheng, Q., Zhang, A., Grover, A.: Online decision transformer. arXiv preprint arXiv:2202.05607 (2022)"}],"container-title":["Communications in Computer and Information Science","Active Inference"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-28719-0_14","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,16]],"date-time":"2024-10-16T19:47:26Z","timestamp":1729108046000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-28719-0_14"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031287183","9783031287190"],"references-count":51,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-28719-0_14","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"type":"print","value":"1865-0929"},{"type":"electronic","value":"1865-0937"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"22 March 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"Code for the capsules network is adapted fromand can be found at:. Code reproducing the toy model experiments and figure in Appendix B can be found at:.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Code Availability"}},{"value":"IWAI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Workshop on Active Inference","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Grenoble","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"France","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19 September 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19 September 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"3","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"iwai-ws2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/iwaiworkshop.github.io\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}