{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,9]],"date-time":"2026-04-09T10:41:06Z","timestamp":1775731266658,"version":"3.50.1"},"publisher-location":"Cham","reference-count":37,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031771378","type":"print"},{"value":"9783031771385","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,12,31]],"date-time":"2024-12-31T00:00:00Z","timestamp":1735603200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,12,31]],"date-time":"2024-12-31T00:00:00Z","timestamp":1735603200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-77138-5_4","type":"book-chapter","created":{"date-parts":[[2024,12,30]],"date-time":"2024-12-30T11:46:31Z","timestamp":1735559191000},"page":"49-71","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Learning in\u00a0Hybrid Active Inference Models"],"prefix":"10.1007","author":[{"given":"Poppy","family":"Collis","sequence":"first","affiliation":[]},{"given":"Ryan","family":"Singh","sequence":"additional","affiliation":[]},{"given":"Paul F.","family":"Kinghorn","sequence":"additional","affiliation":[]},{"given":"Christopher L.","family":"Buckley","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,12,31]]},"reference":[{"key":"4_CR1","unstructured":"Abdulsamad, H., Peters, J.: Hierarchical decomposition of nonlinear dynamics and control for system identification and policy distillation. In: Bayen, A.M., et al. (eds.) Proceedings of the 2nd Conference on Learning for Dynamics and Control. Proceedings of Machine Learning Research, vol.\u00a0120, pp. 904\u2013914. PMLR (2020)"},{"key":"4_CR2","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1109\/OJCSYS.2023.3277308","volume":"2","author":"H Abdulsamad","year":"2023","unstructured":"Abdulsamad, H., Peters, J.: Model-based reinforcement learning via stochastic hybrid models. IEEE Open J. Control Syst. 2, 155\u2013170 (2023)","journal-title":"IEEE Open J. Control Syst."},{"key":"4_CR3","doi-asserted-by":"crossref","unstructured":"Bemporad, A., Borrelli, F., Morari, M.: Piecewise linear optimal controllers for hybrid systems. In: Proceedings of the 2000 American Control Conference. ACC (IEEE Cat. No. 00CH36334), vol.\u00a02, pp. 1190\u20131194 (2000)","DOI":"10.1109\/ACC.2000.876688"},{"issue":"1","key":"4_CR4","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1016\/S0005-1098(01)00174-1","volume":"38","author":"A Bemporad","year":"2002","unstructured":"Bemporad, A., Morari, M., Dua, V., Pistikopoulos, E.N.: The explicit linear quadratic regulator for constrained systems. Automatica 38(1), 3\u201320 (2002)","journal-title":"Automatica"},{"key":"4_CR5","unstructured":"Block, A., Jadbabaie, A., Pfrommer, D., Simchowitz, M., Tedrake, R.: Provable guarantees for generative behavior cloning: bridging low-level stability and high-level behavior (2023)"},{"issue":"3","key":"4_CR6","doi-asserted-by":"publisher","first-page":"541","DOI":"10.1109\/TCST.2005.860527","volume":"14","author":"F Borrelli","year":"2006","unstructured":"Borrelli, F., Bemporad, A., Fodor, M., Hrovat, D.: An MPC\/hybrid system approach to traction control. IEEE Trans. Control Syst. Technol. 14(3), 541\u2013552 (2006)","journal-title":"IEEE Trans. Control Syst. Technol."},{"key":"4_CR7","doi-asserted-by":"crossref","unstructured":"Coulom, R.: Efficient selectivity and backup operators in Monte-Carlo tree search. In: van\u00a0den Herik, H.J., Ciancarini, P., Donkers, H.H.L.M.J. (eds.) Computers and Games, pp. 72\u201383. Springer, Heidelberg (2007)","DOI":"10.1007\/978-3-540-75538-8_7"},{"key":"4_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.jmp.2020.102447","volume":"99","author":"L Da Costa","year":"2020","unstructured":"Da Costa, L., Parr, T., Sajid, N., Veselic, S., Neacsu, V., Friston, K.: Active inference on discrete state-spaces: a synthesis. J. Math. Psychol. 99, 102447 (2020)","journal-title":"J. Math. Psychol."},{"issue":"2","key":"4_CR9","doi-asserted-by":"publisher","first-page":"337","DOI":"10.1007\/s10994-016-5580-x","volume":"104","author":"C Daniel","year":"2016","unstructured":"Daniel, C., van Hoof, H., Peters, J., Neumann, G.: Probabilistic inference for determining options in reinforcement learning. Mach. Learn. 104(2), 337\u2013357 (2016)","journal-title":"Mach. Learn."},{"key":"4_CR10","unstructured":"Dayan, P., Hinton, G.E.: Feudal reinforcement learning. In: Hanson, S., Cowan, J., Giles, C. (eds.) Advances in Neural Information Processing Systems, vol.\u00a05. Morgan-Kaufmann (1992)"},{"key":"4_CR11","unstructured":"Fox, E., Sudderth, E., Jordan, M., Willsky, A.: Nonparametric Bayesian learning of switching linear dynamical systems. In: Koller, D., Schuurmans, D., Bengio, Y., Bottou, L. (eds.) Advances in Neural Information Processing Systems, vol.\u00a021. Curran Associates, Inc. (2008)"},{"key":"4_CR12","doi-asserted-by":"crossref","unstructured":"Friston, K., et al.: Supervised structure learning (2023)","DOI":"10.1016\/j.biopsycho.2024.108891"},{"issue":"4","key":"4_CR13","doi-asserted-by":"publisher","first-page":"381","DOI":"10.1162\/NETN_a_00018","volume":"1","author":"KJ Friston","year":"2017","unstructured":"Friston, K.J., Parr, T., de Vries, B.: The graphical brain: belief propagation and active inference. Netw. Neurosci. 1(4), 381\u2013414 (2017)","journal-title":"Netw. Neurosci."},{"key":"4_CR14","doi-asserted-by":"publisher","DOI":"10.1016\/j.heares.2020.107998","volume":"399","author":"KJ Friston","year":"2021","unstructured":"Friston, K.J., Sajid, N., Quiroga-Martinez, D.R., Parr, T., Price, C.J., Holmes, E.: Active listening. Hear. Res. 399, 107998 (2021)","journal-title":"Hear. Res."},{"issue":"4","key":"4_CR15","doi-asserted-by":"publisher","first-page":"831","DOI":"10.1162\/089976600300015619","volume":"12","author":"Z Ghahramani","year":"2000","unstructured":"Ghahramani, Z., Hinton, G.E.: Variational learning for switching state-space models. Neural Comput. 12(4), 831\u2013864 (2000)","journal-title":"Neural Comput."},{"key":"4_CR16","doi-asserted-by":"publisher","first-page":"236","DOI":"10.1016\/S1364-6613(00)01662-4","volume":"5","author":"F Gobet","year":"2001","unstructured":"Gobet, F., et al.: Chunking mechanisms in human learning. Trends Cogn. Sci. 5, 236\u2013243 (2001)","journal-title":"Trends Cogn. Sci."},{"key":"4_CR17","unstructured":"Gou, S.Z., Liu, Y.: DQN with model-based exploration: efficient learning on environments with sparse rewards. CoRR abs\/1903.09295 (2019)"},{"key":"4_CR18","unstructured":"Hafner, D., Lee, K.H., Fischer, I., Abbeel, P.: Deep hierarchical planning from pixels (2022)"},{"key":"4_CR19","doi-asserted-by":"crossref","unstructured":"Heins, C., et al.: pymdp: a Python library for active inference in discrete state spaces. arXiv preprint arXiv:2201.03904 (2022)","DOI":"10.21105\/joss.04098"},{"issue":"12","key":"4_CR20","doi-asserted-by":"publisher","first-page":"1565","DOI":"10.3390\/e23121565","volume":"23","author":"MT Koudahl","year":"2021","unstructured":"Koudahl, M.T., Kouw, W.M., de Vries, B.: On epistemics in expected free energy for linear gaussian state space models. Entropy 23(12), 1565 (2021)","journal-title":"Entropy"},{"key":"4_CR21","doi-asserted-by":"crossref","unstructured":"LaValle, S.M.: Planning Algorithms, chap.\u00a02. Cambridge University Press, Cambridge (2006)","DOI":"10.1017\/CBO9780511546877"},{"key":"4_CR22","unstructured":"Linderman, S.W., Miller, A.C., Adams, R.P., Blei, D.M., Paninski, L., Johnson, M.J.: Recurrent switching linear dynamical systems (2016)"},{"key":"4_CR23","doi-asserted-by":"crossref","unstructured":"Millidge, B., Tschantz, A., Seth, A.K., Buckley, C.L.: On the relationship between active inference and control as inference (2020)","DOI":"10.1007\/978-3-030-64919-7_1"},{"key":"4_CR24","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/nature14236","volume":"518","author":"V Mnih","year":"2015","unstructured":"Mnih, V., et al.: Human-level control through deep reinforcement learning. Nature 518, 529\u2013533 (2015)","journal-title":"Nature"},{"key":"4_CR25","unstructured":"Murphy, K.P.: Machine Learning: A Probabilistic Perspective. MIT Press (2012)"},{"key":"4_CR26","volume-title":"Human Problem Solving","author":"A Newell","year":"1972","unstructured":"Newell, A., Simon, H.A.: Human Problem Solving. Prentice-Hall, Englewood Cliffs (1972)"},{"key":"4_CR27","unstructured":"OpenAI: Continuous mountain car environment (2021). Accessed 25 May 2024"},{"key":"4_CR28","doi-asserted-by":"crossref","unstructured":"Parr, T., Pezzulo, G., Friston, K.: Active Inference: The Free Energy Principle in Mind, Brain, and Behavior. MIT Press (2022)","DOI":"10.7551\/mitpress\/12441.001.0001"},{"issue":"9","key":"4_CR29","doi-asserted-by":"publisher","first-page":"2319","DOI":"10.1162\/neco_a_01102","volume":"30","author":"T Parr","year":"2018","unstructured":"Parr, T., Friston, K.J.: The discrete and continuous brain: from decisions to movement-and back again. Neural Comput. 30(9), 2319\u20132347 (2018)","journal-title":"Neural Comput."},{"issue":"8","key":"4_CR30","doi-asserted-by":"publisher","first-page":"2473","DOI":"10.1007\/s00213-019-05240-0","volume":"236","author":"T Parr","year":"2019","unstructured":"Parr, T., Friston, K.J.: The computational pharmacology of oculomotion. Psychopharmacology 236(8), 2473\u20132484 (2019)","journal-title":"Psychopharmacology"},{"key":"4_CR31","unstructured":"Priorelli, M., Stoianov, I.P.: Hierarchical hybrid modeling for flexible tool use (2024)"},{"issue":"5","key":"4_CR32","doi-asserted-by":"publisher","first-page":"1327","DOI":"10.1007\/s00170-021-07682-3","volume":"117","author":"M Schwenzer","year":"2021","unstructured":"Schwenzer, M., Ay, M., Bergs, T., Abel, D.: Review on model predictive control: an engineering perspective. Int. J. Adv. Manuf. Technol. 117(5), 1327\u20131349 (2021)","journal-title":"Int. J. Adv. Manuf. Technol."},{"issue":"2","key":"4_CR33","doi-asserted-by":"publisher","first-page":"346","DOI":"10.1109\/TAC.1981.1102596","volume":"26","author":"E Sontag","year":"1981","unstructured":"Sontag, E.: Nonlinear regulation: the piecewise linear approach. IEEE Trans. Autom. Control 26(2), 346\u2013358 (1981)","journal-title":"IEEE Trans. Autom. Control"},{"issue":"1","key":"4_CR34","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1016\/S0004-3702(99)00052-1","volume":"112","author":"RS Sutton","year":"1999","unstructured":"Sutton, R.S., Precup, D., Singh, S.: Between MDPs and semi-MDPs: a framework for temporal abstraction in reinforcement learning. Artif. Intell. 112(1), 181\u2013211 (1999)","journal-title":"Artif. Intell."},{"key":"4_CR35","doi-asserted-by":"crossref","unstructured":"Tessler, C., Givony, S., Zahavy, T., Mankowitz, D., Mannor, S.: A deep hierarchical approach to lifelong learning in minecraft. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 31, no. 1 (2017)","DOI":"10.1609\/aaai.v31i1.10744"},{"key":"4_CR36","unstructured":"Vezhnevets, A.S., et al.: FeUdal networks for hierarchical reinforcement learning. In: Precup, D., Teh, Y.W. (eds.) Proceedings of the 34th International Conference on Machine Learning. Proceedings of Machine Learning Research, vol.\u00a070, pp. 3540\u20133549. PMLR (2017)"},{"key":"4_CR37","unstructured":"Zoltowski, D.M., Pillow, J.W., Linderman, S.W.: Unifying and generalizing models of neural dynamics during decision-making (2020)"}],"container-title":["Communications in Computer and Information Science","Active Inference"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-77138-5_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,30]],"date-time":"2024-12-30T12:05:17Z","timestamp":1735560317000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-77138-5_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,31]]},"ISBN":["9783031771378","9783031771385"],"references-count":37,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-77138-5_4","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"value":"1865-0929","type":"print"},{"value":"1865-0937","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12,31]]},"assertion":[{"value":"31 December 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"IWAI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Workshop on Active Inference","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Oxford","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"United Kingdom","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"9 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"11 September 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"5","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"iwai-ws2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/iwaiworkshop.github.io\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}