{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T20:28:05Z","timestamp":1778012885312,"version":"3.51.4"},"reference-count":125,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2023,11,17]],"date-time":"2023-11-17T00:00:00Z","timestamp":1700179200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,11,17]],"date-time":"2023-11-17T00:00:00Z","timestamp":1700179200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Mach Intell"],"DOI":"10.1038\/s42256-023-00754-x","type":"journal-article","created":{"date-parts":[[2023,11,17]],"date-time":"2023-11-17T17:02:31Z","timestamp":1700240551000},"page":"1181-1188","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":30,"title":["A social path to human-like artificial intelligence"],"prefix":"10.1038","volume":"5","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6212-9104","authenticated-orcid":false,"given":"Edgar A.","family":"Du\u00e9\u00f1ez-Guzm\u00e1n","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-9698-0865","authenticated-orcid":false,"given":"Suzanne","family":"Sadedin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jane X.","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4412-1686","authenticated-orcid":false,"given":"Kevin R.","family":"McKee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3153-916X","authenticated-orcid":false,"given":"Joel Z.","family":"Leibo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,11,17]]},"reference":[{"key":"754_CR1","unstructured":"Krizhevsky, A., Sutskever, I. & Hinton, G. E. Imagenet classification with deep convolutional neural networks. Adv. NeurIPS 25, 1097\u20131105 (2012)."},{"key":"754_CR2","doi-asserted-by":"crossref","unstructured":"Deng, J. et al. Imagenet: a large-scale hierarchical image database. IEEE Conf. Comput. Vis. Pattern Recog. 248\u2013255 (2009).","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"754_CR3","unstructured":"Kaplan, J. et al. Scaling laws for neural language models. Preprint at https:\/\/arXiv.org\/abs\/2001.08361 (2020)."},{"key":"754_CR4","unstructured":"Bommasani, R. et al. On the opportunities and risks of foundation models. Preprint at https:\/\/arXiv.org\/abs\/2108.07258 (2021)."},{"key":"754_CR5","unstructured":"Hoffmann, J. et al. Training compute-optimal large language models. Preprint at https:\/\/arXiv.org\/abs\/2203.15556 (2022)."},{"key":"754_CR6","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1162\/daed_a_01902","volume":"151","author":"L Fei-Fei","year":"2022","unstructured":"Fei-Fei, L. & Krishna, R. Searching for computer vision north stars. Daedalus 151, 85\u201399 (2022).","journal-title":"Daedalus"},{"key":"754_CR7","first-page":"23716","volume":"35","author":"J-B Alayrac","year":"2022","unstructured":"Alayrac, J.-B. et al. Flamingo: a visual language model for few-shot learning. Adv. NeurIPS 35, 23716\u201323736 (2022).","journal-title":"Adv. NeurIPS"},{"key":"754_CR8","doi-asserted-by":"crossref","unstructured":"Young, T. Experiments and calculations relative to physical optics (The 1803 Bakerian lecture). Phil. Trans. R. Soc. 94, 1\u201316 (1804).","DOI":"10.1098\/rstl.1804.0001"},{"key":"754_CR9","unstructured":"Sutton, R. S. & Barto, A. G. Reinforcement Learning: An Introduction (MIT Press, 2018)."},{"key":"754_CR10","unstructured":"Schaul, T., Borsa, D., Modayil, J. & Pascanu, R. Ray interference: a source of plateaus in deep reinforcement learning. Preprint at https:\/\/arXiv.org\/abs\/1904.11455 (2019)."},{"key":"754_CR11","unstructured":"Ortega, P. A. et al. Shaking the foundations: delusions in sequence models for interaction and control. Preprint at https:\/\/arXiv.org\/abs\/2110.10819 (2021)."},{"key":"754_CR12","unstructured":"Huang, J. et al. Large language models can self-improve. Preprint at https:\/\/arXiv.org\/abs\/2210.11610 (2022)."},{"key":"754_CR13","unstructured":"Shumailov, I. et al. The curse of recursion: training on generated data makes models forget. Preprint at https:\/\/arXiv.org\/abs\/2305.17493 (2023)."},{"key":"754_CR14","unstructured":"Wang, R., Lehman, J., Clune, J. & Stanley, K. O. Paired open-ended trailblazer (POET): endlessly generating increasingly complex and diverse learning environments and their solutions. Preprint at https:\/\/arXiv.org\/abs\/1901.01753 (2019)."},{"key":"754_CR15","doi-asserted-by":"crossref","unstructured":"Portelas, R., Colas, C., Weng, L., Hofmann, K. & Oudeyer, P.-Y. Automatic curriculum learning for deep RL: a short survey. Proc. 29th International Joint Conference on Artificial Intelligence Survey Track (2020).","DOI":"10.24963\/ijcai.2020\/671"},{"key":"754_CR16","doi-asserted-by":"publisher","first-page":"1287","DOI":"10.1613\/jair.1.12087","volume":"69","author":"C Linke","year":"2020","unstructured":"Linke, C., Ady, N. M., White, M., Degris, T. & White, A. Adapting behavior via intrinsic reward: a survey and empirical study. J Artif. Intell. Res. 69, 1287\u20131332 (2020).","journal-title":"J Artif. Intell. Res."},{"key":"754_CR17","doi-asserted-by":"publisher","first-page":"6","DOI":"10.3389\/neuro.12.006.2007","volume":"1","author":"P-Y Oudeyer","year":"2007","unstructured":"Oudeyer, P.-Y. & Kaplan, F. What is intrinsic motivation? A typology of computational approaches. Front. Neurorobot. 1, 6 (2007).","journal-title":"Front. Neurorobot."},{"key":"754_CR18","doi-asserted-by":"crossref","unstructured":"Pathak, D., Agrawal, P., Efros, A. A. & Darrell, T. Curiosity-driven exploration by self-supervised prediction. Proc. 34th International Conference on Machine Learning 70, 2778\u20132787 (PMLR, 2017).","DOI":"10.1109\/CVPRW.2017.70"},{"key":"754_CR19","doi-asserted-by":"publisher","first-page":"1159","DOI":"10.1613\/jair.1.13554","volume":"74","author":"C Colas","year":"2022","unstructured":"Colas, C., Karch, T., Sigaud, O. & Oudeyer, P.-Y. Autotelic agents with intrinsically motivated goal-conditioned reinforcement learning: A short survey. J. Artif. Intell. Res. 74, 1159\u20131199 (2022).","journal-title":"J. Artif. Intell. Res."},{"key":"754_CR20","doi-asserted-by":"crossref","unstructured":"Ladosz, P., Weng, L., Kim, M. & Oh, H. Exploration in deep reinforcement learning: a survey. Inf. Fusion 85, 1\u201322 (2022).","DOI":"10.1016\/j.inffus.2022.03.003"},{"key":"754_CR21","doi-asserted-by":"publisher","first-page":"230539","DOI":"10.1098\/rsos.230539","volume":"10","author":"M Jiang","year":"2023","unstructured":"Jiang, M., Rockt\u00e4schel, T. & Grefenstette, E. General intelligence requires rethinking exploration. R. Soc. Open Sci. 10, 230539 (2023).","journal-title":"R. Soc. Open Sci."},{"key":"754_CR22","doi-asserted-by":"publisher","first-page":"209","DOI":"10.1023\/A:1017984413808","volume":"49","author":"M Kearns","year":"2002","unstructured":"Kearns, M. & Singh, S. Near-optimal reinforcement learning in polynomial time. Mach. Learn. 49, 209\u2013232 (2002).","journal-title":"Mach. Learn."},{"key":"754_CR23","first-page":"1","volume":"20","author":"I Osband","year":"2019","unstructured":"Osband, I., Van Roy, B., Russo, D. J. & Wen, Z. Deep exploration via randomized value functions. J. Mach. Learn. Res. 20, 1\u201362 (2019).","journal-title":"J. Mach. Learn. Res."},{"key":"754_CR24","unstructured":"Leibo, J. Z., Hughes, E., Lanctot, M. & Graepel, T. Autocurricula and the emergence of innovation from social interaction: a manifesto for multi-agent intelligence research. Preprint at https:\/\/arXiv.org\/abs\/1903.00742 (2019)."},{"key":"754_CR25","unstructured":"Sukhbaatar, S. et al. Intrinsic motivation and automatic curricula via asymmetric self-play. 6th International Conference on Learning Representations 6 (2018)."},{"key":"754_CR26","unstructured":"Leibo, J. Z. et al. Malthusian reinforcement learning. Proc. 18th International Conference on Autonomous Agents and MultiAgent Systems 1099\u20131107 (2019)."},{"key":"754_CR27","unstructured":"Baker, B. et al. Emergent tool use from multi-agent autocurricula. 8th International Conference on Learning Representations 8 (2020)."},{"key":"754_CR28","unstructured":"Balduzzi, D. et al. Open-ended learning in symmetric zero-sum games. Proc. 36th International Conference on Machine Learning 97, 434\u2013443 (PMLR, 2019)."},{"key":"754_CR29","unstructured":"Plappert, M. et al. Asymmetric self-play for automatic goal discovery in robotic manipulation. Preprint at https:\/\/arXiv.org\/abs\/2101.04882 (2021)."},{"key":"754_CR30","unstructured":"Goodfellow, I. et al. Generative adversarial nets. Adv. NeurIPS 27, 2672\u20132680 (2014)."},{"key":"754_CR31","doi-asserted-by":"publisher","first-page":"1360","DOI":"10.1126\/science.1146282","volume":"317","author":"E Herrmann","year":"2007","unstructured":"Herrmann, E., Call, J., Hern\u00e1ndez-Lloreda, M. V., Hare, B. & Tomasello, M. Humans have evolved specialized skills of social cognition: the cultural intelligence hypothesis. Science 317, 1360\u20131366 (2007).","journal-title":"Science"},{"key":"754_CR32","doi-asserted-by":"publisher","first-page":"10918","DOI":"10.1073\/pnas.1100290108","volume":"108","author":"R Boyd","year":"2011","unstructured":"Boyd, R., Richerson, P. J. & Henrich, J. The cultural niche: why social learning is essential for human adaptation. Proc. Natl Acad. Sci. USA 108, 10918\u201310925 (2011).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"754_CR33","doi-asserted-by":"publisher","first-page":"27","DOI":"10.1146\/annurev-ecolsys-110218-025040","volume":"50","author":"A Whiten","year":"2019","unstructured":"Whiten, A. Cultural evolution in animals. Annu. Rev. Ecol. Evol. Syst. 50, 27\u201348 (2019).","journal-title":"Annu. Rev. Ecol. Evol. Syst."},{"key":"754_CR34","doi-asserted-by":"publisher","first-page":"178","DOI":"10.1002\/(SICI)1520-6505(1998)6:5<178::AID-EVAN5>3.0.CO;2-8","volume":"6","author":"RIM Dunbar","year":"1998","unstructured":"Dunbar, R. I. M. The social brain hypothesis. Evol. Anthropol. 6, 178\u2013190 (1998).","journal-title":"Evol. Anthropol."},{"key":"754_CR35","doi-asserted-by":"publisher","first-page":"432","DOI":"10.1037\/com0000139","volume":"132","author":"RW Byrne","year":"2018","unstructured":"Byrne, R. W. Machiavellian intelligence retrospective. J. Comp. Psychol. 132, 432 (2018).","journal-title":"J. Comp. Psychol."},{"key":"754_CR36","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1038\/374227a0","volume":"374","author":"E Szathm\u00e1ry","year":"1995","unstructured":"Szathm\u00e1ry, E. & Maynard Smith, J. The major evolutionary transitions. Nature 374, 227\u2013232 (1995).","journal-title":"Nature"},{"key":"754_CR37","doi-asserted-by":"crossref","unstructured":"Jablonka, E. & Lamb, M. J. Evolution in Four Dimensions: Genetic, Epigenetic, Behavioral, and Symbolic Variation in the History of Life (MIT Press, 2014).","DOI":"10.7551\/mitpress\/9689.001.0001"},{"key":"754_CR38","doi-asserted-by":"crossref","unstructured":"Heyes, C. Cognitive Gadgets: The Cultural Evolution of Thinking (Harvard Univ. Press, 2018).","DOI":"10.4159\/9780674985155"},{"key":"754_CR39","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1146\/annurev-genet-102108-134304","volume":"43","author":"W-L Ng","year":"2009","unstructured":"Ng, W.-L. & Bassler, B. L. Bacterial quorum-sensing network architectures. Ann. Rev. Genet. 43, 197 (2009).","journal-title":"Ann. Rev. Genet."},{"key":"754_CR40","doi-asserted-by":"publisher","first-page":"215","DOI":"10.1016\/S0083-6729(10)83009-2","volume":"83","author":"FJ Verheggen","year":"2010","unstructured":"Verheggen, F. J., Haubruge, E. & Mescher, M. C. Alarm pheromones\u2014chemical signaling in response to danger. Vit. Horm. 83, 215\u2013239 (2010).","journal-title":"Vit. Horm."},{"key":"754_CR41","doi-asserted-by":"publisher","first-page":"4733","DOI":"10.1016\/j.cub.2020.08.079","volume":"30","author":"M Nagy","year":"2020","unstructured":"Nagy, M. et al. Synergistic benefits of group search in rats. Curr. Biol. 30, 4733\u20134738 (2020).","journal-title":"Curr. Biol."},{"key":"754_CR42","doi-asserted-by":"crossref","unstructured":"Schluter, D. The Ecology of Adaptive Radiation (Oxford Univ. Press, 2000).","DOI":"10.1093\/oso\/9780198505235.001.0001"},{"key":"754_CR43","unstructured":"Bansal, T., Pachocki, J., Sidor, S., Sutskever, I. & Mordatch, I. Emergent complexity via multi-agent competition. 6th International Conference on Learning Representations 6 (2018)."},{"key":"754_CR44","doi-asserted-by":"crossref","unstructured":"Reynolds, C. W. Flocks, herds and schools: a distributed behavioral model. Computer Graphics 21, 25\u201334 (1987).","DOI":"10.1145\/37402.37406"},{"key":"754_CR45","unstructured":"Lerer, A. & Peysakhovich, A. Maintaining cooperation in complex social dilemmas using deep reinforcement learning. Preprint at https:\/\/arXiv.org\/abs\/1707.01068 (2017)."},{"key":"754_CR46","unstructured":"Leibo, J. Z., Zambaldi, V., Lanctot, M., Marecki, J. & Graepel, T. Multi-agent reinforcement learning in sequential social dilemmas. Proc. 16th International Conference on Autonomous Agents and MultiAgent Systems 464\u2013473 (2017)."},{"key":"754_CR47","doi-asserted-by":"crossref","unstructured":"McKee, K. R., Leibo, J. Z., Beattie, C. & Everett, R. Quantifying the effects of environment and population diversity in multi-agent reinforcement learning. Auton. Agents Multi-Agent Syst. 36, 21 (2022).","DOI":"10.1007\/s10458-022-09548-8"},{"key":"754_CR48","first-page":"14502","volume":"34","author":"D Strouse","year":"2021","unstructured":"Strouse, D., McKee, K., Botvinick, M., Hughes, E. & Everett, R. Collaborating with humans without human data. Adv. NeurIPS 34, 14502\u201314515 (2021).","journal-title":"Adv. NeurIPS"},{"key":"754_CR49","unstructured":"Lazaridou, A., Peysakhovich, A. & Baroni, M. Multi-agent cooperation and the emergence of (natural) language. 5th International Conference on Learning Representations 5 (2017)."},{"key":"754_CR50","first-page":"17443","volume":"33","author":"WM Czarnecki","year":"2020","unstructured":"Czarnecki, W. M. et al. Real world games look like spinning tops. Adv. NeurIPS 33, 17443\u201317454 (2020).","journal-title":"Adv. NeurIPS"},{"key":"754_CR51","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1146\/annurev.ecolsys.36.091704.175517","volume":"38","author":"BJ McGill","year":"2007","unstructured":"McGill, B. J. & Brown, J. S. Evolutionary game theory and adaptive dynamics of continuous traits. Annu. Rev. Ecol. Evol. Syst. 38, 403\u2013435 (2007).","journal-title":"Annu. Rev. Ecol. Evol. Syst."},{"key":"754_CR52","doi-asserted-by":"publisher","first-page":"97","DOI":"10.1109\/4235.735432","volume":"2","author":"B Sareni","year":"1998","unstructured":"Sareni, B. & Krahenbuhl, L. Fitness sharing and niching methods revisited. IEEE Trans. Evol. Comp. 2, 97\u2013106 (1998).","journal-title":"IEEE Trans. Evol. Comp."},{"key":"754_CR53","doi-asserted-by":"publisher","first-page":"274","DOI":"10.1162\/artl_a_00319","volume":"26","author":"J Lehman","year":"2020","unstructured":"Lehman, J. et al. The surprising creativity of digital evolution: a collection of anecdotes from the evolutionary computation and artificial life research communities. Artif. Life 26, 274\u2013306 (2020).","journal-title":"Artif. Life"},{"key":"754_CR54","first-page":"1","volume":"1","author":"L Van Valen","year":"1973","unstructured":"Van Valen, L. A new evolutionary law. Evol. Theory 1, 1\u201330 (1973).","journal-title":"Evol. Theory"},{"key":"754_CR55","first-page":"489","volume":"205","author":"R Dawkins","year":"1979","unstructured":"Dawkins, R. & Krebs, J. R. Arms races between and within species. Proc. R. Soc. B 205, 489\u2013511 (1979).","journal-title":"Proc. R. Soc. B"},{"key":"754_CR56","doi-asserted-by":"publisher","first-page":"353","DOI":"10.1162\/artl.1994.1.4.353","volume":"1","author":"K Sims","year":"1994","unstructured":"Sims, K. Evolving 3D morphology and behavior by competition. Artif. Life 1, 353\u2013372 (1994).","journal-title":"Artif. Life"},{"key":"754_CR57","doi-asserted-by":"publisher","first-page":"311","DOI":"10.1162\/106454698568620","volume":"4","author":"S Nolfi","year":"1998","unstructured":"Nolfi, S. & Floreano, D. Coevolving predator and prey robots: do \u2018arms races\u2019 arise in artificial evolution? Artif. Life 4, 311\u2013335 (1998).","journal-title":"Artif. Life"},{"key":"754_CR58","doi-asserted-by":"publisher","first-page":"484","DOI":"10.1038\/nature16961","volume":"529","author":"D Silver","year":"2016","unstructured":"Silver, D. et al. Mastering the game of Go with deep neural networks and tree search. Nature 529, 484\u2013489 (2016).","journal-title":"Nature"},{"key":"754_CR59","unstructured":"Stooke, A. et al. Open-ended learning leads to generally capable agents. Preprint at https:\/\/arXiv.org\/abs\/2107.12808 (2021)."},{"key":"754_CR60","unstructured":"Johanson, M. B., Hughes, E., Timbers, F. & Leibo, J. Z. Emergent bartering behaviour in multi-agent reinforcement learning. Preprint at https:\/\/arXiv.org\/abs\/2205.06760 (2022)."},{"key":"754_CR61","unstructured":"Clune, J. AI-GAs: AI-generating algorithms, an alternate paradigm for producing general artificial intelligence. Preprint at https:\/\/arXiv.org\/abs\/1905.10985 (2019)."},{"key":"754_CR62","unstructured":"Nisioti, E. & Moulin-Frier, C. Grounding artificial intelligence in the origins of human behavior. Preprint at https:\/\/arXiv.org\/abs\/2012.08564 (2020)."},{"key":"754_CR63","unstructured":"Aubret, A., Matignon, L. & Hassas, S. A survey on intrinsic motivation in reinforcement learning. Preprint at https:\/\/arXiv.org\/abs\/1908.06976 (2019)."},{"key":"754_CR64","doi-asserted-by":"crossref","unstructured":"Tesauro, G. TD-Gammon, a self-teaching backgammon program, achieves master-level play. Neural Computation 6, 267\u2013285 (1994).","DOI":"10.1007\/978-1-4757-2379-3_11"},{"key":"754_CR65","doi-asserted-by":"publisher","first-page":"859","DOI":"10.1126\/science.aau6249","volume":"364","author":"M Jaderberg","year":"2019","unstructured":"Jaderberg, M. et al. Human-level performance in 3D multiplayer games with population-based reinforcement learning. Science 364, 859\u2013865 (2019).","journal-title":"Science"},{"key":"754_CR66","doi-asserted-by":"publisher","first-page":"1067","DOI":"10.1126\/science.ade9097","volume":"378","author":"A Bakhtin","year":"2022","unstructured":"Bakhtin, A. et al. Human-level play in the game of Diplomacy by combining language models with strategic reasoning. Science 378, 1067\u20131074 (2022).","journal-title":"Science"},{"key":"754_CR67","doi-asserted-by":"crossref","unstructured":"Byrne, R. & Whiten, A. Machiavellian Intelligence (Oxford Univ. Press, 1994).","DOI":"10.1093\/acprof:oso\/9780198522652.003.0013"},{"key":"754_CR68","unstructured":"Lanctot, M. et al. A unified game-theoretic approach to multiagent reinforcement learning. Adv. NeurIPS 30, 4190\u20134203 (2017)."},{"key":"754_CR69","doi-asserted-by":"publisher","first-page":"350","DOI":"10.1038\/s41586-019-1724-z","volume":"575","author":"O Vinyals","year":"2019","unstructured":"Vinyals, O. et al. Grandmaster level in StarCraft II using multi-agent reinforcement learning. Nature 575, 350\u2013354 (2019).","journal-title":"Nature"},{"key":"754_CR70","doi-asserted-by":"publisher","first-page":"208","DOI":"10.1126\/science.1184719","volume":"328","author":"L Rendell","year":"2010","unstructured":"Rendell, L. et al. Why copy others? Insights from the social learning strategies tournament. Science 328, 208\u2013213 (2010).","journal-title":"Science"},{"key":"754_CR71","doi-asserted-by":"publisher","first-page":"625","DOI":"10.1287\/orsc.1090.0468","volume":"21","author":"C Fang","year":"2010","unstructured":"Fang, C., Lee, J. & Schilling, M. A. Balancing exploration and exploitation through structural design: the isolation of subgroups and organizational learning. Org. Sci. 21, 625\u2013642 (2010).","journal-title":"Org. Sci."},{"key":"754_CR72","doi-asserted-by":"publisher","first-page":"667","DOI":"10.2189\/asqu.52.4.667","volume":"52","author":"D Lazer","year":"2007","unstructured":"Lazer, D. & Friedman, A. The network structure of exploration and exploitation. Admin. Sci. Quart. 52, 667\u2013694 (2007).","journal-title":"Admin. Sci. Quart."},{"key":"754_CR73","doi-asserted-by":"publisher","first-page":"422","DOI":"10.1037\/a0012798","volume":"137","author":"WA Mason","year":"2008","unstructured":"Mason, W. A., Jones, A. & Goldstone, R. L. Propagation of innovations in networked groups. J. Exp. Psychol. Gen. 137, 422 (2008).","journal-title":"J. Exp. Psychol. Gen."},{"key":"754_CR74","doi-asserted-by":"publisher","first-page":"431","DOI":"10.1163\/15685373-12340120","volume":"21","author":"M Vlasceanu","year":"2021","unstructured":"Vlasceanu, M., Morais, M. J. & Coman, A. Network structure impacts the synchronization of collective beliefs. J. Cogn. Cult. 21, 431\u2013448 (2021).","journal-title":"J. Cogn. Cult."},{"key":"754_CR75","doi-asserted-by":"publisher","first-page":"8171","DOI":"10.1073\/pnas.1525569113","volume":"113","author":"A Coman","year":"2016","unstructured":"Coman, A., Momennejad, I., Drach, R. D. & Geana, A. Mnemonic convergence in social networks: the emergent properties of cognition at a collective level. Proc. Natl Acad. Sci. USA 113, 8171\u20138176 (2016).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"754_CR76","doi-asserted-by":"crossref","unstructured":"Centola, D. The network science of collective intelligence. Trends Cogn. Sci. 26, 923\u2013941 (2022).","DOI":"10.1016\/j.tics.2022.08.009"},{"key":"754_CR77","doi-asserted-by":"publisher","first-page":"8734","DOI":"10.1073\/pnas.1802407115","volume":"115","author":"E Bernstein","year":"2018","unstructured":"Bernstein, E., Shore, J. & Lazer, D. How intermittent breaks in interaction improve collective intelligence. Proc. Natl Acad. Sci. USA 115, 8734\u20138739 (2018).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"754_CR78","doi-asserted-by":"crossref","unstructured":"McKee, K. R. et al. Scaffolding cooperation in human groups with deep reinforcement learning. Nat. Hum. Behav. 7, 1787\u20131796 (2023).","DOI":"10.1038\/s41562-023-01686-7"},{"key":"754_CR79","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1561\/2300000053","volume":"7","author":"T Osa","year":"2018","unstructured":"Osa, T. et al. An algorithmic perspective on imitation learning. Found. Trends Robot. 7, 1\u2013179 (2018).","journal-title":"Found. Trends Robot."},{"key":"754_CR80","doi-asserted-by":"crossref","unstructured":"Torabi, F., Warnell, G. & Stone, P. Behavioral cloning from observation. Proc. 27th International Joint Conference on Artificial Intelligence 4950\u20134957 (2018).","DOI":"10.24963\/ijcai.2018\/687"},{"key":"754_CR81","unstructured":"Ho, J. & Ermon, S. Generative adversarial imitation learning. Adv. NeurIPS 29, (2016)."},{"key":"754_CR82","unstructured":"Liu, S. et al. From motor control to team play in simulated humanoid football. Preprint at https:\/\/arXiv.org\/abs\/2105.12196 (2021)."},{"key":"754_CR83","unstructured":"Borsa, D. et al. Observational learning by reinforcement learning. Proc. 18th International Conference on Autonomous Agents and MultiAgent Systems 1117\u20131124 (2019)."},{"key":"754_CR84","unstructured":"Ndousse, K. K., Eck, D., Levine, S. & Jaques, N. Emergent social learning via multi-agent reinforcement learning. Proc. 38th International Conference on Machine Learning 139, 7991\u20138004 (PMLR, 2021)."},{"key":"754_CR85","unstructured":"Nisioti, E., Mahaut, M., Oudeyer, P.-Y., Momennejad, I. & Moulin-Frier, C. Social network structure shapes innovation: experience-sharing in RL with SAPIENS. Preprint at https:\/\/arXiv.org\/abs\/2206.05060 (2022)."},{"key":"754_CR86","doi-asserted-by":"publisher","first-page":"236","DOI":"10.1016\/j.jtbi.2005.08.038","volume":"239","author":"E Jablonka","year":"2006","unstructured":"Jablonka, E. & Lamb, M. J. The evolution of information in the major transitions. J. Theor. Biol. 239, 236\u2013246 (2006).","journal-title":"J. Theor. Biol."},{"key":"754_CR87","doi-asserted-by":"crossref","unstructured":"Henrich, J. The Secret of Our Success: How Culture is Driving Human Evolution, Domesticating Our Species, and Making Us Smarter (Princeton Univ. Press, 2016).","DOI":"10.1515\/9781400873296"},{"key":"754_CR88","doi-asserted-by":"publisher","first-page":"dev167486","DOI":"10.1242\/dev.167486","volume":"146","author":"S Bowling","year":"2019","unstructured":"Bowling, S., Lawlor, K. & Rodr\u00edguez, T. A. Cell competition: the winners and losers of fitness selection. Development 146, dev167486 (2019).","journal-title":"Development"},{"key":"754_CR89","doi-asserted-by":"publisher","first-page":"397","DOI":"10.1038\/356397a0","volume":"356","author":"MC Raff","year":"1992","unstructured":"Raff, M. C. Social controls on cell survival and cell death. Nature 356, 397\u2013400 (1992).","journal-title":"Nature"},{"key":"754_CR90","doi-asserted-by":"publisher","first-page":"e1004273","DOI":"10.1371\/journal.pcbi.1004273","volume":"11","author":"E Ferrante","year":"2015","unstructured":"Ferrante, E., Turgut, A. E., Du\u00e9\u00f1ez-Guzm\u00e1n, E., Dorigo, M. & Wenseleers, T. Evolution of self-organized task specialization in robot swarms. PLoS Comp. Biol. 11, e1004273 (2015).","journal-title":"PLoS Comp. Biol."},{"key":"754_CR91","unstructured":"Peysakhovich, A. & Lerer, A. Prosocial learning agents solve generalized stag hunts better than selfish ones. Proc. 17th International Conference on Autonomous Agents and MultiAgent Systems 2043\u20132044 (2018)."},{"key":"754_CR92","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11721-012-0075-2","volume":"7","author":"M Brambilla","year":"2013","unstructured":"Brambilla, M., Ferrante, E., Birattari, M. & Dorigo, M. Swarm robotics: a review from the swarm engineering perspective. Swarm Intell. 7, 1\u201341 (2013).","journal-title":"Swarm Intell."},{"key":"754_CR93","doi-asserted-by":"crossref","unstructured":"Oroojlooy, A. & Hajinezhad, D. A review of cooperative multi-agent deep reinforcement learning. Appl. Intell. 53, 13677\u201313722 (2023).","DOI":"10.1007\/s10489-022-04105-y"},{"key":"754_CR94","doi-asserted-by":"publisher","first-page":"36","DOI":"10.3389\/frobt.2020.00036","volume":"7","author":"M Schranz","year":"2020","unstructured":"Schranz, M., Umlauft, M., Sende, M. & Elmenreich, W. Swarm robotic behaviors and current applications. Front. Robot. AI 7, 36 (2020).","journal-title":"Front. Robot. AI"},{"key":"754_CR95","unstructured":"Leibo, J. Z. et al. Scalable evaluation of multi-agent reinforcement learning with Melting Pot. Proc. 38th International Conference on Machine Learning 139, 6187\u20136199 (PMLR, 2021)."},{"key":"754_CR96","unstructured":"Sunehag, P., Vezhnevets, A. S., Du\u00e9\u00f1ez-Guzm\u00e1n, E., Mordach, I. & Leibo, J. Z. Diversity through exclusion (DTE): niche identification for reinforcement learning through value-decomposition. Proc. 2023 International Conference on Autonomous Agents and Multiagent Systems 2827\u20132829 (2023)."},{"key":"754_CR97","unstructured":"Wang, J. X. et al. Evolving intrinsic motivations for altruistic behavior. Proc. 18th International Conference on Autonomous Agents and MultiAgent Systems 683\u2013692 (2019)."},{"key":"754_CR98","unstructured":"Gemp, I. et al. D3C: reducing the price of anarchy in multi-agent learning. Proc. 21st International Conference on Autonomous Agents and Multiagent Systems 498\u2013506 (2022)."},{"key":"754_CR99","doi-asserted-by":"publisher","first-page":"eabk2607","DOI":"10.1126\/sciadv.abk2607","volume":"8","author":"S Zheng","year":"2022","unstructured":"Zheng, S., Trott, A., Srinivasa, S., Parkes, D. C. & Socher, R. The AI economist: taxation policy design via two-level deep multiagent reinforcement learning. Sci. Adv. 8, eabk2607 (2022).","journal-title":"Sci. Adv."},{"key":"754_CR100","doi-asserted-by":"publisher","first-page":"1398","DOI":"10.1038\/s41562-022-01383-x","volume":"6","author":"R Koster","year":"2022","unstructured":"Koster, R. et al. Human-centered mechanism design with democratic AI. Nat. Hum. Behav. 6, 1398\u20131407 (2022).","journal-title":"Nat. Hum. Behav."},{"key":"754_CR101","doi-asserted-by":"publisher","first-page":"1114","DOI":"10.1126\/science.1213969","volume":"335","author":"LG Dean","year":"2012","unstructured":"Dean, L. G., Kendal, R. L., Schapiro, S. J., Thierry, B. & Laland, K. N. Identification of the social and cognitive processes underlying human cumulative culture. Science 335, 1114\u20131118 (2012).","journal-title":"Science"},{"key":"754_CR102","doi-asserted-by":"publisher","first-page":"20150192","DOI":"10.1098\/rstb.2015.0192","volume":"371","author":"M Muthukrishna","year":"2016","unstructured":"Muthukrishna, M. & Henrich, J. Innovation in the collective brain. Phil. Trans. R. Soc. B 371, 20150192 (2016).","journal-title":"Phil. Trans. R. Soc. B"},{"key":"754_CR103","doi-asserted-by":"publisher","first-page":"20160244","DOI":"10.1098\/rstb.2016.0244","volume":"372","author":"RI Dunbar","year":"2017","unstructured":"Dunbar, R. I. & Shultz, S. Why are there so many explanations for primate brain evolution? Phil. Trans. R. Soc. B 372, 20160244 (2017).","journal-title":"Phil. Trans. R. Soc. B"},{"key":"754_CR104","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1016\/j.cognition.2015.03.016","volume":"141","author":"S Kirby","year":"2015","unstructured":"Kirby, S., Tamariz, M., Cornish, H. & Smith, K. Compression and communication in the cultural evolution of linguistic structure. Cognition 141, 87\u2013102 (2015).","journal-title":"Cognition"},{"key":"754_CR105","doi-asserted-by":"crossref","unstructured":"Ostrom, E. Understanding Institutional Diversity (Princeton Univ. Press, 2005).","DOI":"10.1515\/9781400831739"},{"key":"754_CR106","unstructured":"Havrylov, S. & Titov, I. Emergence of language with multi-agent games: Learning to communicate with sequences of symbols. Adv. NeurIPS 30, (2017)."},{"key":"754_CR107","doi-asserted-by":"publisher","unstructured":"Mordatch, I. & Abbeel, P. Emergence of grounded compositional language in multi-agent populations. Proc. AAAI Conf. Artif. Intell. 32, https:\/\/doi.org\/10.1609\/aaai.v32i1.11492 (2018).","DOI":"10.1609\/aaai.v32i1.11492"},{"key":"754_CR108","first-page":"1877","volume":"33","author":"T Brown","year":"2020","unstructured":"Brown, T. et al. Language models are few-shot learners. Adv. NeurIPS 33, 1877\u20131901 (2020).","journal-title":"Adv. NeurIPS"},{"key":"754_CR109","unstructured":"Chowdhery, A. et al. PaLM: scaling language modeling with pathways. Preprint at https:\/\/arXiv.org\/abs\/2204.02311 (2022)."},{"key":"754_CR110","first-page":"18878","volume":"35","author":"SC Chan","year":"2022","unstructured":"Chan, S. C. et al. Data distributional properties drive emergent few-shot learning in transformers. Adv. NeurIPS 35, 18878\u201318891 (2022).","journal-title":"Adv. NeurIPS"},{"key":"754_CR111","first-page":"24824","volume":"35","author":"J Wei","year":"2022","unstructured":"Wei, J. et al. Chain of thought prompting elicits reasoning in large language models. Adv. NeurIPS 35, 24824\u201324837 (2022).","journal-title":"Adv. NeurIPS"},{"key":"754_CR112","doi-asserted-by":"crossref","unstructured":"Bisk, Y. et al. Experience grounds language. In Proc. 2020 Conference on Empirical Methods in Natural Language Processing 8718\u20138735 (2020).","DOI":"10.18653\/v1\/2020.emnlp-main.703"},{"key":"754_CR113","unstructured":"Ullman, T. Large language models fail on trivial alterations to theory-of-mind tasks. Preprint at https:\/\/arXiv.org\/abs\/2302.08399 (2023)."},{"key":"754_CR114","unstructured":"Liu, R. et al. Mind\u2019s eye: Grounded language model reasoning through simulation. 11th International Conference on Learning Representations 11 (2023)."},{"key":"754_CR115","unstructured":"Glaese, A. et al. Improving alignment of dialogue agents via targeted human judgements. Preprint at https:\/\/arXiv.org\/abs\/2209.14375 (2022)."},{"key":"754_CR116","doi-asserted-by":"publisher","first-page":"1068","DOI":"10.1038\/s42256-022-00591-4","volume":"4","author":"C Colas","year":"2022","unstructured":"Colas, C., Karch, T., Moulin-Frier, C. & Oudeyer, P.-Y. Language and culture internalization for human-like autotelic AI. Nat. Mach. Intell. 4, 1068\u20131076 (2022).","journal-title":"Nat. Mach. Intell."},{"key":"754_CR117","unstructured":"Villalobos, P. et al. Will we run out of data? An analysis of the limits of scaling datasets in machine learning. Preprint at https:\/\/arXiv.org\/abs\/2211.04325 (2022)."},{"key":"754_CR118","doi-asserted-by":"publisher","first-page":"1152","DOI":"10.1111\/mms.12314","volume":"32","author":"SK Gazda","year":"2016","unstructured":"Gazda, S. K. Driver-barrier feeding behavior in bottlenose dolphins (Tursiops truncatus): new insights from a longitudinal study. Mar. Mammal Sci. 32, 1152\u20131160 (2016).","journal-title":"Mar. Mammal Sci."},{"key":"754_CR119","doi-asserted-by":"publisher","first-page":"105062","DOI":"10.1016\/j.yhbeh.2021.105062","volume":"136","author":"KL Bales","year":"2021","unstructured":"Bales, K. L. et al. What is a pair bond? Horm. Behav. 136, 105062 (2021).","journal-title":"Horm. Behav."},{"key":"754_CR120","doi-asserted-by":"publisher","first-page":"1129","DOI":"10.1111\/ele.13079","volume":"21","author":"D Lukas","year":"2018","unstructured":"Lukas, D. & Clutton-Brock, T. Social complexity and kinship in animal societies. Ecol. Lett. 21, 1129\u20131134 (2018).","journal-title":"Ecol. Lett."},{"key":"754_CR121","doi-asserted-by":"publisher","first-page":"387","DOI":"10.1016\/j.tins.2015.04.004","volume":"38","author":"R Feldman","year":"2015","unstructured":"Feldman, R. The adaptive human parental brain: implications for children\u2019s social development. Trends Neurosci. 38, 387\u2013399 (2015).","journal-title":"Trends Neurosci."},{"key":"754_CR122","doi-asserted-by":"publisher","first-page":"20150767","DOI":"10.1098\/rsbl.2015.0767","volume":"11","author":"B Tarr","year":"2015","unstructured":"Tarr, B., Launay, J., Cohen, E. & Dunbar, R. Synchrony and exertion during dance independently raise pain threshold and encourage social bonding. Biol. Lett. 11, 20150767 (2015).","journal-title":"Biol. Lett."},{"key":"754_CR123","doi-asserted-by":"publisher","first-page":"171","DOI":"10.3389\/fnins.2014.00171","volume":"8","author":"C Lieberwirth","year":"2014","unstructured":"Lieberwirth, C. & Wang, Z. Social bonding: regulation by neuropeptides. Front. Neurosci. 8, 171 (2014).","journal-title":"Front. Neurosci."},{"key":"754_CR124","doi-asserted-by":"publisher","first-page":"1018","DOI":"10.1038\/s41559-019-0907-1","volume":"3","author":"JA \u212bgren","year":"2019","unstructured":"\u212bgren, J. A., Davies, N. G. & Foster, K. R. Enforcement is central to the evolution of cooperation. Nat. Ecol. Evol. 3, 1018\u20131029 (2019).","journal-title":"Nat. Ecol. Evol."},{"key":"754_CR125","doi-asserted-by":"publisher","first-page":"795","DOI":"10.1534\/genetics.114.165423","volume":"197","author":"AS Wilkins","year":"2014","unstructured":"Wilkins, A. S., Wrangham, R. W. & Fitch, W. T. The \u2018domestication syndrome\u2019 in mammals: a unified explanation based on neural crest cell behavior and genetics. Genetics 197, 795\u2013808 (2014).","journal-title":"Genetics"}],"container-title":["Nature Machine Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s42256-023-00754-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-023-00754-x","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-023-00754-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,19]],"date-time":"2023-11-19T22:18:27Z","timestamp":1700432307000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s42256-023-00754-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,11,17]]},"references-count":125,"journal-issue":{"issue":"11","published-online":{"date-parts":[[2023,11]]}},"alternative-id":["754"],"URL":"https:\/\/doi.org\/10.1038\/s42256-023-00754-x","relation":{},"ISSN":["2522-5839"],"issn-type":[{"value":"2522-5839","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,11,17]]},"assertion":[{"value":"9 March 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 September 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 November 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"The authors declare no competing interests","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}