{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,11]],"date-time":"2024-09-11T19:46:07Z","timestamp":1726083967163},"publisher-location":"Cham","reference-count":39,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030399573"},{"type":"electronic","value":"9783030399580"}],"license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-39958-0_6","type":"book-chapter","created":{"date-parts":[[2020,5,7]],"date-time":"2020-05-07T13:29:08Z","timestamp":1588858148000},"page":"101-119","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Temporal Memory Sharing in Visual Reinforcement Learning"],"prefix":"10.1007","author":[{"given":"Stephen","family":"Kelly","sequence":"first","affiliation":[]},{"given":"Wolfgang","family":"Banzhaf","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,5,8]]},"reference":[{"key":"6_CR1","unstructured":"A. Simon, H.: The architecture of complexity. Proceedings of the American Philosophical Society 106, 467\u2013482 (1962)"},{"key":"6_CR2","doi-asserted-by":"crossref","unstructured":"Agapitos, A., Brabazon, A., O\u2019Neill, M.: Genetic programming with memory for financial trading. In: G. Squillero, P. Burelli (eds.) Applications of Evolutionary Computation, pp. 19\u201334. Springer International Publishing (2016)","DOI":"10.1007\/978-3-319-31204-0_2"},{"key":"6_CR3","doi-asserted-by":"crossref","unstructured":"Atkins, D., Neshatian, K., Zhang, M.: A domain independent genetic programming approach to automatic feature extraction for image classification. In: 2011 IEEE Congress of Evolutionary Computation (CEC), pp. 238\u2013245 (2011)","DOI":"10.1109\/CEC.2011.5949624"},{"key":"6_CR4","unstructured":"Beattie, C., Leibo, J.Z., Teplyashin, D., Ward, T., Wainwright, M., K\u00fcttler, H., Lefrancq, A., Green, S., Vald\u00e9s, V., Sadik, A., Schrittwieser, J., Anderson, K., York, S., Cant, M., Cain, A., Bolton, A., Gaffney, S., King, H., Hassabis, D., Legg, S., Petersen, S.: Deepmind lab. arXiv preprint arXiv:1612.03801 (2016)"},{"key":"6_CR5","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1613\/jair.3912","volume":"47","author":"MG Bellemare","year":"2013","unstructured":"Bellemare, M.G., Naddaf, Y., Veness, J., Bowling, M.: The arcade learning environment: An evaluation platform for general agents. Journal of Artificial Intelligence Research 47, 253\u2013279 (2013)","journal-title":"Journal of Artificial Intelligence Research"},{"key":"6_CR6","unstructured":"Bishop, C.M.: Pattern Recognition and Machine Learning (Information Science and Statistics). Springer-Verlag (2006)"},{"key":"6_CR7","unstructured":"Brameier, M., Banzhaf, W.: Linear Genetic Programming, 1st edn. Springer (2007)"},{"key":"6_CR8","doi-asserted-by":"crossref","unstructured":"Brave, S.: The evolution of memory and mental models using genetic programming. In: Proceedings of the 1st Annual Conference on Genetic Programming, pp. 261\u2013266. MIT Press (1996)","DOI":"10.7551\/mitpress\/3242.003.0036"},{"key":"6_CR9","unstructured":"Choi, S.P.M., Yeung, D.Y., Zhang, N.L.: An environment model for nonstationary reinforcement learning. In: S.A. Solla, T.K. Leen, K. M\u00fcller (eds.) Advances in Neural Information Processing Systems 12, pp. 987\u2013993. MIT Press (2000)"},{"key":"6_CR10","doi-asserted-by":"publisher","first-page":"113","DOI":"10.1007\/BFb0055932","volume-title":"Genetic Programming","author":"M Conrads","year":"1998","unstructured":"Conrads, M., Nordin, P., Banzhaf, W.: Speech sound discrimination with genetic programming. In: W. Banzhaf, R. Poli, M. Schoenauer, T.C. Fogarty (eds.) Genetic Programming, pp. 113\u2013129. Springer Berlin Heidelberg (1998)"},{"issue":"3","key":"6_CR11","doi-asserted-by":"publisher","first-page":"490","DOI":"10.1016\/j.neuron.2017.05.039","volume":"95","author":"RL Davis","year":"2017","unstructured":"Davis, R.L., Zhong, Y.: The Biology of Forgetting \u2013 A Perspective. Neuron 95(3), 490\u2013503 (2017)","journal-title":"Neuron"},{"key":"6_CR12","doi-asserted-by":"crossref","unstructured":"Greve, R.B., Jacobsen, E.J., Risi, S.: Evolving neural turing machines for reward-based learning. In: Proceedings of the Genetic and Evolutionary Computation Conference 2016, GECCO \u201916, pp. 117\u2013124. ACM (2016)","DOI":"10.1145\/2908812.2908930"},{"key":"6_CR13","unstructured":"Hasselt, H.v., Guez, A., Silver, D.: Deep reinforcement learning with double q-learning. In: Proceedings of the Thirtieth AAAI Conference on Artificial Intelligence, AAAI\u201916, pp. 2094\u20132100. AAAI Press (2016)"},{"issue":"4","key":"6_CR14","doi-asserted-by":"publisher","first-page":"355","DOI":"10.1109\/TCIAIG.2013.2294713","volume":"6","author":"M Hausknecht","year":"2014","unstructured":"Hausknecht, M., Lehman, J., Miikkulainen, R., Stone, P.: A neuroevolution approach to general Atari game playing. IEEE Transactions on Computational Intelligence and AI in Games 6(4), 355\u2013366 (2014)","journal-title":"IEEE Transactions on Computational Intelligence and AI in Games"},{"key":"6_CR15","doi-asserted-by":"crossref","unstructured":"Haynes, T.D., Wainwright, R.L.: A simulation of adaptive agents in a hostile environment. In: Proceedings of the 1995 ACM Symposium on Applied Computing, SAC \u201995, pp. 318\u2013323. ACM (1995)","DOI":"10.1145\/315891.316007"},{"key":"6_CR16","unstructured":"Hintze, A., Edlund, J.A., Olson, R.S., Knoester, D.B., Schossau, J., Albantakis, L., Tehrani-Saleh, A., Kvam, P.D., Sheneman, L., Goldsby, H., Bohm, C., Adami, C.: Markov brains: A technical introduction. arXiv preprint 1709.05601 (2017)"},{"key":"6_CR17","doi-asserted-by":"crossref","unstructured":"Hintze, A., Schossau, J., Bohm, C.: The evolutionary buffet method. In: W. Banzhaf, L. Spector, L. Sheneman (eds.) Genetic Programming Theory and Practice XVI, Genetic and Evolutionary Computation Series, pp. 17\u201336. Springer (2018)","DOI":"10.1007\/978-3-030-04735-1_2"},{"issue":"6443","key":"6_CR18","doi-asserted-by":"publisher","first-page":"859","DOI":"10.1126\/science.aau6249","volume":"364","author":"M Jaderberg","year":"2019","unstructured":"Jaderberg, M., Czarnecki, W.M., Dunning, I., Marris, L., Lever, G., Casta\u00f1eda, A.G., Beattie, C., Rabinowitz, N.C., Morcos, A.S., Ruderman, A., Sonnerat, N., Green, T., Deason, L., Leibo, J.Z., Silver, D., Hassabis, D., Kavukcuoglu, K., Graepel, T.: Human-level performance in 3d multiplayer games with population-based reinforcement learning. Science 364(6443), 859\u2013865 (2019)","journal-title":"Science"},{"key":"6_CR19","unstructured":"Kelly, S.: Scaling genetic programming to challenging reinforcement tasks through emergent modularity. Ph.D. thesis, Faculty of Computer Science, Dalhousie University (2018)"},{"issue":"3","key":"6_CR20","doi-asserted-by":"publisher","first-page":"347","DOI":"10.1162\/evco_a_00232","volume":"26","author":"S Kelly","year":"2018","unstructured":"Kelly, S., Heywood, M.I.: Emergent solutions to high-dimensional multitask reinforcement learning. Evolutionary Computation 26(3), 347\u2013380 (2018)","journal-title":"Evolutionary Computation"},{"key":"6_CR21","doi-asserted-by":"crossref","unstructured":"Kelly, S., Smith, R.J., Heywood, M.I.: Emergent Policy Discovery for Visual Reinforcement Learning Through Tangled Program Graphs: A Tutorial, pp. 37\u201357. Springer International Publishing (2019)","DOI":"10.1007\/978-3-030-04735-1_3"},{"key":"6_CR22","doi-asserted-by":"crossref","unstructured":"Kober, J., Peters, J.: Reinforcement learning in robotics: A survey. In: M. Wiering, M. van Otterio (eds.) Reinforcement Learning, pp. 579\u2013610. Springer (2012)","DOI":"10.1007\/978-3-642-27645-3_18"},{"key":"6_CR23","doi-asserted-by":"crossref","unstructured":"Koza, J.R., Andre, D., Bennett, F.H., Keane, M.A.: Genetic Programming III: Darwinian Invention & Problem Solving, 1st edn. Morgan Kaufmann Publishers Inc. (1999)","DOI":"10.1109\/TEVC.1999.788530"},{"key":"6_CR24","doi-asserted-by":"crossref","unstructured":"Krawiec, K., Bhanu, B.: Visual learning by coevolutionary feature synthesis. IEEE Transactions on Systems, Man, and Cybernetics, Part B (Cybernetics) 35(3), 409\u2013425 (2005)","DOI":"10.1109\/TSMCB.2005.846644"},{"key":"6_CR25","doi-asserted-by":"crossref","unstructured":"Lalejini, A., Ofria, C.: What Else Is in an Evolved Name? Exploring Evolvable Specificity with SignalGP. In: W. Banzhaf, L. Spector, L. Sheneman (eds.) Genetic Programming Theory and Practice XVI, pp. 103\u2013121. Springer International Publishing (2019)","DOI":"10.1007\/978-3-030-04735-1_6"},{"issue":"2","key":"6_CR26","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1007\/s12530-015-9128-2","volume":"6","author":"E Lughofer","year":"2015","unstructured":"Lughofer, E., Sayed-Mouchaweh, M.: Adaptive and on-line learning in non-stationary environments. Evolving Systems 6(2), 75\u201377 (2015)","journal-title":"Evolving Systems"},{"issue":"1","key":"6_CR27","first-page":"523","volume":"61","author":"MC Machado","year":"2018","unstructured":"Machado, M.C., Bellemare, M.G., Talvitie, E., Veness, J., Hausknecht, M., Bowling, M.: Revisiting the arcade learning environment: Evaluation protocols and open problems for general agents. J. Artif. Int. Res. 61(1), 523\u2013562 (2018)","journal-title":"J. Artif. Int. Res."},{"key":"6_CR28","unstructured":"Mnih, V., Badia, A.P., Mirza, M., Graves, A., Lillicrap, T., Harley, T., Silver, D., Kavukcuoglu, K.: Asynchronous methods for deep reinforcement learning. In: M.F. Balcan, K.Q. Weinberger (eds.) Proceedings of The 33rd International Conference on Machine Learning, Proceedings of Machine Learning Research, vol. 48, pp. 1928\u20131937. PMLR (2016)"},{"key":"6_CR29","unstructured":"Mnih, V., Heess, N., Graves, A., Kavukcuoglu, K.: Recurrent models of visual attention. In: Proceedings of the 27th International Conference on Neural Information Processing Systems - Volume 2, NIPS\u201914, pp. 2204\u20132212. MIT Press (2014)"},{"issue":"7540","key":"6_CR30","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1038\/nature14236","volume":"518","author":"V Mnih","year":"2015","unstructured":"Mnih, V., Kavukcuoglu, K., Silver, D., Rusu, A.A., Veness, J., Bellemare, M.G., Graves, A., Riedmiller, M., Fidjeland, A.K., Ostrovski, G., Petersen, S., Beattie, C., Sadik, A., Antonoglou, I., King, H., Kumaran, D., Wierstra, D., Legg, S., Hassabis, D.: Human-level control through deep reinforcement learning. Nature 518(7540), 529\u2013533 (2015)","journal-title":"Nature"},{"key":"6_CR31","unstructured":"Schaul, T., Quan, J., Antonoglou, I., Silver, D.: Prioritized experience replay. In: International Conference on Learning Representations (2016)"},{"key":"6_CR32","doi-asserted-by":"crossref","unstructured":"Smith, R.J., Heywood, M.I.: A model of external memory for navigation in partially observable visual reinforcement learning tasks. In: L. Sekanina, T. Hu, N. Louren\u00e7o, H. Richter, P. Garc\u00eda-S\u00e1nchez (eds.) Genetic Programming, pp. 162\u2013177. Springer International Publishing (2019)","DOI":"10.1007\/978-3-030-16670-0_11"},{"key":"6_CR33","doi-asserted-by":"crossref","unstructured":"Stanley, K.O., Miikkulainen, R.: Evolving a Roving Eye for Go. In: T. Kanade, J. Kittler, J.M. Kleinberg, F. Mattern, J.C. Mitchell, M. Naor, O. Nierstrasz, C. Pandu Rangan, B. Steffen, M. Sudan, D. Terzopoulos, D. Tygar, M.Y. Vardi, G. Weikum, K. Deb (eds.) Genetic and Evolutionary Computation \u2014 GECCO 2004, vol. 3103, pp. 1226\u20131238. Springer Berlin Heidelberg, Berlin, Heidelberg (2004)","DOI":"10.1007\/978-3-540-24855-2_130"},{"key":"6_CR34","doi-asserted-by":"crossref","unstructured":"Sutton, R.R., Barto, A.G.: Reinforcement Learning: An introduction. MIT Press (1998)","DOI":"10.1109\/TNN.1998.712192"},{"key":"6_CR35","first-page":"136","volume":"1","author":"A Teller","year":"1994","unstructured":"Teller, A.: Turing completeness in the language of genetic programming with indexed memory. In: Proceedings of the First IEEE Conference on Evolutionary Computation. IEEE World Congress on Computational Intelligence, vol. 1, pp. 136\u2013141 (1994)","journal-title":"In: Proceedings of the First IEEE Conference on Evolutionary Computation. IEEE World Congress on Computational Intelligence"},{"issue":"3","key":"6_CR36","doi-asserted-by":"publisher","first-page":"967","DOI":"10.1111\/j.1558-5646.1996.tb02339.x","volume":"50","author":"GP Wagner","year":"1996","unstructured":"Wagner, G.P., Altenberg, L.: Perspective: Complex adaptations and the evolution of evolvability. Evolution 50(3), 967\u2013976 (1996)","journal-title":"Evolution"},{"key":"6_CR37","unstructured":"Wang, Z., Schaul, T., Hessel, M., Van Hasselt, H., Lanctot, M., De Freitas, N.: Dueling network architectures for deep reinforcement learning. In: Proceedings of the 33rd International Conference on International Conference on Machine Learning - Volume 48, ICML\u201916, pp. 1995\u20132003. JMLR.org (2016)"},{"issue":"4","key":"6_CR38","doi-asserted-by":"publisher","first-page":"445","DOI":"10.1162\/106454605774270589","volume":"11","author":"RA Watson","year":"2005","unstructured":"Watson, R.A., Pollack, J.B.: Modular interdependency in complex dynamical systems. Artificial Life 11(4), 445\u2013457 (2005)","journal-title":"Artificial Life"},{"key":"6_CR39","doi-asserted-by":"crossref","unstructured":"Wilson, D.G., Cussat-Blanc, S., Luga, H., Miller, J.F.: Evolving simple programs for playing atari games. In: Proceedings of the Genetic and Evolutionary Computation Conference, GECCO \u201918, pp. 229\u2013236. ACM (2018)","DOI":"10.1145\/3205455.3205578"}],"container-title":["Genetic and Evolutionary Computation","Genetic Programming Theory and Practice XVII"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-39958-0_6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,5]],"date-time":"2024-08-05T13:03:21Z","timestamp":1722863001000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-030-39958-0_6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"ISBN":["9783030399573","9783030399580"],"references-count":39,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-39958-0_6","relation":{},"ISSN":["1932-0167","1932-0175"],"issn-type":[{"type":"print","value":"1932-0167"},{"type":"electronic","value":"1932-0175"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"8 May 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}