{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:25:55Z","timestamp":1750220755416,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":7,"publisher":"ACM","license":[{"start":{"date-parts":[[2020,7,8]],"date-time":"2020-07-08T00:00:00Z","timestamp":1594166400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"DARPA\/MTO","award":["FA8750-18-C-0103"],"award-info":[{"award-number":["FA8750-18-C-0103"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2020,7,8]]},"DOI":"10.1145\/3377929.3389946","type":"proceedings-article","created":{"date-parts":[[2020,8,26]],"date-time":"2020-08-26T15:26:55Z","timestamp":1598455615000},"page":"77-78","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Safer reinforcement learning through evolved instincts"],"prefix":"10.1145","author":[{"given":"Djordje","family":"Grbic","sequence":"first","affiliation":[{"name":"IT University Copenhagen"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sebastian","family":"Risi","sequence":"additional","affiliation":[{"name":"IT University Copenhagen"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2020,7,8]]},"reference":[{"volume-title":"Constrained Markov decision processes","author":"Altman Eitan","key":"e_1_3_2_1_1_1","doi-asserted-by":"crossref","DOI":"10.1201\/9781315140223"},{"volume-title":"Meta Learning by the Baldwin Effect. arXiv preprint arXiv:1806.07917","year":"2018","author":"Fernando Chrisantha Thomas","key":"e_1_3_2_1_2_1"},{"volume-title":"Model-agnostic meta-learning for fast adaptation of deep networks. arXiv preprint arXiv:1703.03400","year":"2017","author":"Finn Chelsea","key":"e_1_3_2_1_3_1"},{"volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","year":"2014","author":"Kingma Diederik P","key":"e_1_3_2_1_4_1"},{"volume-title":"Combating deep reinforcement learning's sisyphean curse with reinforcement learning. arXiv preprint arXiv:1611.01211","year":"2016","author":"Lipton Zachary C","key":"e_1_3_2_1_5_1"},{"key":"e_1_3_2_1_6_1","unstructured":"Alex Ray Joshua Achiam and Dario Amodei. [n. d.]. Benchmarking Safe Exploration in Deep Reinforcement Learning. ([n. d.]).  Alex Ray Joshua Achiam and Dario Amodei. [n. d.]. Benchmarking Safe Exploration in Deep Reinforcement Learning. ([n. d.])."},{"key":"e_1_3_2_1_7_1","unstructured":"John Schulman Filip Wolski Prafulla Dhariwal Alec Radford and Oleg Klimov. 2017. Proximal Policy Optimization Algorithms. (2017). arXiv:cs.LG\/1707.06347  John Schulman Filip Wolski Prafulla Dhariwal Alec Radford and Oleg Klimov. 2017. Proximal Policy Optimization Algorithms. (2017). arXiv:cs.LG\/1707.06347"}],"event":{"name":"GECCO '20: Genetic and Evolutionary Computation Conference","sponsor":["SIGEVO ACM Special Interest Group on Genetic and Evolutionary Computation"],"location":"Canc\u00fan Mexico","acronym":"GECCO '20"},"container-title":["Proceedings of the 2020 Genetic and Evolutionary Computation Conference Companion"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3377929.3389946","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3377929.3389946","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T22:39:00Z","timestamp":1750199940000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3377929.3389946"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,7,8]]},"references-count":7,"alternative-id":["10.1145\/3377929.3389946","10.1145\/3377929"],"URL":"https:\/\/doi.org\/10.1145\/3377929.3389946","relation":{},"subject":[],"published":{"date-parts":[[2020,7,8]]},"assertion":[{"value":"2020-07-08","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}