{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,25]],"date-time":"2025-06-25T06:05:06Z","timestamp":1750831506436,"version":"3.28.0"},"reference-count":18,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,6,30]],"date-time":"2024-06-30T00:00:00Z","timestamp":1719705600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,6,30]],"date-time":"2024-06-30T00:00:00Z","timestamp":1719705600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,6,30]]},"DOI":"10.1109\/cec60901.2024.10611794","type":"proceedings-article","created":{"date-parts":[[2024,8,8]],"date-time":"2024-08-08T17:55:15Z","timestamp":1723139715000},"page":"1-8","source":"Crossref","is-referenced-by-count":1,"title":["A Reinforcement Learning Method Based on Natural Evolution Strategies"],"prefix":"10.1109","author":[{"given":"Koki","family":"Kimura","sequence":"first","affiliation":[{"name":"Tokyo Institute of Technology,Yokohama,Japan"}]},{"given":"Isao","family":"Ono","sequence":"additional","affiliation":[{"name":"Tokyo Institute of Technology,Yokohama,Japan"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.120495"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2022.3207346"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1007\/s11704-020-0241-4"},{"key":"ref4","first-page":"1889","article-title":"Trust region policy optimization","volume-title":"International conference on machine learning","author":"Schulman"},{"key":"ref5","article-title":"Proximal policy optimization algorithms","author":"Schulman","year":"2017","journal-title":"arXiv preprint"},{"key":"ref6","article-title":"Continuous control with deep reinforcement learning","author":"Lillicrap","year":"2015","journal-title":"arXiv preprint"},{"key":"ref7","first-page":"1861","article-title":"Soft actor-critic: Off-policy maximum entropy deep reinforcement learning with a stochastic actor","volume-title":"International conference on machine learning","author":"Haarnoja"},{"key":"ref8","article-title":"Evolution strategies as a scalable alternative to reinforcement learning","author":"Salimans","year":"2017","journal-title":"arXiv preprint"},{"key":"ref9","article-title":"Simple random search of static linear policies is competitive for reinforcement learning","volume":"31","author":"Mania","year":"2018","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2020\/205"},{"key":"ref11","first-page":"970","article-title":"Structured evolution with compact architectures for scalable policy optimization","volume-title":"International Conference on Machine Learning","author":"Choromanski"},{"volume-title":"Random optimization, automat. remote control","year":"1965","author":"Matyas","key":"ref12"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6386109"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/1830483.1830557"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/cec.2008.4631255"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.2008.4631255"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1017\/S0305004100031455"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/0304-4076(88)90027-9"}],"event":{"name":"2024 IEEE Congress on Evolutionary Computation (CEC)","start":{"date-parts":[[2024,6,30]]},"location":"Yokohama, Japan","end":{"date-parts":[[2024,7,5]]}},"container-title":["2024 IEEE Congress on Evolutionary Computation (CEC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10609966\/10611750\/10611794.pdf?arnumber=10611794","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,11]],"date-time":"2024-08-11T04:21:24Z","timestamp":1723350084000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10611794\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,30]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/cec60901.2024.10611794","relation":{},"subject":[],"published":{"date-parts":[[2024,6,30]]}}}