{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T10:20:12Z","timestamp":1729678812416,"version":"3.28.0"},"reference-count":8,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015,10]]},"DOI":"10.1109\/urai.2015.7358908","type":"proceedings-article","created":{"date-parts":[[2015,12,17]],"date-time":"2015-12-17T16:58:33Z","timestamp":1450371513000},"page":"465-469","source":"Crossref","is-referenced-by-count":3,"title":["Optimization of fish-like locomotion using hierarchical reinforcement learning"],"prefix":"10.1109","author":[{"given":"Jeonghyeon","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jinwhan","family":"Kim","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/S0004-3702(99)00052-1"},{"article-title":"Learning from delayed rewards","year":"1989","author":"watkins","key":"ref3"},{"key":"ref6","doi-asserted-by":"crossref","first-page":"227","DOI":"10.1613\/jair.639","article-title":"Hierarchical reinforcement learning with the maxq value function decomposition","volume":"13","author":"dietterich","year":"2000","journal-title":"J Artif Intell Res (JAIR)"},{"key":"ref5","first-page":"556","article-title":"Intra-option learning about temporally abstract actions","volume":"98","author":"sutton","year":"1998","journal-title":"ICML"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ROBOT.2000.844093"},{"key":"ref7","first-page":"1043","article-title":"Reinforcement learning with hierarchies of machines","author":"parr","year":"1998","journal-title":"Advances in neural information processing systems"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1017\/S0022112060001110"},{"key":"ref1","doi-asserted-by":"crossref","DOI":"10.5962\/p.203769","article-title":"The locomotion of fishes","author":"breder","year":"1926"}],"event":{"name":"2015 12th International Conference on Ubiquitous Robots and Ambient Intelligence (URAI)","start":{"date-parts":[[2015,10,28]]},"location":"Goyang, South Korea","end":{"date-parts":[[2015,10,30]]}},"container-title":["2015 12th International Conference on Ubiquitous Robots and Ambient Intelligence (URAI)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7347046\/7358803\/07358908.pdf?arnumber=7358908","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,29]],"date-time":"2022-05-29T13:32:28Z","timestamp":1653831148000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7358908\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,10]]},"references-count":8,"URL":"https:\/\/doi.org\/10.1109\/urai.2015.7358908","relation":{},"subject":[],"published":{"date-parts":[[2015,10]]}}}