{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,2,4]],"date-time":"2024-02-04T13:23:38Z","timestamp":1707053018344},"reference-count":7,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2010,8,1]],"date-time":"2010-08-01T00:00:00Z","timestamp":1280620800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Artif Life Robotics"],"published-print":{"date-parts":[[2010,8]]},"DOI":"10.1007\/s10015-010-0772-0","type":"journal-article","created":{"date-parts":[[2010,8,26]],"date-time":"2010-08-26T12:06:29Z","timestamp":1282824389000},"page":"97-100","source":"Crossref","is-referenced-by-count":5,"title":["A reinforcement learning with switching controllers for a continuous action space"],"prefix":"10.1007","volume":"15","author":[{"given":"Masato","family":"Nagayoshi","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hajime","family":"Murao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hisashi","family":"Tamaki","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2010,8,27]]},"reference":[{"key":"772_CR1","doi-asserted-by":"crossref","unstructured":"Sutton RS, Barto AG (1998) Reinforcement learning. A Bradford Book, MIT Press","DOI":"10.1016\/S1474-6670(17)38315-5"},{"issue":"2","key":"772_CR2","first-page":"267","volume":"15","author":"H. Kimura","year":"2000","unstructured":"Kimura H, Kobayashi S (2000) An analysis of actor-critic algorithms using eligibility traces: reinforcement learning with imperfect value functions (in Japanese). JSAI J 15(2):267\u2013275","journal-title":"JSAI J"},{"key":"772_CR3","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1016\/S0921-8890(01)00113-0","volume":"36","author":"J. Morimoto","year":"2001","unstructured":"Morimoto J, Doya K (2001) Acquisition of stand-up behavior by a real robot using hierarchical reinforcement learning. Robotics Auton Syst 36:37\u201351","journal-title":"Robotics Auton Syst"},{"issue":"9","key":"772_CR4","first-page":"2121","volume":"J84-D-II","author":"K. Shibata","year":"2001","unstructured":"Shibata K, Nishino T, Okabe Y (2001) Active perception learning system based on actor-Q architecture (in Japanese). T IEICE Jpn, J84-D-II(9), p 2121\u20132130","journal-title":"T IEICE Jpn"},{"issue":"3","key":"772_CR5","first-page":"285","volume":"J84-DI","author":"A. Ito","year":"2001","unstructured":"Ito A, Kanabuchi M (2001) Speeding up multi-agent reinforcement learning by coarse-graining of perception: hunter game as an example (in Japanese). T IEICE Jpn, J84-DI(3), pp 285\u2013293","journal-title":"T IEICE Jpn"},{"key":"772_CR6","unstructured":"Nagayoshi M, Murao H, Tamaki H (2006) A state space filter for reinforcement learning. Proceedings of AROB 11th\u201906, pp 615\u2013618 (GS1-3)"},{"key":"772_CR7","doi-asserted-by":"crossref","unstructured":"Nagayoshi M, Murao H, Tamaki H (2006) A state space filter for reinforcement learning in POMDPs: application to a continuous state space. Proceedings of the SICE-ICSE International Joint Conference 2006, pp 6037\u20136042 (SE18-4)","DOI":"10.1109\/SICE.2006.315203"}],"container-title":["Artificial Life and Robotics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10015-010-0772-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10015-010-0772-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10015-010-0772-0","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,2]],"date-time":"2019-06-02T08:51:14Z","timestamp":1559465474000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10015-010-0772-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010,8]]},"references-count":7,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2010,8]]}},"alternative-id":["772"],"URL":"https:\/\/doi.org\/10.1007\/s10015-010-0772-0","relation":{},"ISSN":["1433-5298","1614-7456"],"issn-type":[{"value":"1433-5298","type":"print"},{"value":"1614-7456","type":"electronic"}],"subject":[],"published":{"date-parts":[[2010,8]]}}}