{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T16:43:51Z","timestamp":1765039431164,"version":"3.37.3"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2019,1,8]],"date-time":"2019-01-08T00:00:00Z","timestamp":1546905600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100005856","name":"Faculdade de Ci\u00eancias e Tecnologia, Universidade Nova de Lisboa","doi-asserted-by":"crossref","award":["PD\/BD\/113963\/2015"],"award-info":[{"award-number":["PD\/BD\/113963\/2015"]}],"id":[{"id":"10.13039\/501100005856","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100005856","name":"Faculdade de Ci\u00eancias e Tecnologia, Universidade Nova de Lisboa","doi-asserted-by":"publisher","award":["PEst-OE\/EEI\/UI0027\/2013","UID\/CEC\/00127\/2013"],"award-info":[{"award-number":["PEst-OE\/EEI\/UI0027\/2013","UID\/CEC\/00127\/2013"]}],"id":[{"id":"10.13039\/501100005856","id-type":"DOI","asserted-by":"publisher"}]},{"name":"EuRoC","award":["FP7-2013-NMP-ICT-FOF"],"award-info":[{"award-number":["FP7-2013-NMP-ICT-FOF"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Intell Robot Syst"],"published-print":{"date-parts":[[2019,11]]},"DOI":"10.1007\/s10846-018-0968-4","type":"journal-article","created":{"date-parts":[[2019,1,9]],"date-time":"2019-01-09T04:18:42Z","timestamp":1547007522000},"page":"141-157","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Contextual Direct Policy Search"],"prefix":"10.1007","volume":"96","author":[{"given":"Abbas","family":"Abdolmaleki","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6464-8012","authenticated-orcid":false,"given":"David","family":"Sim\u00f5es","sequence":"additional","affiliation":[]},{"given":"Nuno","family":"Lau","sequence":"additional","affiliation":[]},{"given":"Lu\u00eds Paulo","family":"Reis","sequence":"additional","affiliation":[]},{"given":"Gerhard","family":"Neumann","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,1,8]]},"reference":[{"key":"968_CR1","first-page":"1","volume":"10","author":"A Abdolmaleki","year":"2016","unstructured":"Abdolmaleki, A., Lau, N., Reis, L.P., Peters, J., Neumann, G.: Contextual policy search for linear and nonlinear generalization of a humanoid walking controller. J. Intell. Robot. Syst. 10, 1\u201316 (2016)","journal-title":"J. Intell. Robot. Syst."},{"key":"968_CR2","doi-asserted-by":"crossref","unstructured":"Abdolmaleki, A., Lioutikov, R., Peters, J., Lua, N., Reis, L., Neumann, G.: Regularized Covariance Estimation for Weighted Maximum Likelihood Policy Search Methods. In: Advances in Neural Information Processing Systems (NIPS). MIT Press (2015)","DOI":"10.1109\/HUMANOIDS.2015.7363529"},{"key":"968_CR3","doi-asserted-by":"crossref","unstructured":"Abdolmaleki, A., Lua, N., Reis, L., Neumann, G.: Regularized covariance estimation for weighted maximum likelihood policy search methods. In: Proceedings of the International Conference on Humanoid Robots (HUMANOIDS) (2015)","DOI":"10.1109\/HUMANOIDS.2015.7363529"},{"key":"968_CR4","doi-asserted-by":"crossref","unstructured":"Abdolmaleki, A., Lua, N., Reis, L., Peters, J., Neumann, G.: Contextual Policy Search for Generalizing a Parameterized Biped Walking Controller. In: IEEE International Conference on Autonomous Robot Systems and Competitions (ICARSC) (2015)","DOI":"10.1109\/ICARSC.2015.43"},{"key":"968_CR5","doi-asserted-by":"crossref","unstructured":"Abdolmaleki, A., Simoes, D., Lau, N., Reis, L.P., Neumann, G.: Contextual Relative Entropy Policy Search with Covariance Matrix Adaptation. In: 2016 IEEE International Conference On Autonomous Robot Systems and Competitions (ICARSC), pp. 94\u201399. IEEE (2016)","DOI":"10.1109\/ICARSC.2016.31"},{"key":"968_CR6","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511804441","volume-title":"Convex optimization","author":"S Boyd","year":"2004","unstructured":"Boyd, S., Vandenberghe, L.: Convex optimization. University Press, Cambridge (2004)"},{"key":"968_CR7","unstructured":"Broomhead, D.S., Lowe, D.: Radial Basis Functions, Multi-Variable Functional Interpolation and Adaptive Networks. Tech. rep., DTIC Document (1988)"},{"key":"968_CR8","unstructured":"Da Silva, B., Konidaris, G., Barto, A.: Learning parameterized skills. International Conference on Machine Learning (ICML) (2012)"},{"key":"968_CR9","unstructured":"Daniel, C., Neumann, G., Peters, J.: Hierarchical Relative Entropy Policy Search. In: International Conference on Artificial Intelligence and Statistics (AISTATS) (2012)"},{"key":"968_CR10","doi-asserted-by":"crossref","unstructured":"Deisenroth, M.P., Englert, P., Peters, J., Fox, D.: Multi-task Policy Search for Robotics. In: IEEE International Conference on Robotics and Automation (ICRA) (2014)","DOI":"10.1109\/ICRA.2014.6907421"},{"key":"968_CR11","unstructured":"Ha, S., Liu, C.: Evolutionary optimization for parameterized whole-body dynamic motor skills. In: Proceedings of IEEE International Conference on Robotics and Automation (ICRA) (2016)"},{"key":"968_CR12","doi-asserted-by":"crossref","unstructured":"Hansen, N., Muller, S., Koumoutsakos, P.: Reducing the Time Complexity of the Derandomized Evolution Strategy with Covariance Matrix Adaptation (CMA-ES). Evolutionary Computation (2003)","DOI":"10.1162\/106365603321828970"},{"issue":"2","key":"968_CR13","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1162\/106365601750190398","volume":"9","author":"N Hansen","year":"2001","unstructured":"Hansen, N., Ostermeier, A.: Completely derandomized self-adaptation in evolution strategies. Evol. Comput. 9(2), 159\u2013195 (2001)","journal-title":"Evol. Comput."},{"key":"968_CR14","doi-asserted-by":"crossref","unstructured":"Igel, C., Suttorp, T., Hansen, N.: A computational efficient covariance matrix update and a (1 + 1)-CMA for evolution strategies. In: Proceedings of the 8th annual conference on Genetic and evolutionary computation (2006)","DOI":"10.1145\/1143997.1144082"},{"key":"968_CR15","unstructured":"Ijspeert, A., Schaal, S.: Learning Attractor Landscapes for Learning Motor Primitives. In: Advances in Neural Information Processing Systems 15(NIPS) (2003)"},{"key":"968_CR16","doi-asserted-by":"crossref","unstructured":"Kober, J., Oztop, E., Peters, J.: Reinforcement Learning to adjust Robot Movements to New Situations. In: Proceedings of the Robotics: Science and Systems Conference (RSS) (2010)","DOI":"10.15607\/RSS.2010.VI.005"},{"key":"968_CR17","first-page":"1","volume":"8","author":"J Kober","year":"2010","unstructured":"Kober, J., Peters, J.: Policy Search for Motor Primitives in Robotics. Mach. Learn. 8, 1\u201333 (2010)","journal-title":"Mach. Learn."},{"key":"968_CR18","unstructured":"Kupcsik, A., Deisenroth, M.P., Peters, J., Neumann, G.: Data-Efficient contextual policy search for robot movement skills. In: Proceedings of the National Conference on Artificial Intelligence (AAAI) (2013)"},{"key":"968_CR19","unstructured":"Mannor, S., Rubinstein, R., Gat, Y.: The Cross Entropy method for Fast Policy Search. In: Proceedings of the 20th International Conference on Machine Learning (ICML) (2003)"},{"key":"968_CR20","unstructured":"Molga, M., Smutnicki, C.: Test Functions for Optimization Needs. In: http:\/\/www.zsd.ict.pwr.wroc.pl\/files\/docs\/functions.pdf (2005)"},{"key":"968_CR21","unstructured":"Niehaus, C., R\u00f6fer, T., Laue, T.: Gait optimization on a humanoid robot using particle swarm optimization. In: Proceedings of the Second Workshop on Humanoid Soccer Robots in conjunction with the, pp. 1\u20137 (2007)"},{"key":"968_CR22","doi-asserted-by":"crossref","unstructured":"Peters, J., M\u00fclling, K., Altun, Y.: Relative Entropy Policy Search. In: Proceedings of the 24th National Conference on Artificial Intelligence (AAAI). AAAI Press (2010)","DOI":"10.1609\/aaai.v24i1.7727"},{"key":"968_CR23","unstructured":"R\u00fcckstie\u00df, T., Felder, M., Schmidhuber, J.: State-dependent Exploration for Policy Gradient Methods. In: Proceedings of the European Conference on Machine Learning (ECML) (2008)"},{"key":"968_CR24","doi-asserted-by":"crossref","unstructured":"Stulp, F., Raiola, G., Hoarau, A., Ivaldi, S., Sigaud, O.: Learning Compact Parameterized Skills with a Single Regression. In: IEEE-RAS International Conference on Humanoid Robots (Humanoids) (2013)","DOI":"10.1109\/HUMANOIDS.2013.7030008"},{"key":"968_CR25","unstructured":"Stulp, F., Sigaud, O.: Path Integral Policy Improvement with Covariance Matrix Adaptation. In: International Conference on Machine Learning (ICML) (2012)"},{"key":"968_CR26","unstructured":"Suganthan, P.N., Hansen, N., Liang, J.J., Deb, K., Chen, Y.P., Auger, A., Tiwari, S.: Problem Definitions and Evaluation Criteria for the CEC 2005 Special Session on Real-Parameter Optimization. Tech. rep., Nanyang Technological University, Singapore (2005)"},{"key":"968_CR27","doi-asserted-by":"publisher","unstructured":"Sun, Y., Wierstra, D., Schaul, T., Schmidhuber, J.: Efficient Natural Evolution Strategies. In: Proceedings of the 11th Annual conference on Genetic and evolutionary computation(GECCO). https:\/\/doi.org\/10.1145\/1569901.1569976 (2009)","DOI":"10.1145\/1569901.1569976"},{"key":"968_CR28","unstructured":"Theodorou, E., Buchli, J., Schaal, S.: A Generalized Path Integral Control Approach to Reinforcement Learning. The Journal of Machine Learning Research (2010)"},{"issue":"5","key":"968_CR29","first-page":"168","volume":"28","author":"JM Wang","year":"2009","unstructured":"Wang, J.M., Fleet, D.J., Hertzmann, A.: Optimizing walking controllers. ACM Trans. Graph. (TOG) 28(5), 168 (2009)","journal-title":"ACM Trans. Graph. (TOG)"},{"key":"968_CR30","doi-asserted-by":"crossref","unstructured":"Wierstra, D., Schaul, T., Peters, J., Schmidhuber, J.: Fitness Expectation Maximization. In: International Conference on Parallel Problem Solving from Nature, pp. 337\u2013346. Springer (2008)","DOI":"10.1007\/978-3-540-87700-4_34"}],"container-title":["Journal of Intelligent &amp; Robotic Systems"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10846-018-0968-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10846-018-0968-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10846-018-0968-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,12]],"date-time":"2023-09-12T19:51:54Z","timestamp":1694548314000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10846-018-0968-4"}},"subtitle":["With Regularized Covariance Matrix Estimation"],"short-title":[],"issued":{"date-parts":[[2019,1,8]]},"references-count":30,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2019,11]]}},"alternative-id":["968"],"URL":"https:\/\/doi.org\/10.1007\/s10846-018-0968-4","relation":{},"ISSN":["0921-0296","1573-0409"],"issn-type":[{"type":"print","value":"0921-0296"},{"type":"electronic","value":"1573-0409"}],"subject":[],"published":{"date-parts":[[2019,1,8]]},"assertion":[{"value":"14 December 2017","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 December 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 January 2019","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}