{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,19]],"date-time":"2025-11-19T06:52:14Z","timestamp":1763535134400,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":20,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642238079"},{"type":"electronic","value":"9783642238086"}],"license":[{"start":{"date-parts":[[2011,1,1]],"date-time":"2011-01-01T00:00:00Z","timestamp":1293840000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2011]]},"DOI":"10.1007\/978-3-642-23808-6_1","type":"book-chapter","created":{"date-parts":[[2011,8,18]],"date-time":"2011-08-18T07:40:29Z","timestamp":1313653229000},"page":"1-17","source":"Crossref","is-referenced-by-count":5,"title":["Sparse Kernel-SARSA(\u03bb) with an Eligibility Trace"],"prefix":"10.1007","author":[{"given":"Matthew","family":"Robards","sequence":"first","affiliation":[]},{"given":"Peter","family":"Sunehag","sequence":"additional","affiliation":[]},{"given":"Scott","family":"Sanner","sequence":"additional","affiliation":[]},{"given":"Bhaskara","family":"Marthi","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"1_CR1","doi-asserted-by":"crossref","unstructured":"Aronszajn, N.: Theory of reproducing kernels. Transactions of the American Mathematical Society\u00a068 (1950)","DOI":"10.21236\/ADA296533"},{"key":"1_CR2","volume-title":"Pattern Recognition and Machine Learning (Information Science and Statistics)","author":"C.M. Bishop","year":"2007","unstructured":"Bishop, C.M.: Pattern Recognition and Machine Learning (Information Science and Statistics), 1st edn. Springer, Heidelberg (October 2007)","edition":"1"},{"key":"1_CR3","unstructured":"Csato, L., Opper, M.: Sparse representation for gaussian process models. In: Advances in Neural Information Processing Systems, vol. 13 (2001)"},{"key":"1_CR4","unstructured":"Engel, Y.: Algorithms and Representations for Reinforcement Learning. PhD thesis, Hebrew University (April 2005)"},{"key":"1_CR5","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1007\/3-540-36755-1_8","volume-title":"Machine Learning: ECML 2002","author":"Y. Engel","year":"2002","unstructured":"Engel, Y., Mannor, S., Meir, R.: Sparse online greedy support vector regression. In: Elomaa, T., Mannila, H., Toivonen, H. (eds.) ECML 2002. LNCS (LNAI), vol.\u00a02430, pp. 84\u201396. Springer, Heidelberg (2002)"},{"key":"1_CR6","unstructured":"Engel, Y., Mannor, S., Meir, R.: Bayes meets bellman: The gaussian process approach to temporal difference learning. In: Proc. of the 20th International Conference on Machine Learning, pp. 154\u2013161 (2003)"},{"key":"1_CR7","unstructured":"Jong, N., Stone, P.: Kernel-based models for reinforcement learning in continuous state spaces. In: ICML Workshop on Kernel Machines and Reinforcement Learning (2006)"},{"key":"1_CR8","doi-asserted-by":"crossref","unstructured":"Jung, T., Stone, P.: Gaussian processes for sample efficient reinforcement learning with rmax-like exploration. In: Proceedings of the European Conference on Machine Learning (September 2010)","DOI":"10.1007\/978-3-642-15880-3_44"},{"key":"1_CR9","doi-asserted-by":"publisher","first-page":"720","DOI":"10.1145\/1390156.1390247","volume-title":"ICML 2008: Proceedings of the 25th International Conference on Machine Learning","author":"F. Orabona","year":"2008","unstructured":"Orabona, F., Keshet, J., Caputo, B.: The projectron: a bounded kernel-based perceptron. In: ICML 2008: Proceedings of the 25th International Conference on Machine Learning, pp. 720\u2013727. ACM, New York (2008)"},{"key":"1_CR10","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1023\/A:1017928328829","volume":"49","author":"D. Ormoneit","year":"2002","unstructured":"Ormoneit, D., Sen, S.: Kernel-based reinforcement learning. Machine Learning\u00a049, 161\u2013178 (2002)","journal-title":"Machine Learning"},{"key":"1_CR11","doi-asserted-by":"publisher","DOI":"10.1002\/9780470316887","volume-title":"Markov Decision Processes: Discrete Stochastic Dynamic Programming","author":"M.L. Puterman","year":"1994","unstructured":"Puterman, M.L.: Markov Decision Processes: Discrete Stochastic Dynamic Programming. Wiley, New York (1994)"},{"key":"1_CR12","first-page":"751","volume-title":"Advances in Neural Information Processing Systems","author":"C.E. Rasmussen","year":"2003","unstructured":"Rasmussen, C.E., Kuss, M.: Gaussian processes in reinforcement learning. In: Advances in Neural Information Processing Systems, vol.\u00a016, pp. 751\u2013759. MIT Press, Cambridge (2003)"},{"key":"1_CR13","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/4175.001.0001","volume-title":"Learning with Kernels: Support Vector Machines, Regularization, Optimization, and Beyond","author":"B. Scholkopf","year":"2001","unstructured":"Scholkopf, B., Smola, A.J.: Learning with Kernels: Support Vector Machines, Regularization, Optimization, and Beyond. MIT Press, Cambridge (2001)"},{"key":"1_CR14","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9780511809682","volume-title":"Kernel Methods for Pattern Analysis","author":"J. Shawe-Taylor","year":"2004","unstructured":"Shawe-Taylor, J., Cristianini, N.: Kernel Methods for Pattern Analysis. Cambridge University Press, Cambridge (2004)"},{"key":"1_CR15","volume-title":"Reinforcement Learning","author":"R. Sutton","year":"1998","unstructured":"Sutton, R., Barto, A.: Reinforcement Learning. The MIT Press, Cambridge (1998)"},{"key":"1_CR16","first-page":"1017","volume-title":"ICML 2009: Proceedings of the 26th Annual International Conference on Machine Learning","author":"G. Taylor","year":"2009","unstructured":"Taylor, G., Parr, R.: Kernelized value function approximation for reinforcement learning. In: ICML 2009: Proceedings of the 26th Annual International Conference on Machine Learning, pp. 1017\u20131024. ACM, New York (2009)"},{"key":"1_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1007\/11881070_8","volume-title":"Advances in Natural Computation","author":"X. Xu","year":"2006","unstructured":"Xu, X.: A sparse kernel-based least-squares temporal difference algorithm for reinforcement learning. In: Jiao, L., Wang, L., Gao, X.-b., Liu, J., Wu, F. (eds.) ICNC 2006. LNCS, vol.\u00a04221, pp. 47\u201356. Springer, Heidelberg (2006)"},{"issue":"4","key":"1_CR18","doi-asserted-by":"publisher","first-page":"973","DOI":"10.1109\/TNN.2007.899161","volume":"18","author":"X. Xu","year":"2007","unstructured":"Xu, X., Hu, D., Lu, X.: Kernel-based least squares policy iteration for reinforcement learning. IEEE Transactions on Neural Networks\u00a018(4), 973\u2013992 (2007)","journal-title":"IEEE Transactions on Neural Networks"},{"key":"1_CR19","unstructured":"Xu, X., Xie, T., Hu, D., Lu, X., Xu, X., Xie, T., Hu, D., Lu, X.: Kernel least-squares temporal difference learning kernel least-squares temporal difference learning. International Journal of Information Technology, 54\u201363 (2005)"},{"key":"1_CR20","doi-asserted-by":"crossref","unstructured":"Engel, Y., Mannor, S., Meir, R.: Reinforcement learning with Gaussian processes. In: 22nd International Conference on Machine Learning (ICML 2005), Bonn, Germany, pp. 201\u2013208 (2005)","DOI":"10.1145\/1102351.1102377"}],"container-title":["Lecture Notes in Computer Science","Machine Learning and Knowledge Discovery in Databases"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-23808-6_1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,8]],"date-time":"2025-03-08T22:19:23Z","timestamp":1741472363000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-23808-6_1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011]]},"ISBN":["9783642238079","9783642238086"],"references-count":20,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-23808-6_1","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2011]]}}}