{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,4]],"date-time":"2024-09-04T17:21:17Z","timestamp":1725470477220},"publisher-location":"Berlin, Heidelberg","reference-count":12,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540372714"},{"type":"electronic","value":"9783540372738"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2006]]},"DOI":"10.1007\/11816157_92","type":"book-chapter","created":{"date-parts":[[2006,8,31]],"date-time":"2006-08-31T11:46:55Z","timestamp":1157024815000},"page":"757-766","source":"Crossref","is-referenced-by-count":1,"title":["Kernel-Based Reinforcement Learning"],"prefix":"10.1007","author":[{"given":"Guanghua","family":"Hu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuqin","family":"Qiu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Liming","family":"Xiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"92_CR1","first-page":"9","volume":"3","author":"R.S. Sutton","year":"1988","unstructured":"Sutton, R.S.: Learning to Predict by the Methods of Temporal Differences. Machine Learning\u00a03, 9\u201344 (1988)","journal-title":"Machine Learning"},{"key":"92_CR2","first-page":"279","volume":"8","author":"C.J.C.H. Watkins","year":"1992","unstructured":"Watkins, C.J.C.H.: Q-Learning. Machine Learning\u00a08, 279\u2013292 (1992)","journal-title":"Machine Learning"},{"key":"92_CR3","doi-asserted-by":"publisher","first-page":"588","DOI":"10.1109\/3468.618258","volume":"27","author":"G. Santharam","year":"1997","unstructured":"Santharam, G., Sastry, P.S.: A Reinforcement Learning Neural Network for Adaptive Control Markov Chains. 
IEEE Transactions on System, Man and Cybernetics-Part A\u00a027, 588\u2013600 (1997)","journal-title":"IEEE Transactions on System, Man and Cybernetics-Part A"},{"key":"92_CR4","doi-asserted-by":"publisher","first-page":"674","DOI":"10.1109\/9.580874","volume":"42","author":"J.N. Tsitsiklis","year":"1997","unstructured":"Tsitsiklis, J.N., Roy, B.V.: An Analysis of Temporal-Difference Learning with Function Approximation. IEEE Transactions on Automatic Control\u00a042, 674\u2013690 (1997)","journal-title":"IEEE Transactions on Automatic Control"},{"key":"92_CR5","first-page":"59","volume":"22","author":"J.N. Tsitsiklis","year":"1996","unstructured":"Tsitsiklis, J.N., Roy, B.V.: Feature-Based Methods for Large Scale Dynamic Programming. Machine Learning\u00a022, 59\u201394 (1996)","journal-title":"Machine Learning"},{"key":"92_CR6","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511809682","volume-title":"Kernel Methods for Pattern Analysis","author":"J. Shawe-Taylor","year":"2004","unstructured":"Shawe-Taylor, J., Cristianini, N.: Kernel Methods for Pattern Analysis. Cambridge University Press, Cambridge (2004)"},{"key":"92_CR7","volume-title":"Dynamic Programming: Deterministic and Stochastic Methods","author":"D.P. Bertsekas","year":"1987","unstructured":"Bertsekas, D.P.: Dynamic Programming: Deterministic and Stochastic Methods. Prentice-Hall, Englewood Cliffs (1987)"},{"key":"92_CR8","volume-title":"Statistical Learning Theory","author":"V.N. Vapnik","year":"1998","unstructured":"Vapnik, V.N.: Statistical Learning Theory. John Wiley & Sons, New York (1998)"},{"key":"92_CR9","doi-asserted-by":"publisher","first-page":"1025","DOI":"10.1016\/S0925-2312(02)00606-9","volume":"48","author":"G.C. Cawley","year":"2002","unstructured":"Cawley, G.C., Talbot, N.L.C.: Improved Sparse Least-Squares Support Vector Machines. 
Neurocomputing\u00a048, 1025\u20131031 (2002)","journal-title":"Neurocomputing"},{"key":"92_CR10","doi-asserted-by":"publisher","first-page":"271","DOI":"10.1023\/A:1012474916001","volume":"46","author":"G.W. Flake","year":"2002","unstructured":"Flake, G.W., Lawrence, S.: Efficient SVM Regression Training with SMO. Machine Learning\u00a046, 271\u2013290 (2002)","journal-title":"Machine Learning"},{"key":"92_CR11","doi-asserted-by":"publisher","first-page":"85","DOI":"10.1016\/S0925-2312(01)00644-0","volume":"48","author":"J.A.K. Suykens","year":"2002","unstructured":"Suykens, J.A.K., Brabanter, J.D., Lukas, L., Vandewalle, J.: Weighted Least Squares Support Vector Machines: Robustness and Sparse Approximation. Neurocomputing\u00a048, 85\u2013105 (2002)","journal-title":"Neurocomputing"},{"key":"92_CR12","first-page":"185","volume-title":"Advances in Kernel Methods \u2013Support Vector Learning","author":"J. Platt","year":"1999","unstructured":"Platt, J.: Fast Training of Support Vector Machines Using Sequential Minimal Optimization. In: Sch\u00f6lkopf, B., Burges, C.J., Smola, A.J. (eds.) Advances in Kernel Methods \u2013Support Vector Learning, pp. 185\u2013208. 
MIT Press, Cambridge (1999)"}],"container-title":["Lecture Notes in Computer Science","Intelligent Computing"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/11816157_92.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,4,27]],"date-time":"2021-04-27T07:29:33Z","timestamp":1619508573000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/11816157_92"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2006]]},"ISBN":["9783540372714","9783540372738"],"references-count":12,"URL":"https:\/\/doi.org\/10.1007\/11816157_92","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2006]]}}}