{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,27]],"date-time":"2025-10-27T15:55:28Z","timestamp":1761580528170},"publisher-location":"Berlin, Heidelberg","reference-count":15,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540425366"},{"type":"electronic","value":"9783540447955"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2003]]},"DOI":"10.1007\/3-540-44795-4_8","type":"book-chapter","created":{"date-parts":[[2007,8,15]],"date-time":"2007-08-15T06:35:10Z","timestamp":1187159710000},"page":"85-96","source":"Crossref","is-referenced-by-count":13,"title":["A Reinforcement Learning Algorithm Applied to Simplified Two-Player Texas Hold\u2019em Poker"],"prefix":"10.1007","author":[{"given":"Fredrik A.","family":"Dahl","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2001,8,30]]},"reference":[{"key":"8_CR1","unstructured":"Dahl, F.A.: The lagging anchor algorithm. Reinforcement learning in two-player zero-sum games with imperfect information. Machine Learning (to appear)."},{"key":"8_CR2","volume-title":"Game Theory","author":"G. Owen","year":"1995","unstructured":"Owen, G.: Game Theory. 3rd ed. Academic Press, San Diego (1995).","edition":"3"},{"key":"8_CR3","first-page":"9","volume":"3","author":"R.S. Sutton","year":"1988","unstructured":"Sutton, R.S.: Learning to predict by the methods of temporal differences. Machine Learning 3 (1988) 9\u201344.","journal-title":"Machine Learning"},{"key":"8_CR4","unstructured":"Watkins, C.J.C.H.: Learning from Delayed Rewards. PhD thesis, University of Cambridge, UK (1989)."},{"key":"8_CR5","doi-asserted-by":"publisher","first-page":"2017","DOI":"10.1162\/089976699300016070","volume":"11","author":"C. Szepesvari","year":"1999","unstructured":"Szepesvari, C., Littman, M.L.: A unified analysis of value-function-based reinforcement learning algorithms. Neural Computation 11 (1999) 2017\u20132060.","journal-title":"Neural Computation"},{"key":"8_CR6","first-page":"257","volume":"8","author":"G.J. Tesauro","year":"1992","unstructured":"Tesauro, G.J.: Practical issues in temporal difference learning. Machine Learning 8 (1992) 257\u2013277.","journal-title":"Machine Learning"},{"key":"8_CR7","first-page":"157","volume-title":"Proceedings of the 11th International Conference on Machine Learning","author":"M.L. Littman","year":"1994","unstructured":"Littman, M.L.: Markov games as a framework for multi-agent reinforcement learning. In: Proceedings of the 11th International Conference on Machine Learning, Morgan Kaufmann, New Brunswick (1994) 157\u2013163."},{"key":"8_CR8","series-title":"Lect Notes Comput Sci","doi-asserted-by":"publisher","first-page":"117","DOI":"10.1007\/3-540-45164-1_13","volume-title":"ECML 2000","author":"F.A. Dahl","year":"2000","unstructured":"Dahl F.A., Halck O.M.: Minimax TD-learning with neural nets in a Markov game. In: Lopez de Mantaras, R., Plaza, E. (eds.): ECML 2000. Proceedings of the 11th European Conference on Machine Learning. Lecture Notes in Computer Science Vol. 1810, Springer-Verlag, Berlin-Heidelberg-New York (2000) 117\u2013128."},{"key":"8_CR9","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1006\/game.1996.0051","volume":"14","author":"D. Koller","year":"1996","unstructured":"Koller, D., Megiddo, N., von Stengel, B.: Efficient computation of equilibria for extensive two-person games. Games and Economic Behavior 14 (1996) 247\u2013259.","journal-title":"Games and Economic Behavior"},{"key":"8_CR10","volume-title":"Games and Decisions","author":"R.D. Luce","year":"1957","unstructured":"Luce, R.D., Raiffa, H.: Games and Decisions. Wiley, New York (1957)."},{"key":"8_CR11","doi-asserted-by":"publisher","first-page":"167","DOI":"10.1016\/S0004-3702(97)00023-4","volume":"94","author":"D. Koller","year":"1997","unstructured":"Koller, D., Pfeffer, A.: Representations and solutions for game-theoretic problems. Artificial Intelligence 94 (1997) 167\u2013215.","journal-title":"Artificial Intelligence"},{"key":"8_CR12","volume-title":"Proceedings of the ICML-99-Workshop on Machine Learning in Game Playing","author":"J. Schaeffer","year":"1999","unstructured":"Schaeffer, J., Billings, D., Pe\u00f1a, L., Szafron, D.: Learning to play strong poker. In: F\u00fcrnkranz, J., Kubat, M. (eds.): Proceedings of the ICML-99-Workshop on Machine Learning in Game Playing, Jozef Stefan Institute, Ljubljana (1999)."},{"key":"8_CR13","volume-title":"Fundamentals of Artificial Neural Networks","author":"M.H. Hassoun","year":"1995","unstructured":"Hassoun, M.H.: Fundamentals of Artificial Neural Networks. MIT Press, Cambridge, Massachusetts (1995)."},{"key":"8_CR14","volume-title":"Game equilibrium models","author":"R. Selten","year":"1991","unstructured":"Selten R. (1991). Anticipatory learning in two-person games, in: Selten, R. (ed.): Game equilibrium models, vol. I: Evolution and game dynamics, Springer-Verlag, Berlin."},{"key":"8_CR15","volume-title":"Proceedings of the ICML-99-Workshop on Machine Learning in Game Playing","author":"O.M. Halck","year":"1999","unstructured":"Halck, O.M., Dahl, F.A.: On classification of games and evaluation of players \u2014 with some sweeping generalizations about the literature. In: F\u00fcrnkranz, J., Kubat, M. (eds.): Proceedings of the ICML-99-Workshop on Machine Learning in Game Playing, Jozef Stefan Institute, Ljubljana (1999)."}],"container-title":["Lecture Notes in Computer Science","Machine Learning: ECML 2001"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/3-540-44795-4_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,2,21]],"date-time":"2019-02-21T21:14:00Z","timestamp":1550783640000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/3-540-44795-4_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2001,8,30]]},"ISBN":["9783540425366","9783540447955"],"references-count":15,"URL":"https:\/\/doi.org\/10.1007\/3-540-44795-4_8","relation":{},"ISSN":["0302-9743"],"issn-type":[{"type":"print","value":"0302-9743"}],"subject":[],"published":{"date-parts":[[2001,8,30]]}}}