{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,28]],"date-time":"2026-02-28T16:26:58Z","timestamp":1772296018831,"version":"3.50.1"},"publisher-location":"Berlin, Heidelberg","reference-count":15,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"value":"9783642130328","type":"print"},{"value":"9783642130335","type":"electronic"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2010]]},"DOI":"10.1007\/978-3-642-13033-5_21","type":"book-chapter","created":{"date-parts":[[2011,1,22]],"date-time":"2011-01-22T00:57:08Z","timestamp":1295657828000},"page":"199-208","source":"Crossref","is-referenced-by-count":18,"title":["Solving Non-Stationary Bandit Problems by Random Sampling from Sibling Kalman Filters"],"prefix":"10.1007","author":[{"given":"Ole-Christoffer","family":"Granmo","sequence":"first","affiliation":[]},{"given":"Stian","family":"Berg","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"21_CR1","unstructured":"Wyatt, J.: Exploration and Inference in Learning from Reinforcement. PhD thesis, University of Edinburgh (1997)"},{"key":"21_CR2","doi-asserted-by":"crossref","unstructured":"Granmo, O.C.: Solving Two-Armed Bernoulli Bandit Problems Using a Bayesian Learning Automaton. To Appear in the International Journal of Intelligent Computing and Cybernetics (2010)","DOI":"10.1108\/17563781011049179"},{"key":"21_CR3","doi-asserted-by":"crossref","first-page":"285","DOI":"10.1093\/biomet\/25.3-4.285","volume":"25","author":"W.R. Thompson","year":"1933","unstructured":"Thompson, W.R.: On the likelihood that one unknown probability exceeds another in view of the evidence of two samples. Biometrika\u00a025, 285\u2013294 (1933)","journal-title":"Biometrika"},{"issue":"1","key":"21_CR4","doi-asserted-by":"publisher","first-page":"166","DOI":"10.1109\/TSMCB.2006.879012","volume":"37","author":"O.C. Granmo","year":"2007","unstructured":"Granmo, O.C., Oommen, B.J., Myrer, S.A., Olsen, M.G.: Learning Automata-based Solutions to the Nonlinear Fractional Knapsack Problem with Applications to Optimal Resource Allocation. IEEE Transactions on Systems, Man, and Cybernetics, Part B\u00a037(1), 166\u2013175 (2007)","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics, Part B"},{"key":"21_CR5","volume-title":"Learning Automata: An Introduction","author":"K.S. Narendra","year":"1989","unstructured":"Narendra, K.S., Thathachar, M.A.L.: Learning Automata: An Introduction. Prentice-Hall, Englewood Cliffs (1989)"},{"key":"21_CR6","series-title":"Lecture Notes in Artificial Intelligence","doi-asserted-by":"publisher","first-page":"437","DOI":"10.1007\/11564096_42","volume-title":"Machine Learning: ECML 2005","author":"J. Vermorel","year":"2005","unstructured":"Vermorel, J., Mohri, M.: Multi-armed bandit algorithms and empirical evaluation. In: Gama, J., Camacho, R., Brazdil, P.B., Jorge, A.M., Torgo, L. (eds.) ECML 2005. LNCS (LNAI), vol.\u00a03720, pp. 437\u2013448. Springer, Heidelberg (2005)"},{"key":"21_CR7","volume-title":"Reinforcement Learning: An Introduction","author":"R.S. Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement Learning: An Introduction. MIT Press, Cambridge (1998)"},{"key":"21_CR8","doi-asserted-by":"publisher","first-page":"235","DOI":"10.1023\/A:1013689704352","volume":"47","author":"P. Auer","year":"2002","unstructured":"Auer, P., Cesa-Bianchi, N., Fischer, P.: Finite-time Analysis of the Multiarmed Bandit Problem. Machine Learning\u00a047, 235\u2013256 (2002)","journal-title":"Machine Learning"},{"key":"21_CR9","doi-asserted-by":"crossref","unstructured":"Kaelbling, L.P.: Learning in Embedded Systems. PhD thesis, Stanford University (1993)","DOI":"10.7551\/mitpress\/4168.001.0001"},{"key":"21_CR10","doi-asserted-by":"crossref","unstructured":"Wang, T., Lizotte, D., Bowling, M., Scuurmans, D.: Bayesian sparse sampling for on-line reward optimization. In: Proceedings of the 22nd International conference on Machine learning, pp. 956\u2013963 (2005)","DOI":"10.1145\/1102351.1102472"},{"key":"21_CR11","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"850","DOI":"10.1007\/11840817_88","volume-title":"Artificial Neural Networks \u2013 ICANN 2006","author":"C. Dimitrakakis","year":"2006","unstructured":"Dimitrakakis, C.: Nearly optimal exploration-exploitation decision thresholds. In: Kollias, S.D., Stafylopatis, A., Duch, W., Oja, E. (eds.) ICANN 2006. LNCS, vol.\u00a04131, pp. 850\u2013859. Springer, Heidelberg (2006)"},{"key":"21_CR12","first-page":"761","volume-title":"AAAI\/IAAI","author":"R. Dearden","year":"1998","unstructured":"Dearden, R., Friedman, N., Russell, S.: Bayesian q-learning. In: AAAI\/IAAI, pp. 761\u2013768. AAAI Press, Menlo Park (1998)"},{"key":"21_CR13","doi-asserted-by":"crossref","unstructured":"Engel, Y., Mannor, S., Meir, R.: Reinforcement learning with gaussian processes. In: Proceedings of the 22nd International conference on Machine learning, pp. 956\u2013963 (2005)","DOI":"10.1145\/1102351.1102377"},{"key":"21_CR14","volume-title":"Machine Learning","author":"T.M. Mitchell","year":"1997","unstructured":"Mitchell, T.M.: Machine Learning. McGraw-Hill, New York (1997)"},{"key":"21_CR15","volume-title":"Artificial Intelligence - A Modern Approach","author":"S. Russel","year":"2003","unstructured":"Russel, S., Norvig, P.: Artificial Intelligence - A Modern Approach, 2nd edn. Prentice-Hall, Englewood Cliffs (2003)","edition":"2"}],"container-title":["Lecture Notes in Computer Science","Trends in Applied Intelligent Systems"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-13033-5_21.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,11,24]],"date-time":"2020-11-24T03:00:07Z","timestamp":1606186807000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-13033-5_21"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2010]]},"ISBN":["9783642130328","9783642130335"],"references-count":15,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-13033-5_21","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2010]]}}}