{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T09:33:36Z","timestamp":1778232816392,"version":"3.51.4"},"reference-count":25,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2012,11,13]],"date-time":"2012-11-13T00:00:00Z","timestamp":1352764800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Ann Oper Res"],"published-print":{"date-parts":[[2013,9]]},"DOI":"10.1007\/s10479-012-1250-y","type":"journal-article","created":{"date-parts":[[2012,11,13]],"date-time":"2012-11-13T09:20:03Z","timestamp":1352798403000},"page":"37-62","source":"Crossref","is-referenced-by-count":16,"title":["The multi-armed bandit, with constraints"],"prefix":"10.1007","volume":"208","author":[{"given":"Eric V.","family":"Denardo","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Eugene A.","family":"Feinberg","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Uriel G.","family":"Rothblum","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2012,11,13]]},"reference":[{"key":"1250_CR1","volume-title":"Constrained Markov decision processes","author":"E. Altman","year":"1999","unstructured":"Altman, E. (1999). Constrained Markov decision processes. Boca Raton, USA: Chapman & Hall\/CRC."},{"key":"1250_CR2","doi-asserted-by":"crossref","first-page":"336","DOI":"10.1057\/9780230226203.0088","volume-title":"The new Palgrave dictionary of economics","author":"D. Bergemann","year":"2008","unstructured":"Bergemann, D., & V\u00e4lim\u00e4kim, J. (2008). Bandit problems. In S. Durlauf & L. Blume (Eds.), The new Palgrave dictionary of economics (Vol. 1, 2nd ed., pp. 336\u2013340). New York: Palgrave Macmillan.","edition":"2"},{"key":"1250_CR3","doi-asserted-by":"crossref","DOI":"10.1007\/978-94-015-3711-7","volume-title":"Bandit problems","author":"D. A. Berry","year":"1985","unstructured":"Berry, D. A., & Friestedt, B. (1985). Bandit problems. London: Chapman & Hall."},{"key":"1250_CR4","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1287\/moor.21.2.257","volume":"21","author":"D. Bertsimas","year":"1993","unstructured":"Bertsimas, D., & Ni\u00f1o-Mora, J. (1993). Conservation laws, extended polymatroids and multi-armed bandit problems: a polyhedral approach to indexable systems. Mathematics of Operations Research, 21, 257\u2013306.","journal-title":"Mathematics of Operations Research"},{"key":"1250_CR5","doi-asserted-by":"crossref","first-page":"165","DOI":"10.1137\/1009030","volume":"9","author":"E. V. Denardo","year":"1967","unstructured":"Denardo, E. V. (1967). Contraction mappings in the theory underlying dynamic programming. SIAM Review, 9, 165\u2013177.","journal-title":"SIAM Review"},{"key":"1250_CR6","doi-asserted-by":"crossref","first-page":"374","DOI":"10.1287\/moor.1060.0240","volume":"32","author":"E. V. Denardo","year":"2007","unstructured":"Denardo, E. V., Park, H., & Rothblum, U. G. (2007). Risk-sensitive and risk-neutral multiarmed bandits. Mathematics of Operations Research, 32, 374\u2013394.","journal-title":"Mathematics of Operations Research"},{"key":"1250_CR7","doi-asserted-by":"crossref","first-page":"414","DOI":"10.1137\/S0363012904442616","volume":"45","author":"E. V. Denardo","year":"2006","unstructured":"Denardo, E. V., & Rothblum, U. G. (2006). A turnpike theorem for a risk-sensitive Markov decision problem with stopping. SIAM Journal on Control and Optimization, 45, 414\u2013431.","journal-title":"SIAM Journal on Control and Optimization"},{"key":"1250_CR8","doi-asserted-by":"crossref","first-page":"255","DOI":"10.1214\/aoap\/1177005062","volume":"4","author":"N. El Karoui","year":"1994","unstructured":"El Karoui, N., & Karatzas, I. (1994). Dynamic allocation indices in continuous time. The Annals of Applied Probability, 4, 255\u2013286.","journal-title":"The Annals of Applied Probability"},{"key":"1250_CR9","doi-asserted-by":"crossref","first-page":"129","DOI":"10.1287\/moor.1110.0525","volume":"37","author":"E. A. Feinberg","year":"2012","unstructured":"Feinberg, E. A., & Rothblum, U. G. (2012). Splitting randomized stationary policies in total\u2014reward Markov decision processes. Mathematics of Operations Research, 37, 129\u2013153.","journal-title":"Mathematics of Operations Research"},{"key":"1250_CR10","doi-asserted-by":"crossref","first-page":"148","DOI":"10.1111\/j.2517-6161.1979.tb01068.x","volume":"41","author":"J. C. Gittins","year":"1979","unstructured":"Gittins, J. C. (1979). Bandit problems and dynamic allocation indices (with discussion). Journal of the Royal Statistical Society. Series B, 41, 148\u2013177.","journal-title":"Journal of the Royal Statistical Society. Series B"},{"key":"1250_CR11","volume-title":"Multi-armed bandit allocation indices","author":"J. C. Gittins","year":"1989","unstructured":"Gittins, J. C. (1989). Multi-armed bandit allocation indices. Chichester: Wiley"},{"key":"1250_CR12","first-page":"241","volume-title":"Progress in statistics, European meeting of statisticians I","author":"J. C. Gittins","year":"1974","unstructured":"Gittins, J. C., & Jones, D. M. (1974). A dynamic allocation index for the sequential design experiments. In J. Gani, K. Sarkadu, & I. Vince (Eds.), Progress in statistics, European meeting of statisticians I (pp.\u00a0241\u2013266). Amsterdam: North-Holland."},{"key":"1250_CR13","doi-asserted-by":"crossref","DOI":"10.1002\/9780470980033","volume-title":"Multi-armed bandit allocation indices","author":"J. C. Gittins","year":"2011","unstructured":"Gittins, J. C., Glazebrook, K., & Weber, R. (2011). Multi-armed bandit allocation indices (2nd ed.). Chichester: Wiley","edition":"2"},{"key":"1250_CR14","doi-asserted-by":"crossref","first-page":"1270","DOI":"10.1214\/aoap\/1028903380","volume":"8","author":"H. Kaspi","year":"1998","unstructured":"Kaspi, H., & Mandelbaum, A. (1998). Multi-armed bandits in discrete and continuous time. The Annals of Applied Probability, 8, 1270\u20131290.","journal-title":"The Annals of Applied Probability"},{"key":"1250_CR15","series-title":"IMS lecture notes\u2014monograph series","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1214\/lnms\/1215540286","volume-title":"Adaptive statistical procedures and related topics","author":"M. N. Katehakis","year":"1986","unstructured":"Katehakis, M. N., & Derman, C. (1986). Computing optimal sequential allocation rules in clinical trials. In J. Van Ryzin (Ed.), IMS lecture notes\u2014monograph series: Vol.\u00a08. Adaptive statistical procedures and related topics (pp. 29\u201339). Hayward: Inst. Math. Stat."},{"key":"1250_CR16","doi-asserted-by":"crossref","first-page":"262","DOI":"10.1287\/moor.12.2.262","volume":"22","author":"M. N. Katehakis","year":"1987","unstructured":"Katehakis, M. N., & Veinott, A. F. Jr. (1987). The multiarmed bandit problem: decomposition and computation. Mathematics of Operations Research, 22, 262\u2013268.","journal-title":"Mathematics of Operations Research"},{"key":"1250_CR17","doi-asserted-by":"crossref","first-page":"596","DOI":"10.1287\/ijoc.1060.0206","volume":"10","author":"J. Ni\u00f1o-Mora","year":"2007","unstructured":"Ni\u00f1o-Mora, J. (2007). A (2\/3)n 3 fast pivoting algorithm for the Gittins index and optimal stopping of a Markov chain. INFORMS Journal on Computing, 10, 596\u2013606.","journal-title":"INFORMS Journal on Computing"},{"key":"1250_CR18","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1006\/jeth.1997.2347","volume":"78","author":"K. Schlag","year":"1998","unstructured":"Schlag, K. (1998). Why imitate, and if so, how? A bounded rational approach to multi-armed bandits. Journal of Economic Theory, 78, 130\u2013156.","journal-title":"Journal of Economic Theory"},{"key":"1250_CR19","doi-asserted-by":"crossref","first-page":"1526","DOI":"10.1016\/j.spl.2008.01.049","volume":"78","author":"I. Sonin","year":"2008","unstructured":"Sonin, I. (2008). A generalized Gittins index for Markov chains and its recursive calculation. Statistics & Probability Letters, 78, 1526\u20131533.","journal-title":"Statistics & Probability Letters"},{"key":"1250_CR20","doi-asserted-by":"crossref","first-page":"194","DOI":"10.1214\/aoap\/1177005207","volume":"4","author":"J. Tsitsiklis","year":"1994","unstructured":"Tsitsiklis, J. (1994). A short proof of the Gittins index theorem. The Annals of Applied Probability, 4, 194\u2013199.","journal-title":"The Annals of Applied Probability"},{"key":"1250_CR21","doi-asserted-by":"crossref","first-page":"426","DOI":"10.1109\/TAC.1985.1103989","volume":"AC-30","author":"P. Variaya","year":"1985","unstructured":"Variaya, P., Walrand, J., & Buyukkoc, C. (1985). Extensions of the multi-armed bandit problem: The discounted case. IEEE Transactions on Automatic Control, AC-30, 426\u2013439.","journal-title":"IEEE Transactions on Automatic Control"},{"key":"1250_CR22","doi-asserted-by":"crossref","first-page":"1635","DOI":"10.1214\/aoms\/1177697379","volume":"40","author":"A. F. Veinott Jr.","year":"1969","unstructured":"Veinott, A. F. Jr. (1969). Discrete dynamic programming with sensitive discount optimality criteria. The Annals of Mathematical Statistics, 40, 1635\u20131660.","journal-title":"The Annals of Mathematical Statistics"},{"key":"1250_CR23","doi-asserted-by":"crossref","first-page":"1024","DOI":"10.1214\/aoap\/1177005588","volume":"2","author":"R. Weber","year":"1992","unstructured":"Weber, R. (1992). On the Gittins index for multiarmed bandits. The Annals of Applied Probability, 2, 1024\u20131033.","journal-title":"The Annals of Applied Probability"},{"key":"1250_CR24","doi-asserted-by":"crossref","first-page":"269","DOI":"10.1017\/S0269964800000826","volume":"2","author":"G. Weiss","year":"1988","unstructured":"Weiss, G. (1988). Branching bandit processes. Probability in the Engineering and Informational Sciences, 2, 269\u2013278.","journal-title":"Probability in the Engineering and Informational Sciences"},{"key":"1250_CR25","doi-asserted-by":"crossref","first-page":"143","DOI":"10.1111\/j.2517-6161.1980.tb01111.x","volume":"43","author":"P. Whittle","year":"1980","unstructured":"Whittle, P. (1980). Multi-armed bandits and the Gittins index. Journal of the Royal Statistical Society. Series B, 43, 143\u2013149.","journal-title":"Journal of the Royal Statistical Society. Series B"}],"container-title":["Annals of Operations Research"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10479-012-1250-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10479-012-1250-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10479-012-1250-y","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,5,1]],"date-time":"2024-05-01T09:37:53Z","timestamp":1714556273000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10479-012-1250-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,11,13]]},"references-count":25,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2013,9]]}},"alternative-id":["1250"],"URL":"https:\/\/doi.org\/10.1007\/s10479-012-1250-y","relation":{},"ISSN":["0254-5330","1572-9338"],"issn-type":[{"value":"0254-5330","type":"print"},{"value":"1572-9338","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,11,13]]}}}