{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,29]],"date-time":"2026-03-29T15:34:37Z","timestamp":1774798477284,"version":"3.50.1"},"reference-count":39,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2009,12,1]],"date-time":"2009-12-01T00:00:00Z","timestamp":1259625600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Automat. Contr."],"published-print":{"date-parts":[[2009,12]]},"DOI":"10.1109\/tac.2009.2031725","type":"journal-article","created":{"date-parts":[[2009,11,6]],"date-time":"2009-11-06T21:03:49Z","timestamp":1257541429000},"page":"2787-2802","source":"Crossref","is-referenced-by-count":52,"title":["A Structured Multiarmed Bandit Problem and the Greedy Policy"],"prefix":"10.1109","volume":"54","author":[{"given":"A.J.","family":"Mersereau","sequence":"first","affiliation":[]},{"given":"P.","family":"Rusmevichientong","sequence":"additional","affiliation":[]},{"given":"J.N.","family":"Tsitsiklis","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1287\/mnsc.21.11.1225"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-34675-5"},{"key":"ref33","author":"farias","year":"2006","journal-title":"Dynamic Pricing With a Prior on Market Response"},{"key":"ref32","author":"aviv","year":"2005","journal-title":"Dynamic Pricing of Short Life-Cycle Products Through Active Learning"},{"key":"ref31","author":"carvalho","year":"2004","journal-title":"How Should a Manager Set Prices When the Demand Function is Unknown?"},{"key":"ref30","first-page":"385","article-title":"online convex optimization in the bandit setting: gradient descent without a gradient","author":"flaxman","year":"2005","journal-title":"Proc Annu ACM-SIAM Symp Discrete Algorithm"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1137\/S0097539701398375"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1006\/game.1999.0740"},{"key":"ref35","author":"durrett","year":"1996","journal-title":"Probability Theory and Examples"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1287\/opre.1080.0640"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1214\/aoap\/1177005207"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1287\/moor.21.2.257"},{"key":"ref12","author":"frostig","year":"1999","journal-title":"Four Proofs of Gittins' Multiarmed Bandit Theorem"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/9.40770"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.2307\/1427934"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1023\/A:1013689704352"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.2307\/2332286"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1090\/S0002-9904-1952-09620-8"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-94-015-3711-7"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177704454"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/1109557.1109660"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/0022-0531(74)90066-0"},{"key":"ref27","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1007\/978-3-540-27819-1_8","article-title":"online geometric optimization in the bandit setting against an adaptive adversary","author":"mcmahan","year":"2004","journal-title":"Proc 17th Annu Conf Learning Theory"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/0196-8858(85)90002-8"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1111\/1468-0262.00170"},{"key":"ref29","first-page":"697","article-title":"nearly tight bounds for the continuum-armed bandit problem","author":"kleinberg","year":"2005","journal-title":"Proc Adv Neural Inform Processing Syst"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.2307\/2951539"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"143","DOI":"10.1111\/j.2517-6161.1980.tb01111.x","article-title":"multi-armed bandits and the gittins index","volume":"42","author":"whittle","year":"1980","journal-title":"J Royal Stat Soc B"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.75.2.586"},{"key":"ref2","first-page":"241","author":"gittins","year":"1974","journal-title":"Progress in Statistics"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1214\/aoap\/1177005588"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176350495"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1214\/aos\/1176346603"},{"key":"ref22","doi-asserted-by":"crossref","first-page":"771","DOI":"10.1111\/j.2517-6161.1995.tb02062.x","article-title":"response surface bandits","volume":"57","author":"ginebra","year":"1995","journal-title":"J Roy Stat Soc B"},{"key":"ref21","author":"pressman","year":"1990","journal-title":"Sequential Control With Incomplete Information"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1137\/S0363012994275440"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/1273496.1273587"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.jcss.2007.04.016"},{"key":"ref25","first-page":"1505","article-title":"optimistic linear programming gives logarithmic regret for irreducible mdps","author":"tewari","year":"2008","journal-title":"Proc Adv Neural Inform Processing Syst"}],"container-title":["IEEE Transactions on Automatic Control"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx5\/9\/5340373\/05308361.pdf?arnumber=5308361","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,13]],"date-time":"2025-02-13T03:36:18Z","timestamp":1739417778000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/5308361\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009,12]]},"references-count":39,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/tac.2009.2031725","relation":{},"ISSN":["0018-9286","1558-2523"],"issn-type":[{"value":"0018-9286","type":"print"},{"value":"1558-2523","type":"electronic"}],"subject":[],"published":{"date-parts":[[2009,12]]}}}