{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,19]],"date-time":"2025-12-19T22:12:02Z","timestamp":1766182322843,"version":"3.37.3"},"reference-count":29,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100004787","name":"The Scientific and Technological Research Council of T\u00fcrkiye (TUBITAK) BIDEB 2232-B International Fellowship for Early Stage Researchers","doi-asserted-by":"publisher","award":["121C124"],"award-info":[{"award-number":["121C124"]}],"id":[{"id":"10.13039\/501100004787","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Control Syst. Lett."],"published-print":{"date-parts":[[2024]]},"DOI":"10.1109\/lcsys.2024.3416240","type":"journal-article","created":{"date-parts":[[2024,6,18]],"date-time":"2024-06-18T18:12:14Z","timestamp":1718734334000},"page":"1733-1738","source":"Crossref","is-referenced-by-count":5,"title":["Strategizing Against Q-Learners: A Control-Theoretical Approach"],"prefix":"10.1109","volume":"8","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-7516-4850","authenticated-orcid":false,"given":"Yuksel","family":"Arslantas","sequence":"first","affiliation":[{"name":"Department of Electrical and Electronics Engineering, Bilkent University, Ankara, T\u00fcrkiye"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-6765-3598","authenticated-orcid":false,"given":"Ege","family":"Yuceel","sequence":"additional","affiliation":[{"name":"Department of Electrical and Electronics Engineering, Bilkent University, Ankara, T\u00fcrkiye"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5779-3986","authenticated-orcid":false,"given":"Muhammed O.","family":"Sayin","sequence":"additional","affiliation":[{"name":"Department of Electrical and Electronics Engineering, Bilkent University, Ankara, T\u00fcrkiye"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-32430-8_14"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1002\/9781119723950.ch19"},{"key":"ref3","first-page":"1","article-title":"Strategizing against no-regret learners","volume-title":"Proc. 33rd Adv. Neural Inf. Process. Syst.","author":"Deng"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2023.3266505"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.23919\/CCC55666.2022.9902863"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1016\/B978-1-55860-307-3.50049-6"},{"key":"ref7","article-title":"Asymptotic convergence and performance of multi-agent Q-learning dynamics","author":"Hussain","year":"2023","journal-title":"arXiv:2301.09619"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.39.10.1953"},{"key":"ref9","first-page":"1167","article-title":"Classes of multiagent Q-learning dynamics with epsilon-greedy exploration","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Wunder"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0172395"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1257\/aer.20190623"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1111\/1756-2171.12383"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-022-10348-5"},{"key":"ref14","first-page":"11225","article-title":"Adaptive reward-poisoning attacks against reinforcement learning","volume-title":"Proc. 37th Int. Conf. Mach. Learn.","author":"Zhang"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/LCSYS.2020.2979572"},{"key":"ref16","first-page":"1","article-title":"Robust multi-agent Q-learning in cooperative games with adversaries","volume-title":"Proc. AAAI Conf. Artif. Intell.","author":"Nisioti"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.6086"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1287\/mksc.2020.1276"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/3580507.3597726"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/LCSYS.2024.3416240"},{"volume-title":"Markov Decision Processes: Discrete Stochastic Dynamic Programming","year":"2014","author":"Puterman","key":"ref21"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2002.1184960"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-75225-7_30"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1287\/opre.51.6.850.24925"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1287\/moor.1040.0094"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/BF00114724"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/cdc.1995.478953"},{"key":"ref28","first-page":"1","article-title":"Error propagation for approximate policy and value iteration","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Farahmand"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-79033-6"}],"container-title":["IEEE Control Systems Letters"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/7782633\/10411713\/10561617.pdf?arnumber=10561617","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,24]],"date-time":"2024-10-24T17:38:04Z","timestamp":1729791484000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10561617\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/lcsys.2024.3416240","relation":{},"ISSN":["2475-1456"],"issn-type":[{"type":"electronic","value":"2475-1456"}],"subject":[],"published":{"date-parts":[[2024]]}}}