{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T18:07:53Z","timestamp":1771697273371,"version":"3.50.1"},"reference-count":28,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,7]]},"DOI":"10.1109\/acc.2016.7524910","type":"proceedings-article","created":{"date-parts":[[2016,8,5]],"date-time":"2016-08-05T13:52:25Z","timestamp":1470405145000},"page":"167-172","source":"Crossref","is-referenced-by-count":18,"title":["Multi-agent temporal-difference learning with linear function approximation: Weak convergence under time-varying network topologies"],"prefix":"10.1109","author":[{"given":"Milos S.","family":"Stankovic","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Srdjan S.","family":"Stankovic","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2010.2076530"},{"key":"ref11","doi-asserted-by":"crossref","first-page":"601","DOI":"10.1109\/TAC.2014.2364096","article-title":"Distributed optimization over time-varying directed graphs","volume":"60","author":"nedi?","year":"2015","journal-title":"IEEE Trans Autom Control"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2012.2217338"},{"key":"ref13","author":"stankovi?","year":"2014","journal-title":"Distributed stochastic approximation weak convergence and network design"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2006.887293"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2013.2283750"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2012.2203214"},{"key":"ref17","author":"sutton","year":"1998","journal-title":"Reinforcement Learning An Introduction"},{"key":"ref18","author":"bertsekas","year":"1996","journal-title":"Neuro-Dynamic Programming"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/B978-1-55860-377-6.50013-X"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638519"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2015.07.018"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6911(97)90015-3"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2009.02.014"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.1986.1104412"},{"key":"ref5","author":"tsitsiklis","year":"1984","journal-title":"Problems in decentralized decision making and computation"},{"key":"ref8","doi-asserted-by":"crossref","first-page":"48","DOI":"10.1109\/TAC.2008.2009515","article-title":"Distributed subgradient methods for multiagent optimization","volume":"54","author":"nedi?","year":"2009","journal-title":"IEEE Trans Autom Control"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1137\/0325070"},{"key":"ref2","first-page":"4364","article-title":"Consensus based multi-agent control structures","author":"stankovi?","year":"2008","journal-title":"Proc IEEE Conf Decision and Control"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2013.2275131"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2008.2009583"},{"key":"ref20","first-page":"417","article-title":"Off-policy temporal-difference learning with function approximation","author":"precup","year":"2001","journal-title":"Proc 18th Int Conf on Machine Learning"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCC.2007.913919"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553501"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2013.2241057"},{"key":"ref23","author":"mathkar","year":"2013","journal-title":"Distributed reinforcement learning via gossip"},{"key":"ref26","author":"kushner","year":"2003","journal-title":"Stochastic Approximation and Recursive Algorithms and Applications"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2014.2368731"}],"event":{"name":"2016 American Control Conference (ACC)","location":"Boston, MA, USA","start":{"date-parts":[[2016,7,6]]},"end":{"date-parts":[[2016,7,8]]}},"container-title":["2016 American Control Conference (ACC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7518121\/7524873\/07524910.pdf?arnumber=7524910","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,24]],"date-time":"2017-06-24T16:04:51Z","timestamp":1498320291000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7524910\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,7]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/acc.2016.7524910","relation":{},"subject":[],"published":{"date-parts":[[2016,7]]}}}