{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,4]],"date-time":"2026-06-04T21:02:03Z","timestamp":1780606923039,"version":"3.54.1"},"reference-count":18,"publisher":"Society for Industrial & Applied Mathematics (SIAM)","issue":"2","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["SIAM J. Control Optim."],"published-print":{"date-parts":[[2000,1]]},"DOI":"10.1137\/s0363012997331639","type":"journal-article","created":{"date-parts":[[2003,6,11]],"date-time":"2003-06-11T11:12:06Z","timestamp":1055329926000},"page":"447-469","source":"Crossref","is-referenced-by-count":341,"title":["The O.D.E. Method for Convergence of Stochastic Approximation and Reinforcement Learning"],"prefix":"10.1137","volume":"38","author":[{"given":"V. S.","family":"Borkar","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"S. P.","family":"Meyn","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"351","reference":[{"key":"R2","first-page":"835","volume":"13","author":"Barto A. G.","year":"1983","journal-title":"IEEE Trans. Systems, Man and Cybernetics","ISSN":"https:\/\/id.crossref.org\/issn\/0018-9472","issn-type":"print"},{"key":"R3","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-75894-2"},{"key":"R5","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6911(97)90015-3"},{"key":"R6","doi-asserted-by":"publisher","DOI":"10.1137\/S0363012995282784"},{"key":"R7","first-page":"169","volume":"24","author":"Borkar V. S.","year":"1996","journal-title":"Appl. Math.","ISSN":"https:\/\/id.crossref.org\/issn\/0862-7940","issn-type":"print"},{"key":"R8","doi-asserted-by":"publisher","DOI":"10.1109\/81.563625"},{"key":"R9","doi-asserted-by":"publisher","DOI":"10.1214\/aoap\/1177004828"},{"key":"R10","doi-asserted-by":"publisher","DOI":"10.1109\/9.471210"},{"key":"R11","doi-asserted-by":"publisher","DOI":"10.1016\/0893-6080(89)90018-X"},{"key":"R12","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1994.6.6.1185"},{"key":"R13","doi-asserted-by":"publisher","DOI":"10.1137\/S036301299731669X"},{"key":"R14","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4899-2696-8"},{"key":"R15","first-page":"0","volume":"39","author":"Maly\u0161ev V.","year":"1979","journal-title":"Trudy Moskov. Mat. Obshch."},{"key":"R16","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4471-3267-7"},{"key":"R17","doi-asserted-by":"publisher","DOI":"10.1214\/aoap\/1177004900"},{"key":"R18","volume-title":"Discrete\u2010parameter martingales","author":"Neveu J.","year":"1975"},{"key":"R20","first-page":"195","volume":"16","author":"Tsitsiklis J.","year":"1994","journal-title":"Mach. Learning","ISSN":"https:\/\/id.crossref.org\/issn\/0885-6125","issn-type":"print"},{"key":"R21","first-page":"279","volume":"8","author":"Watkins C. J. C. H.","year":"1992","journal-title":"Mach. Learning","ISSN":"https:\/\/id.crossref.org\/issn\/0885-6125","issn-type":"print"}],"container-title":["SIAM Journal on Control and Optimization"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/epubs.siam.org\/doi\/pdf\/10.1137\/S0363012997331639","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,1,29]],"date-time":"2017-01-29T07:41:20Z","timestamp":1485675680000},"score":1,"resource":{"primary":{"URL":"http:\/\/epubs.siam.org\/doi\/10.1137\/S0363012997331639"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2000,1]]},"references-count":18,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2000,1]]}},"alternative-id":["10.1137\/S0363012997331639"],"URL":"https:\/\/doi.org\/10.1137\/s0363012997331639","relation":{},"ISSN":["0363-0129","1095-7138"],"issn-type":[{"value":"0363-0129","type":"print"},{"value":"1095-7138","type":"electronic"}],"subject":[],"published":{"date-parts":[[2000,1]]}}}