{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,16]],"date-time":"2025-10-16T00:19:48Z","timestamp":1760573988304,"version":"build-2065373602"},"reference-count":20,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,6,24]],"date-time":"2025-06-24T00:00:00Z","timestamp":1750723200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,6,24]],"date-time":"2025-06-24T00:00:00Z","timestamp":1750723200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100018696","name":"R\u00e9gion Normandie","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100018696","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,6,24]]},"DOI":"10.23919\/ecc65951.2025.11187042","type":"proceedings-article","created":{"date-parts":[[2025,10,14]],"date-time":"2025-10-14T17:38:09Z","timestamp":1760463489000},"page":"2644-2649","source":"Crossref","is-referenced-by-count":0,"title":["Convergent NMPC-based Reinforcement Learning Using Deep Expected Sarsa and Nonlinear Temporal Difference Learning"],"prefix":"10.23919","author":[{"given":"Amine","family":"Salaje","sequence":"first","affiliation":[{"name":"Universite de Rouen, ESIGELEC, IRSEEM,Rouen,France,76000"}]},{"given":"Thomas","family":"Chevet","sequence":"additional","affiliation":[{"name":"Universite de Rouen, ESIGELEC, IRSEEM,Rouen,France,76000"}]},{"given":"Nicolas","family":"Langlois","sequence":"additional","affiliation":[{"name":"Universite de Rouen, ESIGELEC, IRSEEM,Rouen,France,76000"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46024-6"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1017\/S0263574717000637"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijepes.2021.107411"},{"volume-title":"Reinforcement Learning: An introduction.","year":"2018","author":"Sutton","key":"ref4"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2019.2913768"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.23919\/ECC.2019.8795816"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2020.12.2276"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2020.12.2294"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.23919\/ACC50511.2021.9483100"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.23919\/ECC54610.2021.9655129"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.ifacol.2023.10.548"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CoDIT58514.2023.10284335"},{"key":"ref13","first-page":"719","article-title":"Toward off-policy learning control with function approximation","volume-title":"Proc. 27th ICML","author":"Maei"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3195530"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ADPRL.2009.4927542"},{"key":"ref16","first-page":"1412.6980","article-title":"Adam: A method for stochastic optimization","author":"Kingma","year":"2014"},{"key":"ref17","article-title":"Convergent temporal-difference learning with arbitrary smooth function approximation","volume":"22","author":"Maei","year":"2009","journal-title":"Adv. Neural Inf. Process"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/1553374.1553501"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/IECON48115.2021.9589658"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/s12532-018-0139-4"}],"event":{"name":"2025 European Control Conference (ECC)","start":{"date-parts":[[2025,6,24]]},"location":"Thessaloniki, Greece","end":{"date-parts":[[2025,6,27]]}},"container-title":["2025 European Control Conference (ECC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11186289\/11186290\/11187042.pdf?arnumber=11187042","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,15]],"date-time":"2025-10-15T05:50:04Z","timestamp":1760507404000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11187042\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,24]]},"references-count":20,"URL":"https:\/\/doi.org\/10.23919\/ecc65951.2025.11187042","relation":{},"subject":[],"published":{"date-parts":[[2025,6,24]]}}}