{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,1]],"date-time":"2025-07-01T05:48:13Z","timestamp":1751348893754,"version":"3.28.0"},"reference-count":34,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,12,13]],"date-time":"2023-12-13T00:00:00Z","timestamp":1702425600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,12,13]],"date-time":"2023-12-13T00:00:00Z","timestamp":1702425600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"NSF","doi-asserted-by":"publisher","award":["ECCS 2025732,ECCS 1750041"],"award-info":[{"award-number":["ECCS 2025732,ECCS 1750041"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,12,13]]},"DOI":"10.1109\/cdc49753.2023.10383590","type":"proceedings-article","created":{"date-parts":[[2024,1,19]],"date-time":"2024-01-19T18:38:36Z","timestamp":1705689516000},"page":"7817-7823","source":"Crossref","is-referenced-by-count":2,"title":["Weighted-Norm Bounds on Model Approximation in MDPs with Unbounded Per-Step Cost"],"prefix":"10.1109","author":[{"given":"Berk","family":"Bozkurt","sequence":"first","affiliation":[{"name":"McGill University,Department of Electrical and Computer Engineering,Montreal,QC,Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Aditya","family":"Mahajan","sequence":"additional","affiliation":[{"name":"McGill University,Department of Electrical and Computer Engineering,Montreal,QC,Canada"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ashutosh","family":"Nayyar","sequence":"additional","affiliation":[{"name":"University of Southern California,Department of Electrical and Computer Engineering,Los Angeles,CA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yi","family":"Ouyang","sequence":"additional","affiliation":[{"name":"Preferred Networks America,Burlingame,CA,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/0022-247X(71)90106-5"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1287\/moor.3.3.231"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1287\/moor.4.2.179"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1137\/0318003"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.1975.1100984"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/9.133184"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.jmaa.2011.11.015"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.1986.1104250"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1287\/moor.22.4.872"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2014.2343831"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-79033-6"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1080\/02670836.2022.2152925"},{"issue":"12","key":"ref13","first-page":"1","article-title":"Approximate information state for approximate planning and reinforcement learning in partially observed systems","volume":"23","author":"Subramanian","year":"2022","journal-title":"J. Mach. Learn. Res."},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/BF00935190"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/0165-1889(94)90048-5"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.jmaa.2015.10.008"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1287\/moor.2016.0832"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TAC.2019.2907172"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1137\/17M1157660"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1137\/18M1208058"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.automatica.2022.110179"},{"key":"ref22","article-title":"Approximate homomorphisms: A framework for non-exact minimization in Markov decision processes","author":"Ravindran","year":"2004","journal-title":"KBCS"},{"key":"ref23","article-title":"Plannable approximations to mdp homomorphisms: Equivariance under actions","author":"van der Pol","year":"2020","journal-title":"arXiv preprint"},{"key":"ref24","first-page":"162","article-title":"Metrics for finite Markov decision processes","volume":"4","author":"Ferns","year":"2004","journal-title":"UAl"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1137\/10080484X"},{"key":"ref26","first-page":"1653","article-title":"Equivalence relations in fully and partially observable Markov decision processes","volume":"9","author":"Castro","year":"2009","journal-title":"IJCAI"},{"key":"ref27","first-page":"2915","article-title":"Near optimal behavior via approximate state abstraction","volume-title":"ICML","author":"Abel","year":"2016"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1.11478"},{"key":"ref29","first-page":"2170","article-title":"Deepmdp: Learning continuous latent space models for representation learning","volume-title":"ICML","author":"Gelada","year":"2019"},{"key":"ref30","doi-asserted-by":"crossref","DOI":"10.1109\/CDC49753.2023.10383590","article-title":"Weighted-norm bounds on model approximation in MDPs with unbounded per-step cost","volume-title":"extended version","author":"Bozkurt"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4612-0729-0"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4612-0561-6"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.2307\/1906813"},{"key":"ref34","article-title":"Dynamic programming and optimal control","author":"Bertsekas","year":"2015","journal-title":"Athena Scientific"}],"event":{"name":"2023 62nd IEEE Conference on Decision and Control (CDC)","start":{"date-parts":[[2023,12,13]]},"location":"Singapore, Singapore","end":{"date-parts":[[2023,12,15]]}},"container-title":["2023 62nd IEEE Conference on Decision and Control (CDC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10383192\/10383193\/10383590.pdf?arnumber=10383590","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,23]],"date-time":"2024-01-23T16:27:16Z","timestamp":1706027236000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10383590\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12,13]]},"references-count":34,"URL":"https:\/\/doi.org\/10.1109\/cdc49753.2023.10383590","relation":{},"subject":[],"published":{"date-parts":[[2023,12,13]]}}}