{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,12]],"date-time":"2025-10-12T20:07:15Z","timestamp":1760299635354,"version":"3.41.0"},"reference-count":36,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017,5]]},"DOI":"10.23919\/acc.2017.7963427","type":"proceedings-article","created":{"date-parts":[[2017,7,10]],"date-time":"2017-07-10T21:39:58Z","timestamp":1499722798000},"page":"3120-3127","source":"Crossref","is-referenced-by-count":21,"title":["Deep reinforcement learning for partial differential equation control"],"prefix":"10.23919","author":[{"given":"Amir-massoud","family":"Farahmand","sequence":"first","affiliation":[]},{"given":"Saleh","family":"Nabi","sequence":"additional","affiliation":[]},{"given":"Daniel N.","family":"Nikovski","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"journal-title":"Buoyancy-driven exchange flow with applications to architectural fluid mechanics","year":"2015","author":"nabi","key":"ref33"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1146\/annurev.fluid.31.1.201"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/MCSE.2009.52"},{"key":"ref30","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"2015","journal-title":"International Conference on Learning Representations (ICLR)"},{"key":"ref36","first-page":"2825","article-title":"Scikit-learn: Machine learning in Python","volume":"12","author":"pedregosa","year":"2011","journal-title":"Journal of Machine Learning Resaerch"},{"key":"ref35","article-title":"Theano: A Python framework for fast computation of mathematical expressions","volume":"abs 1605 2688","year":"2016","journal-title":"T development team"},{"journal-title":"Keras","year":"2015","author":"chollet","key":"ref34"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2013.6759923"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1115\/1.4031175"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1017\/jfm.2014.182"},{"key":"ref13","volume":"116","author":"duriez","year":"2016","journal-title":"Machine Learning Control-Taming Nonlinear Dynamics and Turbulence ser Fluid mechanics and its applications"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/b97848"},{"journal-title":"Regularization in Reinforcement Learning","year":"2011","author":"farahmand","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ACC.2009.5160611"},{"journal-title":"Deep Learning","year":"2016","author":"goodfellow","key":"ref17"},{"key":"ref18","article-title":"End to end learning for self-driving cars","volume":"abs 1604 7316","author":"bojarski","year":"2016","journal-title":"CoRR"},{"key":"ref19","first-page":"503","article-title":"Tree-based batch mode reinforcement learning","volume":"6","author":"ernst","year":"2005","journal-title":"Journal of Machine Learning Resaerch"},{"key":"ref28","first-page":"1097","article-title":"ImageNet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in Neural Information Processing Systems (NIPS-25)"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1137\/040614384"},{"journal-title":"Reinforcement Learning An Introduction","year":"1998","author":"sutton","key":"ref3"},{"key":"ref6","first-page":"1","article-title":"End-to-end training of deep visuomotor policies","volume":"17","author":"levine","year":"2016","journal-title":"Journal of Machine Learning Resaerch"},{"key":"ref29","first-page":"161","article-title":"The tradeoffs of large scale learning","author":"bottou","year":"2008","journal-title":"Advances in Neural Information Processing Systems (NIPS-20)"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1038\/nature16961"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ACC.2009.5160552"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ACC.2011.5991540"},{"key":"ref2","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-031-01551-9","author":"szepesv\u00e1ri","year":"2010","journal-title":"Algorithms for Reinforcement Learning"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.camwa.2016.01.011"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2016.7798966"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/11564096_32"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2010.5596468"},{"key":"ref21","first-page":"815","article-title":"Finite-time bounds for fitted value iteration","volume":"9","author":"munos","year":"2008","journal-title":"Journal of Machine Learning Resaerch"},{"journal-title":"The Elements of Statistical Learning Data Mining Inference and Prediction","year":"2001","author":"hastie","key":"ref24"},{"key":"ref23","first-page":"1349","article-title":"Value pursuit iteration","author":"farahmand","year":"2012","journal-title":"Advances in Neural Information Processing Systems (NIPS-25)"},{"key":"ref26","first-page":"568","article-title":"Error propagation for approximate policy and value iteration","author":"farahmand","year":"2010","journal-title":"Advances in Neural Information Processing Systems (NIPS-23)"},{"journal-title":"All of Nonparametric Statistics (Springer Texts in Statistics)","year":"2007","author":"wasserman","key":"ref25"}],"event":{"name":"2017 American Control Conference (ACC)","start":{"date-parts":[[2017,5,24]]},"location":"Seattle, WA, USA","end":{"date-parts":[[2017,5,26]]}},"container-title":["2017 American Control Conference (ACC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7951530\/7962914\/07963427.pdf?arnumber=7963427","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,21]],"date-time":"2025-06-21T20:29:01Z","timestamp":1750537741000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/7963427\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,5]]},"references-count":36,"URL":"https:\/\/doi.org\/10.23919\/acc.2017.7963427","relation":{},"subject":[],"published":{"date-parts":[[2017,5]]}}}