{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T07:31:42Z","timestamp":1725521502465},"publisher-location":"Berlin, Heidelberg","reference-count":27,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540897217"},{"type":"electronic","value":"9783540897224"}],"license":[{"start":{"date-parts":[[2008,1,1]],"date-time":"2008-01-01T00:00:00Z","timestamp":1199145600000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2008]]},"DOI":"10.1007\/978-3-540-89722-4_1","type":"book-chapter","created":{"date-parts":[[2008,11,26]],"date-time":"2008-11-26T08:57:14Z","timestamp":1227689834000},"page":"1-14","source":"Crossref","is-referenced-by-count":2,"title":["Lazy Planning under Uncertainty by Optimizing Decisions on an Ensemble of Incomplete Disturbance Trees"],"prefix":"10.1007","author":[{"given":"Boris","family":"Defourny","sequence":"first","affiliation":[]},{"given":"Damien","family":"Ernst","sequence":"additional","affiliation":[]},{"given":"Louis","family":"Wehenkel","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"1_CR1","volume-title":"Predictive Control with Constraints","author":"J. Maciejowski","year":"2001","unstructured":"Maciejowski, J.: Predictive Control with Constraints. Prentice Hall, Englewood Cliffs (2001)"},{"key":"1_CR2","doi-asserted-by":"publisher","first-page":"667","DOI":"10.1016\/S0098-1354(98)00301-9","volume":"23","author":"M. Morari","year":"1999","unstructured":"Morari, M., Lee, J.: Model predictive control: past, present and future. Computers and Chemical Engineering\u00a023, 667\u2013682 (1999)","journal-title":"Computers and Chemical Engineering"},{"key":"1_CR3","volume-title":"Introduction to Stochastic Programming","author":"J. Birge","year":"1997","unstructured":"Birge, J., Louveaux, F.: Introduction to Stochastic Programming. Springer, New York (1997)"},{"key":"1_CR4","first-page":"144","volume-title":"POPL 1993: Proceedings of the 20th ACM SIGPLAN-SIGACT symposium on Principles of programming languages","author":"J. Launchbury","year":"1993","unstructured":"Launchbury, J.: A natural semantics for lazy evaluation. In: POPL 1993: Proceedings of the 20th ACM SIGPLAN-SIGACT symposium on Principles of programming languages, pp. 144\u2013154. ACM, New York (1993)"},{"key":"1_CR5","unstructured":"Friedman, J., Kohavi, R., Yun, Y.: Lazy decision trees. In: Proc. of 13th National Conference on Artificial Intelligence, AAAI 1996. Part 1(of 2), pp. 717\u2013724 (1996)"},{"issue":"2","key":"1_CR6","doi-asserted-by":"publisher","first-page":"511","DOI":"10.1137\/050632865","volume":"17","author":"H. Heitsch","year":"2006","unstructured":"Heitsch, H., R\u00f6misch, W., Strugarek, C.: Stability of multistage stochastic programs. SIAM Journal on Optimization\u00a017(2), 511\u2013525 (2006)","journal-title":"SIAM Journal on Optimization"},{"key":"1_CR7","first-page":"483","volume-title":"Stochastic Programming. Handbooks in Operations Research and Management Science","author":"W. R\u00f6misch","year":"2003","unstructured":"R\u00f6misch, W.: Stability of stochastic programming problems. In: Ruszczy\u0144ski, A., Shapiro, A. (eds.) Stochastic Programming. Handbooks in Operations Research and Management Science, vol.\u00a010, pp. 483\u2013554. Elsevier, Amsterdam (2003)"},{"key":"1_CR8","first-page":"153","volume":"84","author":"M. Dempster","year":"1998","unstructured":"Dempster, M.: Sequential importance sampling algorithms for dynamic stochastic programming. Annals of Operations Research\u00a084, 153\u2013184 (1998)","journal-title":"Annals of Operations Research"},{"key":"1_CR9","first-page":"353","volume-title":"Stochastic Programming. Handbooks in Operations Research and Management Science","author":"A. Shapiro","year":"2003","unstructured":"Shapiro, A.: Monte Carlo sampling methods. In: Ruszczy\u0144ski, A., Shapiro, A. (eds.) Stochastic Programming. Handbooks in Operations Research and Management Science, vol.\u00a010, pp. 353\u2013425. Elsevier, Amsterdam (2003)"},{"issue":"2","key":"1_CR10","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1287\/mnsc.47.2.295.9834","volume":"47","author":"K. H\u00f8yland","year":"2001","unstructured":"H\u00f8yland, K., Wallace, S.: Generating scenario trees for multistage decision problems. Management Science\u00a047(2), 295\u2013307 (2001)","journal-title":"Management Science"},{"key":"1_CR11","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1007\/s10479-006-0140-6","volume":"152","author":"R. Hochreiter","year":"2007","unstructured":"Hochreiter, R., Pflug, G.: Financial scenario generation for stochastic multi-stage decision processes as facility location problems. Annals of Operations Research\u00a0152, 257\u2013272 (2007)","journal-title":"Annals of Operations Research"},{"issue":"4","key":"1_CR12","doi-asserted-by":"publisher","first-page":"792","DOI":"10.1287\/moor.27.4.792.304","volume":"27","author":"S. Rachev","year":"2002","unstructured":"Rachev, S., R\u00f6misch, W.: Quantitative stability in stochastic programming: The method of probability metrics. Mathematics of Operations Research\u00a027(4), 792\u2013818 (2002)","journal-title":"Mathematics of Operations Research"},{"key":"1_CR13","doi-asserted-by":"crossref","unstructured":"Ernst, D., Glavic, M., Capitanescu, F., Wehenkel, L.: Reinforcement learning versus model predictive control: a comparison on a power system problem. IEEE Transactions on Systems, Man and Cybernetics - Part B (to appear, 2008)","DOI":"10.1109\/TSMCB.2008.2007630"},{"key":"1_CR14","doi-asserted-by":"publisher","first-page":"1361","DOI":"10.1016\/0005-1098(96)00063-5","volume":"32","author":"M. Kothare","year":"1996","unstructured":"Kothare, M., Balakrishnan, V., Morari, M.: Robust constrained model predictive control using matrix inequalities. Automatica\u00a032, 1361\u20131379 (1996)","journal-title":"Automatica"},{"issue":"6","key":"1_CR15","doi-asserted-by":"publisher","first-page":"1559","DOI":"10.1016\/j.automatica.2008.01.017","volume":"44","author":"Y. Nesterov","year":"2008","unstructured":"Nesterov, Y., Vial, J.P.: Confidence level solutions for stochastic programming. Automatica\u00a044(6), 1559\u20131568 (2008)","journal-title":"Automatica"},{"issue":"2","key":"1_CR16","first-page":"197","volume":"5","author":"R. Schapire","year":"1990","unstructured":"Schapire, R.: The strength of weak learnability. Machine Learning\u00a05(2), 197\u2013227 (1990)","journal-title":"Machine Learning"},{"issue":"2","key":"1_CR17","first-page":"123","volume":"24","author":"L. Breiman","year":"1996","unstructured":"Breiman, L.: Bagging predictors. Machine Learning\u00a024(2), 123\u2013140 (1996)","journal-title":"Machine Learning"},{"key":"1_CR18","first-page":"503","volume":"6","author":"D. Ernst","year":"2005","unstructured":"Ernst, D., Geurts, P., Wehenkel, L.: Tree-based batch mode reinforcement learning. Journal of Machine Learning Research\u00a06, 503\u2013556 (2005)","journal-title":"Journal of Machine Learning Research"},{"key":"1_CR19","first-page":"1038","volume":"8","author":"R. Sutton","year":"1996","unstructured":"Sutton, R.: Generalization in reinforcement learning: successful examples using sparse coarse coding. Advances in Neural Information Processing Systems\u00a08, 1038\u20131044 (1996)","journal-title":"Advances in Neural Information Processing Systems"},{"issue":"2-3","key":"1_CR20","doi-asserted-by":"publisher","first-page":"193","DOI":"10.1023\/A:1017932429737","volume":"49","author":"M. Kearns","year":"2002","unstructured":"Kearns, M., Mansour, Y., Ng, A.: A sparse sampling algorithm for near-optimal planning in large Markov decision processes. Machine Learning\u00a049(2-3), 193\u2013208 (2002)","journal-title":"Machine Learning"},{"key":"1_CR21","volume-title":"Information Science and Statistics","author":"R. Rubinstein","year":"2004","unstructured":"Rubinstein, R., Kroese, D.: The Cross-Entropy Method. A Unified Approach to Combinatorial Optimization, Monte-Carlo Simulation, and Machine Learning. In: Information Science and Statistics. Springer, Heidelberg (2004)"},{"key":"1_CR22","first-page":"1023","volume-title":"Proceedings of the Twelfth National Conference on Artificial Intelligence (AAAI 1994)","author":"A. Cassandra","year":"1994","unstructured":"Cassandra, A., Kaelbling, L., Littman, M.: Acting optimally in partially observable stochastic domains. In: Proceedings of the Twelfth National Conference on Artificial Intelligence (AAAI 1994), Seattle, Washington, USA, vol.\u00a02, pp. 1023\u20131028. AAAI Press\/MIT Press, Menlo Park (1994)"},{"key":"1_CR23","unstructured":"Ng, A., Jordan, M.: PEGASUS: a policy search method for large MDPs and POMDPs. In: Proceedings of the Sixteenth Conference on Uncertainty in Artificial Intelligence, pp. 406\u2013415 (1999)"},{"key":"1_CR24","unstructured":"Defourny, B.: Approximate solution to multistage stochastic programs with ensembles of randomized scenario trees. Master\u2019s thesis, University of Li\u00e8ge, Department of Electrical Engineering and Computer Science (2007)"},{"key":"1_CR25","unstructured":"Defourny, B., Wehenkel, L.: Averaging decisions from an ensemble of scenario trees: a validation on newsvendor problems (submitted, 2008)"},{"key":"1_CR26","volume-title":"Dynamic Programming","author":"R. Bellman","year":"1957","unstructured":"Bellman, R.: Dynamic Programming. Princeton University Press, Princeton (1957)"},{"key":"1_CR27","first-page":"1057","volume":"12","author":"R. Sutton","year":"2000","unstructured":"Sutton, R., McAllester, D., Singh, S., Mansour, Y.: Policy gradient methods for reinforcement learning with function approximation. Advances in Neural Information Processing Systems\u00a012, 1057\u20131063 (2000)","journal-title":"Advances in Neural Information Processing Systems"}],"container-title":["Lecture Notes in Computer Science","Recent Advances in Reinforcement Learning"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-89722-4_1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,15]],"date-time":"2019-05-15T14:59:11Z","timestamp":1557932351000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-89722-4_1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2008]]},"ISBN":["9783540897217","9783540897224"],"references-count":27,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-89722-4_1","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2008]]}}}