{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T09:10:25Z","timestamp":1760346625867,"version":"3.37.3"},"reference-count":27,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2017,7,21]],"date-time":"2017-07-21T00:00:00Z","timestamp":1500595200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100002809","name":"Generalitat de Catalunya","doi-asserted-by":"publisher","award":["2014-SGR-118"],"award-info":[{"award-number":["2014-SGR-118"]}],"id":[{"id":"10.13039\/501100002809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100006003","name":"Fundaci\u00f3n General CSIC","doi-asserted-by":"publisher","award":["NASAID 201550E022"],"award-info":[{"award-number":["NASAID 201550E022"]}],"id":[{"id":"10.13039\/501100006003","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001807","name":"FAPESP","doi-asserted-by":"crossref","award":["2011\/19280-8"],"award-info":[{"award-number":["2011\/19280-8"]}],"id":[{"id":"10.13039\/501100001807","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001807","name":"FAPESP","doi-asserted-by":"crossref","award":["2016\/21047-3"],"award-info":[{"award-number":["2016\/21047-3"]}],"id":[{"id":"10.13039\/501100001807","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100002322","name":"CAPES","doi-asserted-by":"crossref","id":[{"id":"10.13039\/501100002322","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100003593","name":"CNPq","doi-asserted-by":"crossref","award":["307093\/2014-0","473989\/2013-1"],"award-info":[{"award-number":["307093\/2014-0","473989\/2013-1"]}],"id":[{"id":"10.13039\/501100003593","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1007\/s10489-017-0988-y","type":"journal-article","created":{"date-parts":[[2017,7,21]],"date-time":"2017-07-21T05:09:04Z","timestamp":1500613744000},"page":"993-1007","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Answer set programming for non-stationary Markov decision processes"],"prefix":"10.1007","volume":"47","author":[{"given":"Leonardo A.","family":"Ferreira","sequence":"first","affiliation":[]},{"given":"Reinaldo A.","family":"C. Bianchi","sequence":"additional","affiliation":[]},{"given":"Paulo E.","family":"Santos","sequence":"additional","affiliation":[]},{"given":"Ramon Lopez","family":"de Mantaras","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,7,21]]},"reference":[{"key":"988_CR1","doi-asserted-by":"publisher","first-page":"122","DOI":"10.1007\/978-3-642-40564-8_13","volume-title":"Logic programming and nonmonotonic reasoning, vol 8148","author":"J Babb","year":"2013","unstructured":"Babb J, Lee J (2013) Cplus 2ASP: computing action language C + $\\mathcal {C}+$ in answer set programming. In: Cabalar P, Son TC (eds) Logic programming and nonmonotonic reasoning, vol 8148. Springer, Berlin Heidelberg, pp 122\u2013134"},{"doi-asserted-by":"publisher","unstructured":"Babb J, Lee J (2015) Action language B C + . J Logic Comput, p exv062. doi: 10.1093\/logcom\/exv062","key":"988_CR2","DOI":"10.1093\/logcom\/exv062"},{"issue":"1\u20132","key":"988_CR3","doi-asserted-by":"publisher","first-page":"183","DOI":"10.1007\/s10472-006-9026-1","volume":"47","author":"M Balduccini","year":"2006","unstructured":"Balduccini M, Gelfond M, Nogueira M (2006) Answer set based design of knowledge systems. Ann Math Artif Intell 47(1\u20132): 183\u2013219","journal-title":"Ann Math Artif Intell"},{"unstructured":"Balduccini M, Gelfond M, Nogueira M, Watson R (2002) Planning with the USA-advisor. In: 3rd NASA international workshop on planning and scheduling for space. Houston","key":"988_CR4"},{"key":"988_CR5","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1007\/3-540-45402-0_39","volume-title":"Logic programming and nonmotonic reasoning, vol 2173","author":"M Balduccini","year":"2001","unstructured":"Balduccini M, Gelfond M, Watson R, Nogueira M (2001) The USA-advisor. In: Goos G, Harmanis J, van Leeuwen J, Eiter T, Faber W, Truszczy\u0144ski M L (eds) Logic programming and nonmotonic reasoning, vol 2173. Springer Berlin Heidelberg, Berlin, Heidelberg, pp 439\u2013442"},{"issue":"1","key":"988_CR6","doi-asserted-by":"publisher","first-page":"57","DOI":"10.1017\/S1471068408003645","volume":"9","author":"C Baral","year":"2009","unstructured":"Baral C, Gelfond M, Rushton N (2009) Probabilistic reasoning with answer sets. Theory Pract Logic Program 9(1):57","journal-title":"Theory Pract Logic Program"},{"issue":"8","key":"988_CR7","doi-asserted-by":"publisher","first-page":"716","DOI":"10.1073\/pnas.38.8.716","volume":"38","author":"R Bellman","year":"1952","unstructured":"Bellman R (1952) On the theory of dynamic programming. Proc Natl Acad Sci 38(8):716\u2013719","journal-title":"Proc Natl Acad Sci"},{"issue":"4","key":"988_CR8","doi-asserted-by":"publisher","first-page":"679","DOI":"10.1512\/iumj.1957.6.56038","volume":"6","author":"R Bellman","year":"1957","unstructured":"Bellman R (1957) A Markovian decision process. Ind Univ Math J 6(4):679\u2013684","journal-title":"Ind Univ Math J"},{"unstructured":"Bellman RE, Dreyfus SE (1971) Applied dynamic programming, 4 edn. Princeton Univ Press","key":"988_CR9"},{"key":"988_CR10","first-page":"401","volume-title":"Advances in neural information processing systems, vol 17","author":"E Even-dar","year":"2005","unstructured":"Even-dar E, Kakade SM, Mansour Y (2005) Experts in a markov decision process. In: Saul LK, Weiss Y, Bottou L (eds) Advances in neural information processing systems, vol 17. MIT Press, Cambridge, pp 401\u2013408. http:\/\/dl.acm.org\/citation.cfm?id=2976091 . Accessed on September 2016"},{"issue":"3","key":"988_CR11","doi-asserted-by":"publisher","first-page":"726","DOI":"10.1287\/moor.1090.0396","volume":"34","author":"E Even-Dar","year":"2009","unstructured":"Even-Dar E, Kakade SM, Mansour Y (2009) Online markov decision processes. Math Oper Res 34(3):726\u2013736","journal-title":"Math Oper Res"},{"doi-asserted-by":"crossref","unstructured":"Gebser M, Kaminski R, Kaufmann B (2013) Answer set solving in practice. Morgan & Claypool Publishers","key":"988_CR12","DOI":"10.1007\/978-3-031-01561-8"},{"key":"988_CR13","first-page":"1070","volume-title":"Proceedings of international logic programming conference and symposium","author":"M Gelfond","year":"1988","unstructured":"Gelfond M, Lifschitz V (1988) The stable model semantics for logic programming. In: Kowalski R, Bowen K (eds) Proceedings of international logic programming conference and symposium. MIT Press, Cambridge, pp 1070\u20131080. http:\/\/www.cs.utexas.edu\/users\/ai-lab\/?gel88 . Accessed on March 2016"},{"unstructured":"Gelfond M, Rushton N (2010) Causal and probabilistic reasoning in P-log. Heuristics, probabilities and causality. A tribute to Judea Pearl, pp 337\u2013359","key":"988_CR14"},{"doi-asserted-by":"crossref","unstructured":"Khandelwal P, Yang F, Leonetti M, Lifschitz V, Stone P (2014) Planning in action language BC while learning action costs for mobile robots. In: Proceedings of the twenty-fourth international conference on automated planning and scheduling, ICAPS 2014. Portsmouth","key":"988_CR15","DOI":"10.1609\/icaps.v24i1.13671"},{"issue":"1\u20132","key":"988_CR16","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1016\/S0004-3702(02)00186-8","volume":"138","author":"V Lifschitz","year":"2002","unstructured":"Lifschitz V (2002) Answer set programming and plan generation. Artif Intell 138(1\u20132):39\u201354","journal-title":"Artif Intell"},{"unstructured":"McCarthy J (1998) Elaboration tolerance. In: Proceedings of the fourth symposium on logical formalizations of commonsense reasoning (common sense 98), vol 98. London","key":"988_CR17"},{"key":"988_CR18","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1007\/3-540-45241-9_12","volume-title":"Practical aspects of declarative languages, vol 1990","author":"M Nogueira","year":"2001","unstructured":"Nogueira M, Balduccini M, Gelfond M, Watson R, Barry M (2001) An A-Prolog decision support system for the space shuttle. In: Goos G, Hartmanis J, van Leeuwen J, Ramakrishnan IV (eds) Practical aspects of declarative languages, vol 1990. Springer Berlin Heidelberg, Berlin, Heidelberg, pp 169\u2013183"},{"unstructured":"Ryan MR, Pendrith MD (1998) Rl-tops: an architecture for modularity and re-use in reinforcement learning. In: Proceedings of the fifteenth international conference on machine learning. Morgan Kaufmann, pp 481\u2013487","key":"988_CR19"},{"unstructured":"Ryan MRK (2002) Using abstract models of behaviours to automatically generate reinforcement learning hierarchies. In: Proceedings of the 19th international conference on machine learning. Morgan Kaufmann, pp 522\u2013529","key":"988_CR20"},{"doi-asserted-by":"crossref","unstructured":"Sprauel J, Teichteil-K\u00f6nigsbuch F, Kolobov A (2014) Saturated path-constrained MDP: planning under uncertainty and deterministic model-checking constraints. In: Proceedings of 28th AAAI conf. on artificial intelligence (AAAI), pp 2367\u20132373","key":"988_CR21","DOI":"10.1609\/aaai.v28i1.9041"},{"unstructured":"Sridharan M, Gelfond M, Zhang S, Wyatt J (2015) Mixing non-monotonic logical reasoning and probabilistic planning for robots. In: Workshop on hybrid reasoning @ IJCAI 2015","key":"988_CR22"},{"unstructured":"Sutton RS, Barto AG (2015) Reinforcement learning an introduction, 2nd edn. In: progress (Draft). MIT Press","key":"988_CR23"},{"key":"988_CR24","volume-title":"Learning from delayed rewards","author":"CJCH Watkins","year":"1989","unstructured":"Watkins CJCH (1989) Learning from delayed rewards. University of Cambridge England, PhD thesis"},{"doi-asserted-by":"crossref","unstructured":"Yang F, Khandelwal P, Leonetti M, Stone P (2014) Planning in answer set programming while learning action costs for mobile robots. In: AAAI Spring 2014 symposium on knowledge representation and reasoning in robotics (AAAI-SSS)","key":"988_CR25","DOI":"10.1609\/icaps.v24i1.13671"},{"issue":"3","key":"988_CR26","doi-asserted-by":"publisher","first-page":"737","DOI":"10.1287\/moor.1090.0397","volume":"34","author":"JY Yu","year":"2009","unstructured":"Yu JY, Mannor S, Shimkin N (2009) Markov decision processes with arbitrary reward processes. Math Oper Res 34(3):737\u2013757","journal-title":"Math Oper Res"},{"issue":"3","key":"988_CR27","doi-asserted-by":"publisher","first-page":"699","DOI":"10.1109\/TRO.2015.2422531","volume":"31","author":"S Zhang","year":"2015","unstructured":"Zhang S, Sridharan M, Wyatt JL (2015) Mixed logical inference and probabilistic planning for robots in unreliable worlds. Trans Robot IEEE 31(3):699\u2013713","journal-title":"Trans Robot IEEE"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10489-017-0988-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-017-0988-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-017-0988-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,24]],"date-time":"2023-08-24T16:42:55Z","timestamp":1692895375000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10489-017-0988-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,7,21]]},"references-count":27,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["988"],"URL":"https:\/\/doi.org\/10.1007\/s10489-017-0988-y","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"type":"print","value":"0924-669X"},{"type":"electronic","value":"1573-7497"}],"subject":[],"published":{"date-parts":[[2017,7,21]]},"assertion":[{"value":"21 July 2017","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}