{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T22:48:49Z","timestamp":1725576529423},"publisher-location":"Berlin, Heidelberg","reference-count":21,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540408048"},{"type":"electronic","value":"9783540452263"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2003]]},"DOI":"10.1007\/978-3-540-45226-3_4","type":"book-chapter","created":{"date-parts":[[2011,1,17]],"date-time":"2011-01-17T14:00:22Z","timestamp":1295272822000},"page":"22-29","source":"Crossref","is-referenced-by-count":0,"title":["ART-Based Neuro-fuzzy Modelling Applied to Reinforcement Learning"],"prefix":"10.1007","author":[{"given":"Konstantinos C.","family":"Zikidis","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Spyros G.","family":"Tzafestas","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"key":"4_CR1","doi-asserted-by":"crossref","unstructured":"Baird, L.C.: Reinforcement learning in continuous time: Advantage updating. In: Proc. of IEEE Intl. Conf. on Neural Networks (ICNN 1994), Orlando, Florida (1994)","DOI":"10.1109\/ICNN.1994.374604"},{"key":"4_CR2","doi-asserted-by":"crossref","unstructured":"Baird, L.C.: Residual algorithms: Reinforcement learning with function approximation. In: Prieditis, A., Russell, S. (eds.) Proc. of 12th Intl. Conf. on Mach. Learn., pp. 30\u201337. Morgan Kaufmann, San Francisco (1995)","DOI":"10.1016\/B978-1-55860-377-6.50013-X"},{"key":"4_CR3","unstructured":"Baxter, J., Bartlett, P.L.: Reinforcement learning in POMDP\u2019s via direct gradient ascent. In: Proc. of 17th Intl. Conf. on Machine Learning, Stanford, CA (2000)"},{"key":"4_CR4","unstructured":"Box, G.E.P., Jenkins, G.M.: Time Series Analysis, Forecasting, and Control. Holden Day, San Francisco (1970)"},{"key":"4_CR5","first-page":"369","volume-title":"Advances in Neural Information Processing Systems (Proc. of 1994 Conf.)","author":"J.A. Boyan","year":"1995","unstructured":"Boyan, J.A., Moore, A.W.: Generalization in reinforcement learning: Safely approximating the value functions. In: Tesauro, G., Touretzky, D. (eds.) Advances in Neural Information Processing Systems (Proc. of 1994 Conf.), San Mateo, CA, pp. 369\u2013376. Morgan Kaufmann, San Mateo (1995)"},{"key":"4_CR6","doi-asserted-by":"publisher","first-page":"759","DOI":"10.1016\/0893-6080(91)90056-B","volume":"4","author":"G.A. Carpenter","year":"1991","unstructured":"Carpenter, G.A., Grossberg, S., Rosen, G.A.: Fuzzy ART: Fast stable learning and categorization of analog patterns by an adaptive resonance system. Neural Networks\u00a04, 759\u2013771 (1991)","journal-title":"Neural Networks"},{"issue":"5","key":"4_CR7","doi-asserted-by":"publisher","first-page":"698","DOI":"10.1109\/72.159059","volume":"3","author":"G.A. Carpenter","year":"1992","unstructured":"Carpenter, G.A., Grossberg, S., Markuzon, N., Reynolds, J.H., Rosen, D.B.: Fuzzy ARTMAP: A neural architecture for incremental supervised learning of analog multidimensional maps. IEEE Trans. on Neural Networks\u00a03(5), 698\u2013712 (1992)","journal-title":"IEEE Trans. on Neural Networks"},{"key":"4_CR8","unstructured":"Gordon, G.: Stable function approximation in dynamic programming. In: Proc. of 14th Intl. Conf. on Machine Learning, Nashville, TN (1997)"},{"key":"4_CR9","unstructured":"Kimura, H., Kobayashi, S.: An analysis of actor\/critic algorithms using eligibility traces: reinforcement learning with imperfect value functions. In: Proc. of 15th Intl. Conf. on Mach. Learn., Madison, Wisconsin, pp. 278\u2013286 (1998)"},{"key":"4_CR10","unstructured":"Konda, V.R., Tsitsiklis, J.N.: Actor critic algorithms. In: Advances in Neural Information Processing Systems (Proc. of the 1999 conference), Cambridge, MA, vol.\u00a012. MIT Press, Cambridge (1999)"},{"key":"4_CR11","volume-title":"Neural Fuzzy Systems: a Neuro-Fuzzy Synergism to Intelligent Systems","author":"C.-J. Lin","year":"1996","unstructured":"Lin, C.-J., Lee, C.S.G.: Neural Fuzzy Systems: a Neuro-Fuzzy Synergism to Intelligent Systems. Prentice Hall, Englewood Cliffs (1996)"},{"key":"4_CR12","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1126\/science.267326","volume":"197","author":"M.C. Mackey","year":"1977","unstructured":"Mackey, M.C., Glass, L.: Oscillation and chaos in physiological control systems. Science\u00a0197, 287\u2013289 (1977)","journal-title":"Science"},{"key":"4_CR13","doi-asserted-by":"publisher","first-page":"1585","DOI":"10.1049\/piee.1974.0328","volume":"121","author":"E.H. Mamdani","year":"1974","unstructured":"Mamdani, E.H., Assilian, S.: Applications of fuzzy algorithms for control of simple dynamic plant. Proc. Inst. Elec. Eng.\u00a0121, 1585\u20131588 (1974)","journal-title":"Proc. Inst. Elec. Eng."},{"key":"4_CR14","first-page":"1","volume":"21","author":"A.W. Moore","year":"1995","unstructured":"Moore, A.W., Atkeson, C.G.: The parti-game algorithm for variable resolution reinforcement learning in multidimensional state-spaces. Machine Learning\u00a021, 1\u201336 (1995)","journal-title":"Machine Learning"},{"key":"4_CR15","volume-title":"Reinforcement learning: An introduction","author":"R.S. Sutton","year":"1998","unstructured":"Sutton, R.S., Barto, A.G.: Reinforcement learning: An introduction. MIT Press, Cambridge (1998)"},{"key":"4_CR16","first-page":"1057","volume-title":"Advances in Neural Information Processing Systems","author":"R.S. Sutton","year":"1999","unstructured":"Sutton, R.S., McAllester, D., Singh, S., Mansour, Y.: Policy gradient methods for reinforcement learning with function approximation. In: Advances in Neural Information Processing Systems, Cambridge, MA, vol.\u00a012, pp. 1057\u20131063. MIT Press, Cambridge (1999)"},{"key":"4_CR17","doi-asserted-by":"crossref","first-page":"116","DOI":"10.1109\/TSMC.1985.6313399","volume":"15","author":"T. Takagi","year":"1985","unstructured":"Takagi, T., Sugeno, M.: Fuzzy identification of systems and its application to modeling and control. IEEE Trans on Syst., Man, Cybern.\u00a015, 116\u2013132 (1985)","journal-title":"IEEE Trans on Syst., Man, Cybern."},{"issue":"5","key":"4_CR18","doi-asserted-by":"publisher","first-page":"797","DOI":"10.1109\/3477.956041","volume":"31","author":"S.G. Tzafestas","year":"2001","unstructured":"Tzafestas, S.G., Zikidis, K.C.: NeuroFAST: On-line neuro-fuzzy ART-based structure and parameter learning TSK model. IEEE Trans on Syst., Man, Cybern.\u00a031(5), 797\u2013802 (2001)","journal-title":"IEEE Trans on Syst., Man, Cybern."},{"key":"4_CR19","unstructured":"Tzafestas, S.G., Zikidis, K.C.: High Accuracy Neuro \u2013 Fuzzy Modeling. In: IEEE Int. Conf. on Artificial Intelligence Systems (IEEE ICAIS 2002), Divnomorskoe, Russia (2002)"},{"key":"4_CR20","first-page":"229","volume":"8","author":"R.J. Williams","year":"1992","unstructured":"Williams, R.J.: Simple statistical gradient-following algorithms for connectionist reinforcement learning. Machine Learning\u00a08, 229\u2013256 (1992)","journal-title":"Machine Learning"},{"key":"4_CR21","unstructured":"Zikidis, K.C., Tzafestas, S.G.: Adaptive neuro-fuzzy modeling applied to policy gradient reinforcement learning. In: 5th Hellenic European Conference on Computer Mathematics & its Applications (HERCMA 2001), Athens, Greece (2001)"}],"container-title":["Lecture Notes in Computer Science","Knowledge-Based Intelligent Information and Engineering Systems"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-45226-3_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,7]],"date-time":"2019-06-07T18:53:04Z","timestamp":1559933584000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-45226-3_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2003]]},"ISBN":["9783540408048","9783540452263"],"references-count":21,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-45226-3_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2003]]}}}