{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,15]],"date-time":"2025-08-15T00:17:39Z","timestamp":1755217059686,"version":"3.43.0"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2003,9,1]],"date-time":"2003-09-01T00:00:00Z","timestamp":1062374400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2003,9,1]],"date-time":"2003-09-01T00:00:00Z","timestamp":1062374400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Fuzzy Optimization and Decision Making"],"published-print":{"date-parts":[[2003,9]]},"DOI":"10.1023\/a:1025059919437","type":"journal-article","created":{"date-parts":[[2003,9,16]],"date-time":"2003-09-16T18:24:47Z","timestamp":1063736687000},"page":"183-213","source":"Crossref","is-referenced-by-count":1,"title":["Application of a Near-Optimal Reinforcement Learning Controller to a Robotics Problem in Manufacturing: A Hybrid Approach"],"prefix":"10.1007","volume":"2","author":[{"suffix":"II","given":"Warren E.","family":"Hearnes","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Augustine O.","family":"Esogbue","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"issue":"1\u20134","key":"5141907_CR1","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1016\/0360-8352(92)90060-W","volume":"23","author":"A. Bahrami","year":"1992","unstructured":"Bahrami, A. and C. Dagli. (1992). \u201cNatural Intelligence in Design and Manufacturing,\u201d Computers and Industrial Engineering 23(1\u20134), 45\u201348.","journal-title":"Computers and Industrial Engineering"},{"issue":"5","key":"5141907_CR2","doi-asserted-by":"crossref","first-page":"834","DOI":"10.1109\/TSMC.1983.6313077","volume":"13","author":"A. Barto","year":"1983","unstructured":"Barto, A., R. Sutton, and C. Anderson. (1983). \u201cNeuronlike Adaptive Elements that Can Solve Difficult Learning Control Problems,\u201d IEEE Transactions on Systems, Man, and Cybernetics SMC-13(5), 834\u2013846.","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics"},{"issue":"1\u20132","key":"5141907_CR3","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1016\/0004-3702(94)00011-O","volume":"72","author":"A. Barto","year":"1995","unstructured":"Barto, A., S. Bradtke, and S. Singh. (1995). \u201cLearning to Act Using Real-Time Dynamic Programming,\u201d Artificial Intelligence 72(1\u20132), 81\u2013138.","journal-title":"Artificial Intelligence"},{"key":"5141907_CR4","volume-title":"Dynamic Programming","author":"R. Bellman","year":"1957","unstructured":"Bellman, R. (1957). Dynamic Programming. Princeton, NJ: Princeton University Press."},{"key":"5141907_CR5","doi-asserted-by":"crossref","DOI":"10.1515\/9781400874668","volume-title":"Adaptive Control Processes: A Guided Tour","author":"R. Bellman","year":"1961","unstructured":"Bellman, R. (1961). Adaptive Control Processes: A Guided Tour. Princeton, NJ: Princeton University Press."},{"key":"5141907_CR6","doi-asserted-by":"crossref","DOI":"10.1515\/9781400874651","volume-title":"Applied Dynamic Programming","author":"R. Bellman","year":"1962","unstructured":"Bellman, R. and S. Dreyfus. (1962). Applied Dynamic Programming. Princeton, NJ: Princeton University Press."},{"key":"5141907_CR7","doi-asserted-by":"crossref","unstructured":"Berenji, H. (1994). \u201cFuzzy Q-Learning: A New Approach for Fuzzy Dynamic Programming,\u201d In Proceedings of the Third IEEE Conference on Fuzzy Systems. Orlando, FL, 486\u2013491.","DOI":"10.1109\/FUZZY.1994.343737"},{"issue":"5","key":"5141907_CR8","doi-asserted-by":"crossref","first-page":"724","DOI":"10.1109\/72.159061","volume":"3","author":"H. Berenji","year":"1992","unstructured":"Berenji, H. and P. Khedkar. (1992). \u201cLearning and Tuning Fuzzy Logic Controllers through Reinforcements,\u201d IEEE Transactions on Neural Networks 3(5), 724\u2013740.","journal-title":"IEEE Transactions on Neural Networks"},{"key":"5141907_CR9","first-page":"622","volume":"1","author":"H. Berenji","year":"1998","unstructured":"Berenji, H. and S. Saraf. (1998). \u201cCompetition and Collaboration Among Fuzzy Reinforcement Learning Agents,\u201d In Proceedings of the (1998) IEEE International Conference on Fuzzy Systems. Anchorage, AK, 1, 622\u2013627.","journal-title":"Proceedings of the (1998) IEEE International Conference on Fuzzy Systems. Anchorage, AK"},{"key":"5141907_CR10","volume-title":"Neuro-Dynamic Programming","author":"D. Bertsekas","year":"1996","unstructured":"Bertsekas, D. and J. Tsitsiklis. (1996). Neuro-Dynamic Programming. Belmont, MA: Athena Scientific."},{"key":"5141907_CR11","first-page":"257","volume":"62","author":"A. Boschitsch","year":"1986","unstructured":"Boschitsch, A. and O. Bendiksen. (1986). \u201cNonlinear Control Laws For Tethered Satellites,\u201d Advances in Astronautical Sciences 62, 257\u2013276.","journal-title":"Advances in Astronautical Sciences"},{"key":"5141907_CR12","doi-asserted-by":"crossref","unstructured":"Esogbue, A. and W. Hearnes. (1994). \u201cConstructive Experiments with a New Fuzzy Adaptive Controller,\u201d In Proceedings of the (1994) NAFIPS\/IFIS\/NASA\/ Conference. San Antonio, TX, 377\u2013380.","DOI":"10.1109\/IJCF.1994.375085"},{"issue":"2","key":"5141907_CR13","doi-asserted-by":"crossref","first-page":"121","DOI":"10.1023\/A:1022685208277","volume":"1","author":"A. Esogbue","year":"1999","unstructured":"Esogbue, A. and W. Hearnes. (1999). \u201cA Learning Algorithm for the Control of Continuous Action Space Set-Point Regulator Systems,\u201d Journal of Computational Analysis and Applications 1(2), 121\u2013145.","journal-title":"Journal of Computational Analysis and Applications"},{"key":"5141907_CR14","doi-asserted-by":"crossref","unstructured":"Esogbue, A. and J. Murrell. (1993a). \u201cA Fuzzy Adaptive Controller Using Reinforcement Learning Neural Networks,\u201d In Proceedings of Second IEEE International Conference on Fuzzy Systems, 178\u2013183.","DOI":"10.1109\/FUZZY.1993.327494"},{"key":"5141907_CR15","unstructured":"Esogbue, A. and J. Murrell. (1993b). \u201cOptimization of a Fuzzy Adaptive Network for Control Applications,\u201d In Proceedings of the Fifth International Fuzzy Systems Association World Congress. Seoul, Korea, 1346\u20131349."},{"issue":"9\u201310","key":"5141907_CR16","doi-asserted-by":"crossref","first-page":"29","DOI":"10.1016\/0898-1221(94)90120-1","volume":"27","author":"A. Esogbue","year":"1994","unstructured":"Esogbue, A. and J. Murrell. (1994). \u201cAdvances in Fuzzy Adaptive Control,\u201d Computers & Mathematics with Applications 27(9\u201310), 29\u201335.","journal-title":"Computers & Mathematics with Applications"},{"key":"5141907_CR17","first-page":"699","volume":"II","author":"A. Esogbue","year":"1995","unstructured":"Esogbue, A., Q. Song, and W. Hearnes. (1995). \u201cApplication of a Self-Learning Fuzzy-Neuro Controller to the Power System Stabilization Problem,\u201d In Proceedings of the (1995) World Congress on Neural Networks. Washington, DC, II, 699\u2013702.","journal-title":"Proceedings of the (1995) World Congress on Neural Networks. Washington, DC"},{"key":"5141907_CR18","unstructured":"Hearnes, W. (1999). \u201cNear-Optimal Intelligent Control for Continuous Set-Point Regulator Problems via Approximate Dynamic Programming,\u201d Ph.d. thesis, School of Industrial and Systems Engineering, Georgia Institute of Technology, Atlanta, GA."},{"key":"5141907_CR19","doi-asserted-by":"crossref","unstructured":"Kaelbling, L., M. Littman, and A. Moore. (1996). \u201cReinforcement Learning: A Survey,\u201d Journal of Artificial Intelligence Research 4.","DOI":"10.1613\/jair.301"},{"issue":"6","key":"5141907_CR20","doi-asserted-by":"crossref","first-page":"1531","DOI":"10.1109\/72.641474","volume":"8","author":"R. Kandadai","year":"1997","unstructured":"Kandadai, R. and J. Tien. (1997). \u201cA Knowledge-Base Generating Heirarchical Fuzzy-Neural Controller,\u201d IEEE Transactions on Neural Networks 8(6), 1531\u20131541.","journal-title":"IEEE Transactions on Neural Networks"},{"key":"5141907_CR21","first-page":"313","volume-title":"Theoretical Aspects of Fuzzy Control","author":"B. Kosko","year":"1995","unstructured":"Kosko, B. and J. Dickerson. (1995). \u201cFunction Approximation with Additive Fuzzy Systems,\u201d In H. Nguyen, M. Sugeno, R. Tong, and R. Yager (eds.), Theoretical Aspects of Fuzzy Control. New York: John Wiley & Sons, Chapt. 12, 313\u2013347."},{"key":"5141907_CR22","doi-asserted-by":"crossref","first-page":"365","DOI":"10.1007\/BF00123657","volume":"5","author":"I. Kouatli","year":"1994","unstructured":"Kouatli, I. (1994). \u201cA Simplified Fuzzy Multivariable Structure in a Manufacturing Environment,\u201d Journal of Intelligent Manufacturing 5, 365\u2013387.","journal-title":"Journal of Intelligent Manufacturing"},{"key":"5141907_CR23","doi-asserted-by":"crossref","first-page":"53","DOI":"10.1016\/B978-0-12-568150-6.50009-X","volume-title":"Dynamic Programming and Its Applications","author":"T. Morin","year":"1978","unstructured":"Morin, T. (1978). \u201cComputational Advances in Dynamic Programming,\u201d In M. Puterman (ed), Dynamic Programming and Its Applications. New York: Academic Press, 53\u201390."},{"key":"5141907_CR24","unstructured":"Murrell, J. A. (1993). \u201cA Statistical Fuzzy Associative Learning Approach To Intelligent Control,\u201d Ph.D. thesis, School of Industrial and Systems Engineering, Georgia Institute of Technology, Atlanta, GA."},{"key":"5141907_CR25","unstructured":"Oh, C.-H., T. Nakashima, and H. Ishibuchi. (1998). \u201cInitialization of Q-Values by Fuzzy Rules for Accelerating Q-Learning,\u201d In Proceedings of the (1998) IEEE International Joint Conference on Neural Networks. Anchorage, AK, 2051\u20132056."},{"key":"5141907_CR26","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1023\/A:1022633531479","volume":"3","author":"R. Sutton","year":"1988","unstructured":"Sutton, R. (1988). \u201cLearning to Predict by the Method of Temporal Differences,\u201d Machine Learning 3, 9\u201344.","journal-title":"Machine Learning"},{"key":"5141907_CR27","unstructured":"Watkins, C. (1989). \u201cLearning from Delayed Rewards,\u201d Ph.d. thesis, Cambridge University, Cambridge, England."},{"key":"5141907_CR28","first-page":"279","volume":"8","author":"C. Watkins","year":"1992","unstructured":"Watkins, C. and P. Dayan. (1992). \u201cQ-Learning,\u201d Machine Learning 8, 279\u2013292.","journal-title":"Machine Learning"},{"issue":"1","key":"5141907_CR29","doi-asserted-by":"crossref","first-page":"105","DOI":"10.1023\/A:1007562800292","volume":"33","author":"M. Wiering","year":"1998","unstructured":"Wiering, M. and J. Schmidhuber. (1998). \u201cFast Online Q(\u03bb), \u201d Machine Learning 33(1), 105\u2013115.","journal-title":"Machine Learning"},{"key":"5141907_CR30","unstructured":"Williams, R. and L. I. Baird. (1993). \u201cAnalysis of Some Incremental Variants of Policy Iteration: First Steps toward Understanding Actor-Critic Learning Systems,\u201d Technical Report NU-CCS-93-11, Boston, MA."}],"container-title":["Fuzzy Optimization and Decision Making"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1023\/A:1025059919437.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1023\/A:1025059919437\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1023\/A:1025059919437.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,5]],"date-time":"2025-08-05T04:21:49Z","timestamp":1754367709000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1023\/A:1025059919437"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2003,9]]},"references-count":30,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2003,9]]}},"alternative-id":["5141907"],"URL":"https:\/\/doi.org\/10.1023\/a:1025059919437","relation":{},"ISSN":["1568-4539","1573-2908"],"issn-type":[{"type":"print","value":"1568-4539"},{"type":"electronic","value":"1573-2908"}],"subject":[],"published":{"date-parts":[[2003,9]]}}}