{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T02:35:18Z","timestamp":1774492518372,"version":"3.50.1"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"2-4","license":[{"start":{"date-parts":[[1998,10,1]],"date-time":"1998-10-01T00:00:00Z","timestamp":907200000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[1998,10,1]],"date-time":"1998-10-01T00:00:00Z","timestamp":907200000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Journal of Intelligent and Robotic Systems"],"published-print":{"date-parts":[[1998,10]]},"DOI":"10.1023\/a:1008083631190","type":"journal-article","created":{"date-parts":[[2002,12,22]],"date-time":"2002-12-22T12:45:23Z","timestamp":1040561123000},"page":"165-182","source":"Crossref","is-referenced-by-count":16,"title":["Reinforcement Learning and Robust Control for Robot Compliance Tasks"],"prefix":"10.1007","volume":"23","author":[{"given":"Cheng-Peng","family":"Kuan","sequence":"first","affiliation":[]},{"given":"Kuu-young","family":"Young","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"issue":"5","key":"165962_CR1","doi-asserted-by":"crossref","first-page":"549","DOI":"10.1109\/56.20440","volume":"4","author":"R. J. Anderson","year":"1988","unstructured":"Anderson, R. J. and Spong, M. W.: Hybrid impedance control of robotic manipulators, IEEE J. Robotics Automat.\n4(5) (1988), 549\u2013556.","journal-title":"IEEE J. Robotics Automat."},{"key":"165962_CR2","unstructured":"Asada, H. and Asari, Y.: The direct teaching of tool manipulation skills via the impedance identification of human motions, in: IEEE Int. Conf. on Robotics and Automation, 1988, pp. 1269\u20131274."},{"issue":"2","key":"165962_CR3","doi-asserted-by":"crossref","first-page":"166","DOI":"10.1109\/70.88037","volume":"5","author":"H. Asada","year":"1989","unstructured":"Asada, H. and Izumi, H.: Automatic program generation from teaching data for the hybrid control of robots, IEEE Trans. Robotics Automat.\n5(2) (1989), 166\u2013173.","journal-title":"IEEE Trans. Robotics Automat."},{"key":"165962_CR4","doi-asserted-by":"crossref","unstructured":"Asada, H. and Liu, S.: Transfer of human skills to neural net robot controllers, in: IEEE Int. Conf. on Robotics and Automation, 1991, pp. 2442\u20132448.","DOI":"10.1109\/ROBOT.1991.131990"},{"key":"165962_CR5","first-page":"469","volume-title":"Handbook of Intelligent Control","author":"A. G. Barto","year":"1992","unstructured":"Barto, A. G.: Reinforcement learning and adaptive critic methods, in: White and Sofge (eds), Handbook of Intelligent Control, Van Nostrand Reinhold, New York, 1992, pp. 469\u2013491."},{"key":"165962_CR6","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4612-0957-7","volume-title":"Linear System Theory","author":"F. Callier","year":"1991","unstructured":"Callier, F. and Desoer, C.: Linear System Theory, Springer, New York, 1991."},{"issue":"4","key":"165962_CR7","doi-asserted-by":"crossref","first-page":"361","DOI":"10.1109\/70.246048","volume":"9","author":"S. Chiaverini","year":"1993","unstructured":"Chiaverini, S. and Sciavicco, L.: The parallel approach to force\/position control of robotic manipulators, IEEE Trans. Robotics Automat.\n9(4) (1993), 361\u2013373.","journal-title":"IEEE Trans. Robotics Automat."},{"key":"165962_CR8","unstructured":"De Schutter, J. and Leysen, J.: Tracking in compliant robot motion: Automatic generation of the task frame trajectory based on observation of the natural constraints, in: Int. Symp. of Robotics Research, 1987, pp. 215\u2013223."},{"issue":"1","key":"165962_CR9","doi-asserted-by":"crossref","first-page":"13","DOI":"10.1109\/37.257890","volume":"14","author":"V. Gullapalli","year":"1994","unstructured":"Gullapalli, V., Franklin, J. A., and Benbrahim, H.: Acquiring robot skills via reinforcement learning, IEEE Control Systems Magazine\n14(1) (1994), 13\u201324.","journal-title":"IEEE Control Systems Magazine"},{"key":"165962_CR10","volume-title":"Neural Networks: A Comprehensive Foundation","author":"S. Haykin","year":"1994","unstructured":"Haykin, S.: Neural Networks: A Comprehensive Foundation, Macmillan, New York, 1994."},{"key":"165962_CR11","doi-asserted-by":"crossref","unstructured":"Hirzinger, G. and Landzettel, K.: Sensory feedback structures for robots with supervised learning, in: IEEE Int. Conf. on Robotics and Automation, 1985, pp. 627\u2013635.","DOI":"10.1109\/ROBOT.1985.1087345"},{"key":"165962_CR12","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1115\/1.3140702","volume":"107","author":"N. Hogan","year":"1985","unstructured":"Hogan, N.: Impedance control: An approach to manipulation. Part I: Theory; Part II: Implementation; Part III: Application, ASME J. Dyn. Systems Meas. Control\n107 (1985), 1\u201324.","journal-title":"ASME J. Dyn. Systems Meas. Control"},{"key":"165962_CR13","doi-asserted-by":"crossref","first-page":"354","DOI":"10.1115\/1.3143806","volume":"108","author":"H. Kazerooni","year":"1986","unstructured":"Kazerooni, H., Bausch, J. J., and Kramer, B.: An approach to automated deburring by robot manipulators, ASME J. Dyn. Systems Meas. Control\n108 (1986), 354\u2013359.","journal-title":"ASME J. Dyn. Systems Meas. Control"},{"issue":"2","key":"165962_CR14","doi-asserted-by":"crossref","first-page":"83","DOI":"10.1109\/JRA.1986.1087045","volume":"2","author":"H. Kazerooni","year":"1986","unstructured":"Kazerooni, H., Sheridan, T. B., and Houpt, P. K.: Robust compliant motion for manipulators. Part I: The fundamental concepts of compliant motion. Part II: Design method, IEEE J. Robotics Automat.\n2(2) (1986), 83\u2013105.","journal-title":"IEEE J. Robotics Automat."},{"issue":"1","key":"165962_CR15","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1109\/JRA.1987.1087068","volume":"3","author":"O. Khatib","year":"1987","unstructured":"Khatib, O.: A unified approach for motion and force control of robot manipulators: The operational space formulation, IEEE J. Robotics Automat.\n3(1) (1987), 43\u201353.","journal-title":"IEEE J. Robotics Automat."},{"issue":"6","key":"165962_CR16","doi-asserted-by":"crossref","first-page":"799","DOI":"10.1109\/70.338535","volume":"10","author":"Y. Kuniyoshi","year":"1994","unstructured":"Kuniyoshi, Y., Inaba, M., and Inoue, H.: Learning by watching: extracting reusable task knowledge from visual observation of human performance, IEEE Trans. Robotics Automat.\n10(6) (1994), 799\u2013822.","journal-title":"IEEE Trans. Robotics Automat."},{"key":"165962_CR17","doi-asserted-by":"crossref","unstructured":"Lee, S. and Lee, H. S.: Intelligent control of manipulators interacting with an uncertain environment based on generalized impedance, in: IEEE Int. Symp. on Intelligent Control, 1991, pp. 61\u201366.","DOI":"10.1109\/ISIC.1991.187334"},{"issue":"1","key":"165962_CR18","doi-asserted-by":"crossref","first-page":"3","DOI":"10.1177\/027836498400300101","volume":"3","author":"T. Lozano-Perez","year":"1984","unstructured":"Lozano-Perez, T., Mason, M. T., and Taylor, R. H.: Automatic synthesis of fine-motion strategies for robots, Internat. J. Robotics Res.\n3(1) (1984), 3\u201324.","journal-title":"Internat. J. Robotics Res."},{"issue":"3","key":"165962_CR19","doi-asserted-by":"crossref","first-page":"408","DOI":"10.1109\/70.88152","volume":"7","author":"W.-S. Lu","year":"1991","unstructured":"Lu, W.-S. and Meng, Q.-H.: Impedance control with adaptation for robotic manipulations, IEEE Trans. Robotics Automat.\n7(3) (1991), 408\u2013415.","journal-title":"IEEE Trans. Robotics Automat."},{"issue":"5","key":"165962_CR20","doi-asserted-by":"crossref","first-page":"754","DOI":"10.1109\/70.466608","volume":"11","author":"Z. Lu","year":"1995","unstructured":"Lu, Z., Kawamura, S., and Goldenberg, A. A.: An approach to sliding mode-based impedance control, IEEE Trans. Robotics Automat.\n11(5) (1995), 754\u2013759.","journal-title":"IEEE Trans. Robotics Automat."},{"issue":"5","key":"165962_CR21","doi-asserted-by":"crossref","first-page":"971","DOI":"10.1109\/21.120050","volume":"21","author":"V. Lumelsky","year":"1991","unstructured":"Lumelsky, V.: On human performance in telerobotics, IEEE Trans. Systems Man Cybernet.\n21(5) (1991), 971\u2013982.","journal-title":"IEEE Trans. Systems Man Cybernet."},{"issue":"6","key":"165962_CR22","doi-asserted-by":"crossref","first-page":"418","DOI":"10.1109\/TSMC.1981.4308708","volume":"11","author":"M. T. Mason","year":"1981","unstructured":"Mason, M. T.: Compliance and force control for computer controlled manipulators, IEEE Trans. Systems Man Cybernet.\n11(6) (1981), 418\u2013432.","journal-title":"IEEE Trans. Systems Man Cybernet."},{"key":"165962_CR23","doi-asserted-by":"crossref","first-page":"126","DOI":"10.1115\/1.3139652","volume":"102","author":"M. H. Raibert","year":"1981","unstructured":"Raibert, M. H. and Craig, J. J.: Hybrid position\/force control of manipulators, ASME J. Dyn. Systems Meas. Control\n102 (1981), 126\u2013133.","journal-title":"ASME J. Dyn. Systems Meas. Control"},{"key":"165962_CR24","volume-title":"Motor Control and Learning: A Behavioral Emphasis","author":"R. A. Schmidt","year":"1988","unstructured":"Schmidt, R. A.: Motor Control and Learning: A Behavioral Emphasis, Human Kinetics Publishers, Champaign, IL, 1988."},{"issue":"2","key":"165962_CR25","doi-asserted-by":"crossref","first-page":"421","DOI":"10.1080\/00207178408933284","volume":"40","author":"J. E. Slotine","year":"1984","unstructured":"Slotine, J.-J. E.: Sliding controller design for nonlinear systems, Internat. J. Control\n40(2) (1984), 421\u2013434.","journal-title":"Internat. J. Control"},{"issue":"2","key":"165962_CR26","doi-asserted-by":"crossref","first-page":"19","DOI":"10.1109\/37.126844","volume":"12","author":"R. S. Sutton","year":"1992","unstructured":"Sutton, R. S., Barto, A. G., and Williams, R. J.: Reinforcement learning is direct adaptive optimal control, IEEE Control Systems Magazine\n12(2) (1992), 19\u201322.","journal-title":"IEEE Control Systems Magazine"},{"issue":"3","key":"165962_CR27","doi-asserted-by":"crossref","first-page":"365","DOI":"10.1109\/9.73573","volume":"36","author":"J. T. Wen","year":"1991","unstructured":"Wen, J. T. and Murphy, S.: Stability analysis of position and force control for robot arms, IEEE Trans. Automat. Control\n36(3) (1991), 365\u2013371.","journal-title":"IEEE Trans. Automat. Control"},{"issue":"7","key":"165962_CR28","doi-asserted-by":"crossref","first-page":"1065","DOI":"10.1109\/21.297797","volume":"24","author":"C. H. Wu","year":"1994","unstructured":"Wu, C. H. and Kim, M. G.: Modeling of part-mating strategies for automating assembly operations for robots, IEEE Trans. Systems Man Cybernet.\n24(7) (1994), 1065\u20131074.","journal-title":"IEEE Trans. Systems Man Cybernet."},{"issue":"5","key":"165962_CR29","doi-asserted-by":"crossref","first-page":"621","DOI":"10.1109\/70.326567","volume":"10","author":"T. Yang","year":"1994","unstructured":"Yang, T., Xu, Y., and Chen, C. S.: Hidden Markov model approach to skill learning and its application to telerobotics, IEEE Trans. Robotics Automat.\n10(5) (1994), 621\u2013631.","journal-title":"IEEE Trans. Robotics Automat."},{"issue":"2","key":"165962_CR30","doi-asserted-by":"crossref","first-page":"220","DOI":"10.1109\/70.238286","volume":"9","author":"T. Yoshikawa","year":"1993","unstructured":"Yoshikawa, T. and Sudou, A.: Dynamic hybrid position\/force control of robot manipulators \u2014 On-line estimation of unknown constraint, IEEE J. Robotics Automat.\n9(2) (1993), 220\u2013226.","journal-title":"IEEE J. Robotics Automat."}],"container-title":["Journal of Intelligent and Robotic Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1023\/A:1008083631190.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1023\/A:1008083631190\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1023\/A:1008083631190.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,6]],"date-time":"2025-06-06T14:32:46Z","timestamp":1749220366000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1023\/A:1008083631190"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[1998,10]]},"references-count":30,"journal-issue":{"issue":"2-4","published-print":{"date-parts":[[1998,10]]}},"alternative-id":["165962"],"URL":"https:\/\/doi.org\/10.1023\/a:1008083631190","relation":{},"ISSN":["0921-0296","1573-0409"],"issn-type":[{"value":"0921-0296","type":"print"},{"value":"1573-0409","type":"electronic"}],"subject":[],"published":{"date-parts":[[1998,10]]}}}