{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T04:45:38Z","timestamp":1742964338288,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":17,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540421443"},{"type":"electronic","value":"9783540451532"}],"license":[{"start":{"date-parts":[[2001,1,1]],"date-time":"2001-01-01T00:00:00Z","timestamp":978307200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2001]]},"DOI":"10.1007\/3-540-45153-6_11","type":"book-chapter","created":{"date-parts":[[2007,11,13]],"date-time":"2007-11-13T20:24:20Z","timestamp":1194985460000},"page":"111-120","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Imitation and Reinforcement Learning in Agents with Heterogeneous Actions"],"prefix":"10.1007","author":[{"given":"Bob","family":"Price","sequence":"first","affiliation":[]},{"given":"Craig","family":"Boutilier","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2001,5,16]]},"reference":[{"key":"11_CR1","unstructured":"Wei Zhang and Thomas G. Dietterich. A reinforcement learning approach to job-shop scheduling. In IJCAI-95, pages 1114\u20131120, Montreal, 1995."},{"key":"11_CR2","unstructured":"Justin A. Boyan and Andrew W. Moore. Learning evaluation functions for global optimization and boolean satisfiability. In AAAI-98, pages 3\u201310, July 26-30, 1998, Madison, Wisconsin, 1998."},{"key":"11_CR3","unstructured":"Bob Price and Craig Boutilier. Implicit imitation in multiagent reinforcement learning. In ICML-99, pages 325\u2013334, Bled, SI, 1999."},{"key":"11_CR4","unstructured":"Paul Bakker and Yasuo Kuniyoshi. Robot see, robot do: An overview of robot imitation. In AISB96 Workshop on Learning in Robots and Animals, pages 3\u201311, Brighton,UK, 1996."},{"key":"11_CR5","unstructured":"C. G. Atkeson and S. Schaal. Robot learning from demonstration. In ICML-97, pages 12\u201320, Nashville, TN, 1997."},{"key":"11_CR6","doi-asserted-by":"crossref","unstructured":"Aude Billard and Gillian Hayes. Learning to communicate through imitation in autonomous robots. In ICANN-97, pages 763-68, Lausanne, Switzerland, 1997.","DOI":"10.1007\/BFb0020246"},{"key":"11_CR7","series-title":"Technical Report DAI","volume-title":"A robot controller using learning by imitation","author":"G. M. Hayes","year":"1994","unstructured":"G. M. Hayes and J. Demiris. A robot controller using learning by imitation. Technical Report DAI No. 676, University of Edinburgh. Dept. of Artificial Intelligence, 1994."},{"issue":"6","key":"11_CR8","doi-asserted-by":"publisher","first-page":"799","DOI":"10.1109\/70.338535","volume":"10","author":"Y. Kuniyoshi","year":"1994","unstructured":"Yasuo Kuniyoshi, Masayuki Inaba, and Hirochika Inoue. Learning by watching: Extracting reusable task knowledge from visual observation of human performance. IEEE Transactions on Robotics and Automation, 10(6):799\u2013822, 1994.","journal-title":"IEEE Transactions on Robotics and Automation"},{"key":"11_CR9","first-page":"573","volume-title":"IJCAI-85","author":"T. M. Mitchell","year":"1985","unstructured":"T. M. Mitchell, S. Mahadevan, and L. Steinberg. LEAP: A learning apprentice for VLSI design. In IJCAI-85, pages 573\u2013580, Los Altos, California, 1985. Morgan Kaufmann Publishers, Inc."},{"key":"11_CR10","first-page":"596","volume-title":"AAAI-91","author":"P. E. Utgoff","year":"1991","unstructured":"Paul E. Utgoff and Jeffrey A. Clouse. Two kinds of training information for evaluation function learning. In AAAI-91, pages 596\u2013600, Anaheim, CA, 1991. AAAI Press."},{"key":"11_CR11","unstructured":"Chrystopher Nehaniv and Kerstin Dautenhahn. Mapping between dissimilar bodies: Affordances and the algebraic foundations of imitation. In EWLR-98, pages 64\u201372, Edinburgh, 1998."},{"key":"11_CR12","unstructured":"Dorian \u0160uc and Ivan Bratko. Skill reconstruction as induction of LQ controllers with subgoals. In IJCAI-97, pages 914\u2013919, Nagoya, 1997."},{"key":"11_CR13","doi-asserted-by":"crossref","unstructured":"Maja J. Mataric, Matthew Williamson, John Demiris, and Aswath Mohan. Behaviour-based primitives for articulated control. In SAB-98, pages 165\u2013170, Zurich, 1998.","DOI":"10.7551\/mitpress\/3119.003.0026"},{"issue":"1","key":"11_CR14","first-page":"103-30","volume":"13","author":"A. W. Moore","year":"1993","unstructured":"Andrew W. Moore and Christopher G. Atkeson. Prioritized sweeping: Reinforcement learning with less data and less real time. Machine Learning, 13(1):103-30, 1993.","journal-title":"Machine Learning"},{"key":"11_CR15","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/4168.001.0001","volume-title":"Learning in Embedded Systems","author":"L. P. Kaelbling","year":"1993","unstructured":"Leslie Pack Kaelbling. Learning in Embedded Systems. MIT Press, Cambridge,MA, 1993."},{"key":"11_CR16","doi-asserted-by":"crossref","DOI":"10.1002\/9780470316641","volume-title":"Multivariate Observations","author":"G. A. F. Seber","year":"1984","unstructured":"George A. F. Seber. Multivariate Observations. Wiley, New York, 1984."},{"key":"11_CR17","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1016\/0378-3758(93)90105-F","volume":"36","author":"J. Mi","year":"1993","unstructured":"J. Mi and Allan R. Sampson. A comparison of the Bonferroni and Scheff\u00e9 bounds. Journal of Statistical Planning and Inference, 36:101\u2013105, 1993.","journal-title":"Journal of Statistical Planning and Inference"}],"container-title":["Lecture Notes in Computer Science","Advances in Artificial Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/3-540-45153-6_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,2,19]],"date-time":"2024-02-19T00:37:34Z","timestamp":1708303054000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/3-540-45153-6_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2001]]},"ISBN":["9783540421443","9783540451532"],"references-count":17,"URL":"https:\/\/doi.org\/10.1007\/3-540-45153-6_11","relation":{},"ISSN":["0302-9743"],"issn-type":[{"type":"print","value":"0302-9743"}],"subject":[],"published":{"date-parts":[[2001]]},"assertion":[{"value":"16 May 2001","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}