{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,7,22]],"date-time":"2024-07-22T14:30:32Z","timestamp":1721658632578},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2012,10,4]],"date-time":"2012-10-04T00:00:00Z","timestamp":1349308800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Int J of Soc Robotics"],"published-print":{"date-parts":[[2013,1]]},"DOI":"10.1007\/s12369-012-0167-6","type":"journal-article","created":{"date-parts":[[2012,10,3]],"date-time":"2012-10-03T10:27:30Z","timestamp":1349260050000},"page":"53-73","source":"Crossref","is-referenced-by-count":2,"title":["Learning Macro Actions from Instructional Videos Through Integration of Multiple Modalities"],"prefix":"10.1007","volume":"5","author":[{"given":"David O.","family":"Johnson","sequence":"first","affiliation":[]},{"given":"Arvin","family":"Agah","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2012,10,4]]},"reference":[{"issue":"2","key":"167_CR1","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1109\/TSMCB.2006.886947","volume":"37","author":"A Alissandrakis","year":"2007","unstructured":"Alissandrakis A, Nehaniv C, Dautenhahn K (2007) Correspondence mapping induced state and action metrics for robotic imitation. IEEE Trans Syst Man Cybern, Part A, Syst Hum 37(2):299\u2013307. 2007","journal-title":"IEEE Trans Syst Man Cybern, Part A, Syst Hum"},{"key":"167_CR2","unstructured":"Bekey G, Ambrose R, Kumar V, Sanderson A, Wilcox B, Zheng\u00a0Y (2006) Final report. World Technology Evaluation Center, Inc. (WTEC) Panel on International, Assessment of Research and Development in Robotics, January 2006"},{"key":"167_CR3","volume-title":"Handbook of robotics","author":"A Billard","year":"2008","unstructured":"Billard A, Calinon S, Dillmann R, Schaal S (2008) Robot programming by demonstration. In: Siciliano B, Khatib O (eds) Handbook of robotics. Springer, Berlin. Chap.\u00a059"},{"key":"167_CR4","first-page":"708","volume-title":"Proceedings of IEEE\/RSJ international conference on intelligent robots and systems (IROS)","author":"C Breazeal","year":"2005","unstructured":"Breazeal C, Kidd C, Thomaz A, Hoffman G, Berlin M (2005) Effects of nonverbal communication on efficiency and robustness in human-robot teamwork. In: Proceedings of IEEE\/RSJ international conference on intelligent robots and systems (IROS), Edmonton, Alberta, Canada, 2\u20136\u00a0August 2005, pp\u00a0708\u2013713"},{"key":"167_CR5","first-page":"112","volume-title":"Proceedings of the ASER\u201903 1st international workshop on advances in service robotics","author":"G Bugmann","year":"2003","unstructured":"Bugmann G (2003) Challenges in verbal instruction of domestic robots. In: Proceedings of the ASER\u201903 1st international workshop on advances in service robotics, Bardolino, Italy, 13\u201315 March 2003, pp 112\u2013116"},{"key":"167_CR6","first-page":"96","volume-title":"Proceedings of the 8th international conference on intelligent autonomous systems (IAS-8)","author":"G Bugmann","year":"2004","unstructured":"Bugmann G, Klein E, Lauria S, Bos J, Kyriacou T (2004) Corpus-based robotics: a route instruction example. In: Proceedings of the 8th international conference on intelligent autonomous systems (IAS-8), Amsterdam, Netherlands, 10\u201313 March 2004, pp 96\u2013103."},{"key":"167_CR7","series-title":"Technical Report Series","volume-title":"Proceedings of the TIMR 01\u2014towards intelligent mobile robots","author":"G Bugmann","year":"2001","unstructured":"Bugmann G, Lauria S, Kyriacou T, Klein E, Bos J, Coventry K (2001) Using verbal instructions for route learning: instruction analysis. In: Proceedings of the TIMR 01\u2014towards intelligent mobile robots, Manchester, UK, 5 April 2001. Technical Report Series. Department of Computer Science, Manchester University. ISSN 1361-6161, Report number UMC-01-4-1"},{"key":"167_CR8","doi-asserted-by":"crossref","first-page":"105","DOI":"10.1145\/1102351.1102365","volume-title":"Proceedings of the 22nd international conference on machine learning","author":"S Calinon","year":"2005","unstructured":"Calinon S, Billard A (2005) Recognition and reproduction of gestures using a probabilistic framework combining PCA, ICA and HMM. In: Proceedings of the 22nd international conference on machine learning, Bonn, Germany, 7\u201311 August 2005, pp 105\u2013112"},{"key":"167_CR9","doi-asserted-by":"crossref","first-page":"299","DOI":"10.1109\/ROBOT.2005.1570135","volume-title":"Proceedings of the 2005 IEEE international conference on robotics and automation","author":"S Calinon","year":"2005","unstructured":"Calinon S, Guenter F, Billard A (2005) Goal-directed imitation in a humanoid robot. In: Proceedings of the 2005 IEEE international conference on robotics and automation, Barcelona, Spain, 18\u201322 April 2005, pp 299\u2013304"},{"key":"167_CR10","doi-asserted-by":"crossref","first-page":"2978","DOI":"10.1109\/ROBOT.2006.1642154","volume-title":"Proceedings of the 2006 IEEE international conference on robotics and automation","author":"S Calinon","year":"2006","unstructured":"Calinon S, Guenter F, Billard A (2006) On learning the statistical representation of a task and generalizing it to various contexts. In: Proceedings of the 2006 IEEE international conference on robotics and automation, Orlando, FL, USA, 15\u201319 May 2006, pp 2978\u20132983"},{"key":"167_CR11","doi-asserted-by":"crossref","unstructured":"Campbell M (2010) Towel-folding robot now on general sale. New scientist, 14 September 2010","DOI":"10.1016\/S0262-4079(10)63085-0"},{"key":"167_CR12","volume-title":"Natural, intelligent and effective interaction in multimodal dialogue systems","author":"J Chai","year":"2005","unstructured":"Chai J, Pan S, Zhou M (2005) MIND: a context-based multi-modal interpretation framework in conversational systems. In: Bernsen O, Dybkjaer L, van Kuppevelt J (eds) Natural, intelligent and effective interaction in multimodal dialogue systems. Kluwer Academic, Norwell"},{"key":"167_CR13","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1145\/1040830.1040850","volume-title":"Proceedings of the 10th international conference on intelligent user interfaces (IUI-05)","author":"J Chai","year":"2005","unstructured":"Chai J, Prasov Z, Blaim J, Jin R (2005) Linguistic theories in efficient multi-modal reference resolution: an empirical investigation. In: Proceedings of the 10th international conference on intelligent user interfaces (IUI-05), San Diego, CA, USA, 9\u201312 January 2005, pp 43\u201350"},{"key":"167_CR14","doi-asserted-by":"crossref","first-page":"475","DOI":"10.1109\/ICHR.2005.1573612","volume-title":"Proceeding of the IEEE-RAS international conference on humanoid robots","author":"P Dominey","year":"2005","unstructured":"Dominey P, Alvarez M, Gao B, Jeambrun M, Cheylus A, Weitzenfeld A, Martinez A, Medrano A (2005) Robot command, interrogation and teaching via social interaction. In: Proceeding of the IEEE-RAS international conference on humanoid robots, Tsukuba, Japan, 7 December 2005, pp 475\u2013480"},{"key":"167_CR15","unstructured":"Drumwright E (2007) The task matrix: a robot-independent framework for programming humanoids. PhD dissertation, Department of Computer Science, University of Southern, California, Los Angeles, CA, USA"},{"key":"167_CR16","doi-asserted-by":"crossref","first-page":"448","DOI":"10.1109\/ROBOT.2006.1641752","volume-title":"Proceedings of the 2006 IEEE international conference on robotics and automation","author":"E Drumwright","year":"2006","unstructured":"Drumwright E, Ng-Thow-Hing V (2006) The task matrix: an extensible framework for creating versatile humanoid robots. In: Proceedings of the 2006 IEEE international conference on robotics and automation, Orlando, Florida, USA, 15\u201319 May 2006, pp 448\u2013455"},{"key":"167_CR17","unstructured":"eHow.com Website, www.ehow.com"},{"key":"167_CR18","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1145\/958432.958455","volume-title":"Proceedings of the fifth international conference on multimodal interfaces (ICMI-PUI\u201903)","author":"F Flippo","year":"2003","unstructured":"Flippo F, Krebs A, Marsic I (2003) A framework for rapid development of multi-modal interfaces. In: Proceedings of the fifth international conference on multimodal interfaces (ICMI-PUI\u201903), Vancouver, Canada, 5\u20137 November 2003, pp 109\u2013116"},{"key":"167_CR19","unstructured":"Flippo F (2003) A natural human-computer interface for controlling wheeled robotic vehicles. Delft University of Technology, Department of Information Technology and Systems, Delft, Netherlands, August"},{"key":"167_CR20","unstructured":"Green, Severinson-Eklundh K (2001) Task-oriented dialogue for CERO: a user-centered approach. Royal Institute of Technology (KTH), Stockholm, Sweden"},{"key":"167_CR21","doi-asserted-by":"crossref","first-page":"4678","DOI":"10.1109\/IROS.2006.282256","volume-title":"Proceedings of the 2006 IEEE\/RSJ international conference on intelligent robots and systems","author":"A Green","year":"2006","unstructured":"Green A, Severinson-Eklundh K, Wrede B, Li S (2006) Integrating miscommunication analysis in natural language interface design for a service robot. In: Proceedings of the 2006 IEEE\/RSJ international conference on intelligent robots and systems, Beijing, China, 9\u201315 October 2006, pp 4678\u20134683"},{"key":"167_CR22","unstructured":"Hornyak T (2010) HRP-4 robot can strike a pose, pour drinks. Cnet news, 16 September 2010"},{"key":"167_CR23","first-page":"145","volume-title":"Proceedings of the 9th international conference on intelligent autonomous systems (IAS-9)","author":"T Inamura","year":"2006","unstructured":"Inamura T, Okadab K, Tokutsub S, Hataob N, Inabab M, Inoue\u00a0H (2006) HRP-2W: a humanoid platform for research on support behavior in daily life environments. In: Proceedings of the 9th international conference on intelligent autonomous systems (IAS-9), Tokyo, Japan, 7\u20139 March 2006, vol 57, pp 145\u2013154"},{"key":"167_CR24","doi-asserted-by":"crossref","first-page":"372","DOI":"10.1007\/3-540-36268-1_33","volume-title":"Experimental robotics VIII","author":"T Inamura","year":"2003","unstructured":"Inamura T, Toshima I, Nakamura Y (2003) Acquiring motion elements for bidirectional computation of motion recognition and generation. In: Siciliano B, Dario P (eds) Experimental robotics VIII, vol 5. Springer, Berlin, pp 372\u2013381"},{"key":"167_CR25","unstructured":"iRobot Corporation Website, www.irobot.com"},{"key":"167_CR26","unstructured":"Johnson DO (2008) Human robot interaction through semantic integration of multiple modalities, dialog management, and contexts. PhD dissertation, Department of Electrical Engineering and Computer Science, University of Kansas, Lawrence, KS, USA"},{"key":"167_CR27","author":"DO Johnson","year":"2009","unstructured":"Johnson DO, Agah A (2009) Human robot interaction through semantic integration of multiple modalities, dialog management, and contexts. Int J Soc Robot. September 2009. doi: 10.1007\/s12369-009-0028-0","journal-title":"Int J Soc Robot"},{"issue":"1","key":"167_CR28","first-page":"79","volume":"20","author":"DO Johnson","year":"2011","unstructured":"Johnson DO, Agah A (2011) A novel efficient algorithm for locating and tracking object parts in low resolution videos. Int J Intell Syst 20(1):79\u2013100. April\u00a02011. doi: 10.1515\/JISYS.2011.006","journal-title":"Int J Intell Syst"},{"key":"167_CR29","first-page":"95","volume-title":"Proceedings of the ICAI\u201911\u2014the 2011 international conference on artificial intelligence","author":"DO Johnson","year":"2011","unstructured":"Johnson DO, Agah A (2011) Recognition of Marker-less human actions in videos using hidden Markov models. In: Proceedings of the ICAI\u201911\u2014the 2011 international conference on artificial intelligence, Las Vegas, NV, USA, 18\u201321 July 2011, pp 95\u2013100"},{"issue":"2","key":"167_CR30","doi-asserted-by":"crossref","first-page":"114","DOI":"10.20965\/jaciii.2005.p0114","volume":"9","author":"H Kim","year":"2005","unstructured":"Kim H, Jung Y, Hwang Y (2005) Taxonomy of atomic actions for home-service robots. J Adv Comput Intell Intell Inform 9(2):114\u2013120","journal-title":"J Adv Comput Intell Intell Inform"},{"key":"167_CR31","unstructured":"Klingspor V, Demiris J, Kaiser M (1997) Human-robot-communication and machine learning. Universit\u00e4t Dortmund, Germany, University of Edinburgh, UK, Universit\u00e4t Karlsruhe, Germany"},{"key":"167_CR32","first-page":"74","volume-title":"Proceedings of the 9th European workshop on learning robots (EWLR-9)","author":"S Lauria","year":"2001","unstructured":"Lauria S, Bugmann G, Kyriacou T, Klein E (2001) Instruction based learning: how to instruct a personal robot to find HAL. In: Proceedings of the 9th European workshop on learning robots (EWLR-9), Prague, Czech Republic, 8\u20139 September 2001, pp 74\u201383"},{"key":"167_CR33","first-page":"528","volume-title":"Proceedings of the 2000 IEEE\/RSJ international conference on intelligent robots and systems","author":"L Lopes","year":"2000","unstructured":"Lopes L, Teixeira A (2000) Human-robot interaction through spoken language dialogue. In: Proceedings of the 2000 IEEE\/RSJ international conference on intelligent robots and systems, Takamatsu, Japan, 30 October\u20135 November 2000, pp 528\u2013534"},{"key":"167_CR34","doi-asserted-by":"crossref","first-page":"1150","DOI":"10.1109\/ICCV.1999.790410","volume-title":"Proceedings of the international conference on computer vision","author":"D Lowe","year":"1999","unstructured":"Lowe D (1999) Object recognition from local scale-invariant features. In: Proceedings of the international conference on computer vision, vol 2, pp 1150\u20131157"},{"key":"167_CR35","unstructured":"MacMahon M (2005) MARCO: a modular architecture for following route instructions. Department of Electrical and Computer Engineering, Intelligent Robotics Laboratory, University of Texas at Austin, Austin, TX, USA"},{"key":"167_CR36","unstructured":"The MATLAB image processing toolbox 6: (2009), MathWorks. www.mathworks.com"},{"key":"167_CR37","first-page":"32","volume-title":"Proceedings of the AAAI-05 workshop on modular construction of human-like intelligence","author":"N Mavridis","year":"2005","unstructured":"Mavridis N, Roy D (2005) Grounded situation models for robots: bridging language, perception, and action. In: Proceedings of the AAAI-05 workshop on modular construction of human-like intelligence, Pittsburgh, PA, USA, 10 July 2005, pp 32\u201339"},{"key":"167_CR38","unstructured":"Merriam-Webster Dictionary (2011) www.merriam-webster.com. Accessed 28 February 2011"},{"key":"167_CR39","unstructured":"National Institute of Technology and Standards (2009) The history of automatic speech recognition evaluations at NIST. http:\/\/www.itl.nist.gov\/iad\/mig\/publications\/ASRhistory\/index.html . Accessed 21 August 2011"},{"key":"167_CR40","doi-asserted-by":"crossref","first-page":"419","DOI":"10.1109\/3468.952716","volume":"31","author":"M Nicolescu","year":"2001","unstructured":"Nicolescu M, Mataric M (2001) Learning and interacting in human-robot domains. IEEE Trans Syst Man Cybern, Part A, Syst Hum, 31, 419\u2013430","journal-title":"IEEE Trans Syst Man Cybern, Part A, Syst Hum"},{"key":"167_CR41","volume-title":"Models and mechanisms of imitation and social learning in robots, humans and animals","author":"M Nicolescu","year":"2005","unstructured":"Nicolescu M, Mataric M (2005) Task learning through imitation and human-robot interaction. In: Dautenhahn K, Nehaniv C (eds) Models and mechanisms of imitation and social learning in robots, humans and animals. Cambridge University Press, Cambridge"},{"key":"167_CR42","unstructured":"The Phoenix parser user manual (2002) The Center for Spoken Language Research, University of Colorado, Boulder, CO, USA"},{"issue":"1\u20132","key":"167_CR43","doi-asserted-by":"crossref","first-page":"170","DOI":"10.1016\/j.artint.2005.04.007","volume":"167","author":"D Roy","year":"2005","unstructured":"Roy D (2005) Semiotic schemas: a framework for grounding language in action and perception. Artif Intell 167(1\u20132):170\u2013205","journal-title":"Artif Intell"},{"key":"167_CR44","volume-title":"The elements of grammar","author":"M Shertzer","year":"1986","unstructured":"Shertzer M (1986) The elements of grammar. Macmillan Pub, New York"},{"key":"167_CR45","first-page":"3327","volume-title":"Proceedings of the 2004 IEEE\/RSJ international conference on intelligent robots and systems (IROS 2004)","author":"J Suomela","year":"2004","unstructured":"Suomela J, Halme A (2004) Human robot interaction\u2014case WorkPartner. In: Proceedings of the 2004 IEEE\/RSJ international conference on intelligent robots and systems (IROS 2004), Sendai, Japan, 28 September\u20132 October 2004, pp 3327\u20133332"},{"key":"167_CR46","volume-title":"Proceedings of the interactive robot learning, robotics: science and systems (RSS) 2008 workshop","author":"A Thomaz","year":"2008","unstructured":"Thomaz A, Jacobsson H, Kruijff G, Skocaj D (2008) In: Proceedings of the interactive robot learning, robotics: science and systems (RSS) 2008 workshop, Zurich, Switzerland, June 28, 2008."},{"key":"167_CR47","first-page":"273","volume-title":"Proceedings of international conference on spoken language processing","author":"I Toptsis","year":"2004","unstructured":"Toptsis I, Li S, Wrede B, Fink G (2004) A multi-modal dialog system for a mobile robot. In: Proceedings of international conference on spoken language processing, Jeju, South Korea, 14\u201318 October 2004, pp 273\u2013276"},{"key":"167_CR48","doi-asserted-by":"crossref","unstructured":"Vedaldi A, Fulkerson B (2011) VLFeat: an open and portable library of computer vision algorithms. www.vlfeat.org","DOI":"10.1145\/1873951.1874249"},{"key":"167_CR49","unstructured":"Wikipedia (2011) Golf equipment, www.wikipedia.org . Accessed 28 February 2011"},{"key":"167_CR50","doi-asserted-by":"crossref","unstructured":"Wilske S, Kruijff G (2006) Service robots dealing with indirect speech acts. Language Technology Lab, German Research Center for Artificial Intelligence (DFKI), Saarbrucken, Germany","DOI":"10.1109\/IROS.2006.282259"},{"issue":"4","key":"167_CR51","doi-asserted-by":"crossref","first-page":"651","DOI":"10.1109\/TIE.2003.814767","volume":"50","author":"J Zhang","year":"2003","unstructured":"Zhang J, Knoll A (2003) A two-arm situated artificial communicator for human-robot cooperative assembly. IEEE Trans Ind Electron 50(4):651\u2013658","journal-title":"IEEE Trans Ind Electron"}],"container-title":["International Journal of Social Robotics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s12369-012-0167-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s12369-012-0167-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s12369-012-0167-6","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,29]],"date-time":"2022-01-29T23:05:20Z","timestamp":1643497520000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s12369-012-0167-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012,10,4]]},"references-count":51,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2013,1]]}},"alternative-id":["167"],"URL":"https:\/\/doi.org\/10.1007\/s12369-012-0167-6","relation":{},"ISSN":["1875-4791","1875-4805"],"issn-type":[{"value":"1875-4791","type":"print"},{"value":"1875-4805","type":"electronic"}],"subject":[],"published":{"date-parts":[[2012,10,4]]}}}