{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T05:57:15Z","timestamp":1775109435062,"version":"3.50.1"},"reference-count":28,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,5]]},"DOI":"10.1109\/icra.2018.8460937","type":"proceedings-article","created":{"date-parts":[[2018,9,21]],"date-time":"2018-09-21T22:28:03Z","timestamp":1537568883000},"page":"4430-4436","source":"Crossref","is-referenced-by-count":12,"title":["Learning to Parse Natural Language to Grounded Reward Functions with Weak Supervision"],"prefix":"10.1109","author":[{"given":"Edward C.","family":"Williams","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nakul","family":"Gopalan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mine","family":"Rhee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Stefanie","family":"Tellex","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","article-title":"An object-oriented representation for efficient reinforcement learning","author":"diuk","year":"2008","journal-title":"International Conference on Machine Learning"},{"key":"ref11","first-page":"480","article-title":"Planning with abstract markov decision processes","author":"nakul","year":"2017","journal-title":"Proceedings of the Twenty-Seventh International Conference on Automated Planning and Scheduling"},{"key":"ref12","article-title":"From language to programs: Bridging reinforcement learning and maximum marginal likelihood","author":"guu","year":"2017","journal-title":"CoRR abs\/1704 07926"},{"key":"ref13","article-title":"Stefanie Tellex, and Nicholas Roy. A natural language planner interface for mobile manipulators","author":"howard","year":"2014","journal-title":"IEEE International Conference on Robotics and Automation"},{"key":"ref14","author":"janner","year":"2017","journal-title":"Representation learning for grounded spatial reasoning"},{"key":"ref15","article-title":"Weakly supervised training of semantic parsers","author":"krishnamurthy","year":"2012","journal-title":"Proceedings of the Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning"},{"key":"ref16","first-page":"1512","article-title":"Lexical generalization in ccg grammar induction for semantic parsing","author":"kwiatkowski","year":"2011","journal-title":"Proceedings of the Conference on Empirical Methods in Natural Language Processing"},{"key":"ref17","author":"macglashan","year":"2014","journal-title":"Brown-UMBC Reinforcement Learning and Planning (BURLAP)-Project"},{"key":"ref18","article-title":"Grounding english commands to reward functions","author":"macglashan","year":"2015","journal-title":"Robotics Science and Systems"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1106"},{"key":"ref28","article-title":"Online learning of relaxed ccg grammars for parsing to logical form","author":"zettlemoyer","year":"2007","journal-title":"Proc Joint Conf Empirical Methods in Natural Language Processing and Computational Natural Language Learning"},{"key":"ref4","doi-asserted-by":"crossref","DOI":"10.1162\/tacl_a_00209","article-title":"Weakly supervized learning of semantic parsers for mapping instructions to actions","author":"artzi","year":"2013","journal-title":"Annual Meeting of the Association for Computational Linguistics"},{"key":"ref27","article-title":"Learning to map sentences to logical form: Structured classification with probabilistic categorial grammars","author":"zettlemoyer","year":"2005","journal-title":"Proceedings of the Conference on Uncertainty in Artificial Intelligence"},{"key":"ref3","article-title":"Bootstrapping semantic parsers from conversations","author":"artzi","year":"2011","journal-title":"Proceedings of the Conference on Empirical Methods in Natural Language Processing"},{"key":"ref6","article-title":"and Stefanie Tellex. Accurately and efficiently interpreting human-robot instructions of varying granularities","author":"dilip","year":"2017","journal-title":"Proceedings of Robotics Science and Systems XII"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1134"},{"key":"ref8","author":"carpenter","year":"1997","journal-title":"Type-Logical Semantics"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1512\/iumj.1957.6.56038"},{"key":"ref2","author":"artzi","year":"2016","journal-title":"Cornell SPF Cornell Semantic Parsing Framework"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1162\/coli.2007.33.4.493"},{"key":"ref1","author":"anderson","year":"2013","journal-title":"The jscheme language and implementation"},{"key":"ref20","first-page":"663","article-title":"Algorithms for inverse reinforcement learning","author":"ng","year":"2000","journal-title":"ICML Machine Learning Proceedings of the Seventh International Conference"},{"key":"ref22","author":"quigley","year":"0","journal-title":"ROS An Open-source Robot Operating System"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/SFCS.1977.32"},{"key":"ref24","doi-asserted-by":"crossref","DOI":"10.7551\/mitpress\/6591.001.0001","author":"steedman","year":"2000","journal-title":"The Syntactic Process"},{"key":"ref23","article-title":"Unsupervised perceptual rewards for imitation learning","author":"sermanet","year":"2016","journal-title":"CoRR abs\/1612 06699"},{"key":"ref26","article-title":"Learning to parse natural language to grounded reward functions with weak supervision","author":"williams","year":"2017","journal-title":"AAAI Fall Symposium on Natural Communication for Human-Robot Collaboration"},{"key":"ref25","article-title":"Understanding natural language commands for robotic navigation and mobile manipulation","author":"stefanie","year":"2011","journal-title":"AAAI Conference on Artificial Intelligence"}],"event":{"name":"2018 IEEE International Conference on Robotics and Automation (ICRA)","location":"Brisbane, QLD","start":{"date-parts":[[2018,5,21]]},"end":{"date-parts":[[2018,5,25]]}},"container-title":["2018 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8449910\/8460178\/08460937.pdf?arnumber=8460937","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,8]],"date-time":"2025-07-08T18:05:56Z","timestamp":1751997956000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8460937\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,5]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/icra.2018.8460937","relation":{},"subject":[],"published":{"date-parts":[[2018,5]]}}}