{"id":"https://openalex.org/W2890809352","doi":"https://doi.org/10.1109/icra.2018.8460937","title":"Learning to Parse Natural Language to Grounded Reward Functions with Weak Supervision","display_name":"Learning to Parse Natural Language to Grounded Reward Functions with Weak Supervision","publication_year":2018,"publication_date":"2018-05-01","ids":{"openalex":"https://openalex.org/W2890809352","doi":"https://doi.org/10.1109/icra.2018.8460937","mag":"2890809352"},"language":"en","primary_location":{"id":"doi:10.1109/icra.2018.8460937","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra.2018.8460937","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110575233","display_name":"Edward Williams","orcid":"https://orcid.org/0000-0002-5812-2831"},"institutions":[{"id":"https://openalex.org/I27804330","display_name":"Brown University","ror":"https://ror.org/05gq02987","country_code":"US","type":"education","lineage":["https://openalex.org/I27804330"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Edward C. Williams","raw_affiliation_strings":["Department of Computer Science, Brown University, Providence, RI, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Brown University, Providence, RI, USA","institution_ids":["https://openalex.org/I27804330"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089421543","display_name":"Nakul Gopalan","orcid":"https://orcid.org/0000-0002-6947-5501"},"institutions":[{"id":"https://openalex.org/I27804330","display_name":"Brown University","ror":"https://ror.org/05gq02987","country_code":"US","type":"education","lineage":["https://openalex.org/I27804330"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nakul Gopalan","raw_affiliation_strings":["Department of Computer Science, Brown University, Providence, RI, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Brown University, Providence, RI, USA","institution_ids":["https://openalex.org/I27804330"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058722672","display_name":"Mine Rhee","orcid":null},"institutions":[{"id":"https://openalex.org/I27804330","display_name":"Brown University","ror":"https://ror.org/05gq02987","country_code":"US","type":"education","lineage":["https://openalex.org/I27804330"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mine Rhee","raw_affiliation_strings":["Department of Computer Science, Brown University, Providence, RI, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Brown University, Providence, RI, USA","institution_ids":["https://openalex.org/I27804330"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059273574","display_name":"Stefanie Tellex","orcid":"https://orcid.org/0000-0002-2905-4075"},"institutions":[{"id":"https://openalex.org/I27804330","display_name":"Brown University","ror":"https://ror.org/05gq02987","country_code":"US","type":"education","lineage":["https://openalex.org/I27804330"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Stefanie Tellex","raw_affiliation_strings":["Department of Computer Science, Brown University, Providence, RI, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Brown University, Providence, RI, USA","institution_ids":["https://openalex.org/I27804330"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":5.0687,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.96224827,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"4430","last_page":"4436"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.849445104598999},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7671708464622498},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.69759202003479},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6952861547470093},{"id":"https://openalex.org/keywords/combinatory-categorial-grammar","display_name":"Combinatory categorial grammar","score":0.6103706955909729},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.5023698806762695},{"id":"https://openalex.org/keywords/lexicon","display_name":"Lexicon","score":0.487533301115036},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.42199790477752686},{"id":"https://openalex.org/keywords/grammar","display_name":"Grammar","score":0.41976478695869446},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3787999153137207},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.37055253982543945},{"id":"https://openalex.org/keywords/context-free-grammar","display_name":"Context-free grammar","score":0.16109907627105713}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.849445104598999},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7671708464622498},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.69759202003479},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6952861547470093},{"id":"https://openalex.org/C199837984","wikidata":"https://www.wikidata.org/wiki/Q730974","display_name":"Combinatory categorial grammar","level":5,"score":0.6103706955909729},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.5023698806762695},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.487533301115036},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.42199790477752686},{"id":"https://openalex.org/C26022165","wikidata":"https://www.wikidata.org/wiki/Q8091","display_name":"Grammar","level":2,"score":0.41976478695869446},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3787999153137207},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.37055253982543945},{"id":"https://openalex.org/C97212296","wikidata":"https://www.wikidata.org/wiki/Q338047","display_name":"Context-free grammar","level":3,"score":0.16109907627105713},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C134083981","wikidata":"https://www.wikidata.org/wiki/Q1754022","display_name":"Tree-adjoining grammar","level":4,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra.2018.8460937","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra.2018.8460937","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W147290778","https://openalex.org/W1496189301","https://openalex.org/W1567277581","https://openalex.org/W1969245183","https://openalex.org/W2006406454","https://openalex.org/W2007820193","https://openalex.org/W2023808162","https://openalex.org/W2061562262","https://openalex.org/W2076337359","https://openalex.org/W2096968458","https://openalex.org/W2101355568","https://openalex.org/W2111742432","https://openalex.org/W2137607685","https://openalex.org/W2189089430","https://openalex.org/W2227250678","https://openalex.org/W2236233024","https://openalex.org/W2277684984","https://openalex.org/W2531080099","https://openalex.org/W2583137229","https://openalex.org/W2734458248","https://openalex.org/W2758731390","https://openalex.org/W2890809352","https://openalex.org/W2901136733","https://openalex.org/W2963367210","https://openalex.org/W2964224049","https://openalex.org/W4240963309","https://openalex.org/W4293584348","https://openalex.org/W6605926748","https://openalex.org/W6629631241","https://openalex.org/W6674880660","https://openalex.org/W6675130473","https://openalex.org/W6676848125","https://openalex.org/W6689626956","https://openalex.org/W6694951568","https://openalex.org/W6732465633","https://openalex.org/W6737522998","https://openalex.org/W6754663516"],"related_works":["https://openalex.org/W2140536630","https://openalex.org/W3195005284","https://openalex.org/W2391730868","https://openalex.org/W2759814045","https://openalex.org/W2108227097","https://openalex.org/W2118055728","https://openalex.org/W2736760277","https://openalex.org/W2293063786","https://openalex.org/W2911292476","https://openalex.org/W1586222814"],"abstract_inverted_index":{"In":[0],"order":[1],"to":[2,12,40,49,132,203,227],"intuitively":[3],"and":[4,69,102,110,120,160],"efficiently":[5,42],"collaborate":[6],"with":[7,163,198],"humans,":[8],"robots":[9,39],"must":[10],"learn":[11,54,98],"complete":[13],"tasks":[14,152],"specified":[15,28],"using":[16,29,115,212],"natural":[17,21],"language.":[18],"We":[19,123,139,215],"represent":[20],"language":[22,36],"instructions":[23],"as":[24,35],"goal-state":[25],"reward":[26,33,51,88],"functions":[27,34],"lambda":[30],"calculus.":[31],"Using":[32],"representations":[37],"allows":[38],"plan":[41],"in":[43,178],"stochastic":[44],"environments.":[45],"To":[46,97],"map":[47],"sentences":[48],"such":[50],"functions,":[52,89],"we":[53,105,194],"a":[55,76,85,99,147,182,209],"weighted":[56],"linear":[57],"Combinatory":[58],"Categorial":[59],"Grammar":[60],"(CCG)":[61],"semantic":[62],"parser.":[63],"The":[64],"parser,":[65],"including":[66],"both":[67],"parameters":[68],"the":[70,116,127,134,205],"CCG":[71,100],"lexicon,":[72],"is":[73],"learned":[74,220],"from":[75,221],"validation":[77],"procedure":[78],"that":[79,184,217],"does":[80],"not":[81,229],"require":[82],"execution":[83],"of":[84,118,136,144,150,155,174,176,207],"planner,":[86],"annotating":[87],"or":[90],"labeling":[91],"parse":[92,103],"trees,":[93],"unlike":[94],"prior":[95],"approaches.":[96],"lexicon":[101],"weights,":[104],"use":[106],"coarse":[107],"lexical":[108],"generation":[109],"validation-driven":[111],"perceptron":[112],"weight":[113],"updates":[114],"approach":[117,170],"Artzi":[119],"Zettlemoyer":[121],"[4].":[122],"present":[124],"results":[125],"on":[126,146],"Cleanup":[128],"World":[129],"domain":[130],"[18]":[131],"demonstrate":[133],"potential":[135],"our":[137,213],"approach.":[138],"report":[140],"an":[141,172,196],"F1":[142],"score":[143],"0.82":[145],"collected":[148],"corpus":[149],"23":[151],"containing":[153],"combinations":[154],"nested":[156],"referential":[157],"expressions,":[158],"comparators":[159],"object":[161],"properties":[162],"2037":[164],"corresponding":[165],"sentences.":[166],"Our":[167],"goal-condition":[168],"learning":[169],"enables":[171],"improvement":[173],"orders":[175],"magnitude":[177],"computation":[179],"time":[180],"over":[181],"baseline":[183],"performs":[185],"planning":[186],"during":[187,231],"learning,":[188],"while":[189],"achieving":[190],"comparable":[191],"results.":[192],"Further,":[193],"conduct":[195],"experiment":[197],"just":[199],"6":[200],"labeled":[201],"demonstrations":[202],"show":[204,216],"ease":[206],"teaching":[208],"robot":[210],"behaviors":[211],"method.":[214],"parsing":[218],"models":[219],"small":[222],"data":[223],"sets":[224],"can":[225],"generalize":[226],"commands":[228],"seen":[230],"training.":[232]},"counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":12},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
