{"id":"https://openalex.org/W2903849022","doi":"https://doi.org/10.1017/s0269888918000279","title":"Towards life-long adaptive agents: using metareasoning for combining knowledge-based planning with situated learning","display_name":"Towards life-long adaptive agents: using metareasoning for combining knowledge-based planning with situated learning","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2903849022","doi":"https://doi.org/10.1017/s0269888918000279","mag":"2903849022"},"language":"en","primary_location":{"id":"doi:10.1017/s0269888918000279","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s0269888918000279","pdf_url":null,"source":{"id":"https://openalex.org/S137506714","display_name":"The Knowledge Engineering Review","issn_l":"0269-8889","issn":["0269-8889","1469-8005"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Knowledge Engineering Review","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041724598","display_name":"Priyam Parashar","orcid":"https://orcid.org/0000-0003-2154-5889"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]},{"id":"https://openalex.org/I4210128771","display_name":"Contextual Change (United States)","ror":"https://ror.org/03bskcm82","country_code":"US","type":"company","lineage":["https://openalex.org/I4210128771"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Priyam Parashar","raw_affiliation_strings":["Contextual Robotics Institute, UC San Diego, La Jolla, CA 92093, USA; e-mail:","e-mail:","Contextual Robotics Institute, UC San Diego, La Jolla, CA 92093, USA"],"raw_orcid":"https://orcid.org/0000-0003-2154-5889","affiliations":[{"raw_affiliation_string":"Contextual Robotics Institute, UC San Diego, La Jolla, CA 92093, USA; e-mail:","institution_ids":["https://openalex.org/I4210128771"]},{"raw_affiliation_string":"e-mail:","institution_ids":[]},{"raw_affiliation_string":"Contextual Robotics Institute, UC San Diego, La Jolla, CA 92093, USA","institution_ids":["https://openalex.org/I4210128771","https://openalex.org/I36258959"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007028896","display_name":"Ashok K. Goel","orcid":null},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ashok K. Goel","raw_affiliation_strings":["Design & Intelligence Laboratory, Georgia Institute of Technology, Atlanta, GA 30308, USA; e-mail:","Design & Intelligence Laboratory, Georgia Institute of Technology, Atlanta, GA 30308, USA","e-mail:"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Design & Intelligence Laboratory, Georgia Institute of Technology, Atlanta, GA 30308, USA; e-mail:","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"Design & Intelligence Laboratory, Georgia Institute of Technology, Atlanta, GA 30308, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"e-mail:","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070629168","display_name":"Bradley Sheneman","orcid":null},"institutions":[{"id":"https://openalex.org/I2803034721","display_name":"American Indian Center","ror":"https://ror.org/001040h60","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I2803034721"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bradley Sheneman","raw_affiliation_strings":["American Family Insurance, Chicago, IL; e-mail:","American Family Insurance, Chicago, IL","e-mail:"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"American Family Insurance, Chicago, IL; e-mail:","institution_ids":["https://openalex.org/I2803034721"]},{"raw_affiliation_string":"American Family Insurance, Chicago, IL","institution_ids":[]},{"raw_affiliation_string":"e-mail:","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066237365","display_name":"Henrik I. Christensen","orcid":"https://orcid.org/0000-0002-7465-7502"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]},{"id":"https://openalex.org/I4210128771","display_name":"Contextual Change (United States)","ror":"https://ror.org/03bskcm82","country_code":"US","type":"company","lineage":["https://openalex.org/I4210128771"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Henrik I. Christensen","raw_affiliation_strings":["Contextual Robotics Institute, UC San Diego, La Jolla, CA 92093, USA; e-mail:","e-mail:","Contextual Robotics Institute, UC San Diego, La Jolla, CA 92093, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Contextual Robotics Institute, UC San Diego, La Jolla, CA 92093, USA; e-mail:","institution_ids":["https://openalex.org/I4210128771"]},{"raw_affiliation_string":"e-mail:","institution_ids":[]},{"raw_affiliation_string":"Contextual Robotics Institute, UC San Diego, La Jolla, CA 92093, USA","institution_ids":["https://openalex.org/I4210128771","https://openalex.org/I36258959"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5041724598"],"corresponding_institution_ids":["https://openalex.org/I36258959","https://openalex.org/I4210128771"],"apc_list":null,"apc_paid":null,"fwci":1.0154,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.83274185,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"33","issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/situated","display_name":"Situated","score":0.9343909025192261},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7772723436355591},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7447638511657715},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6592211723327637},{"id":"https://openalex.org/keywords/semantic-reasoner","display_name":"Semantic reasoner","score":0.6041681170463562},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.569832980632782},{"id":"https://openalex.org/keywords/plan","display_name":"Plan (archaeology)","score":0.47670692205429077},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.47186511754989624},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4705560505390167},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.42452430725097656},{"id":"https://openalex.org/keywords/situated-learning","display_name":"Situated learning","score":0.42137232422828674},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3746778666973114},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3554152250289917},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.08917608857154846},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07794195413589478}],"concepts":[{"id":"https://openalex.org/C132829578","wikidata":"https://www.wikidata.org/wiki/Q581151","display_name":"Situated","level":2,"score":0.9343909025192261},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7772723436355591},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7447638511657715},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6592211723327637},{"id":"https://openalex.org/C9616225","wikidata":"https://www.wikidata.org/wiki/Q3929429","display_name":"Semantic reasoner","level":2,"score":0.6041681170463562},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.569832980632782},{"id":"https://openalex.org/C2776505523","wikidata":"https://www.wikidata.org/wiki/Q4785468","display_name":"Plan (archaeology)","level":2,"score":0.47670692205429077},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.47186511754989624},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4705560505390167},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.42452430725097656},{"id":"https://openalex.org/C200380349","wikidata":"https://www.wikidata.org/wiki/Q2290699","display_name":"Situated learning","level":2,"score":0.42137232422828674},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3746778666973114},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3554152250289917},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.08917608857154846},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07794195413589478},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1017/s0269888918000279","is_oa":false,"landing_page_url":"https://doi.org/10.1017/s0269888918000279","pdf_url":null,"source":{"id":"https://openalex.org/S137506714","display_name":"The Knowledge Engineering Review","issn_l":"0269-8889","issn":["0269-8889","1469-8005"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311721","host_organization_name":"Cambridge University Press","host_organization_lineage":["https://openalex.org/P4310311721","https://openalex.org/P4310311702"],"host_organization_lineage_names":["Cambridge University Press","University of Cambridge"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Knowledge Engineering Review","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.550000011920929,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W9419878","https://openalex.org/W32403112","https://openalex.org/W41554520","https://openalex.org/W81346543","https://openalex.org/W124680240","https://openalex.org/W602493290","https://openalex.org/W1487906362","https://openalex.org/W1497390930","https://openalex.org/W1500151553","https://openalex.org/W1505738976","https://openalex.org/W1509999309","https://openalex.org/W1540659332","https://openalex.org/W1563716826","https://openalex.org/W1591434728","https://openalex.org/W1595732857","https://openalex.org/W1749317873","https://openalex.org/W1774329048","https://openalex.org/W1777239053","https://openalex.org/W1966527069","https://openalex.org/W1968813584","https://openalex.org/W1986014385","https://openalex.org/W2025460523","https://openalex.org/W2032680755","https://openalex.org/W2081944499","https://openalex.org/W2100988719","https://openalex.org/W2111316871","https://openalex.org/W2116287365","https://openalex.org/W2118957105","https://openalex.org/W2121863487","https://openalex.org/W2126872172","https://openalex.org/W2128103053","https://openalex.org/W2130039570","https://openalex.org/W2139306379","https://openalex.org/W2142600926","https://openalex.org/W2146934839","https://openalex.org/W2147357263","https://openalex.org/W2150500908","https://openalex.org/W2152475379","https://openalex.org/W2165008406","https://openalex.org/W2167340365","https://openalex.org/W2250340166","https://openalex.org/W2257771522","https://openalex.org/W2263969997","https://openalex.org/W2308567354","https://openalex.org/W2336416123","https://openalex.org/W2477981996","https://openalex.org/W2577801266","https://openalex.org/W2578350735","https://openalex.org/W2618829310","https://openalex.org/W4210992782","https://openalex.org/W4291280180","https://openalex.org/W4301306983","https://openalex.org/W6630573394","https://openalex.org/W6632290893","https://openalex.org/W6638116338","https://openalex.org/W6675301218"],"related_works":["https://openalex.org/W2063544616","https://openalex.org/W4245961435","https://openalex.org/W2005493456","https://openalex.org/W2109104809","https://openalex.org/W3017673946","https://openalex.org/W2272258203","https://openalex.org/W2357503665","https://openalex.org/W2145415711","https://openalex.org/W2043664783","https://openalex.org/W2373279890"],"abstract_inverted_index":{"Abstract":[0],"We":[1,35,81,150,172],"consider":[2],"task":[3,47,143],"planning":[4,48,74],"for":[5,65,89,110,131,147,170,195],"long-living":[6],"intelligent":[7],"agents":[8],"situated":[9,50,67],"in":[10,96,154],"dynamic":[11],"environments.":[12],"Specifically,":[13],"we":[14],"address":[15],"the":[16,22,26,66,72,78,90,97,102,114,117,121,132,135,141,155,162,165,168,192],"problem":[17],"of":[18,21,28,164,189],"incomplete":[19],"knowledge":[20,75],"world":[23,59,99],"due":[24,100],"to":[25,44,77,93,101,126,140,160],"addition":[27],"new":[29,79],"objects":[30],"with":[31],"unknown":[32],"action":[33],"models.":[34],"propose":[36],"a":[37,56,86,107],"multilayered":[38],"agent":[39],"architecture":[40,166],"that":[41],"uses":[42,123],"meta-reasoning":[43],"control":[45],"hierarchical":[46,142],"and":[49,63,70,105,116,129,134,157,167,183],"learning,":[51],"monitor":[52],"expectations":[53,92,115],"generated":[54],"by":[55],"plan":[57,145],"against":[58,176],"observations,":[60],"forms":[61],"goals":[62,128],"rewards":[64,130],"reinforcement":[68,179],"learner,":[69,133],"learns":[71],"missing":[73],"relevant":[76],"objects.":[80],"use":[82],"occupancy":[83],"grids":[84],"as":[85],"low-level":[87],"representation":[88],"high-level":[91],"capture":[94],"changes":[95],"physical":[98],"additional":[103],"objects,":[104],"provide":[106],"similarity":[108],"method":[109],"detecting":[111],"discrepancies":[112,125],"between":[113],"observations":[118],"at":[119],"run-time;":[120],"meta-reasoner":[122],"these":[124],"formulate":[127],"learned":[136],"policies":[137],"are":[138],"added":[139],"network":[144],"library":[146],"future":[148],"re-use.":[149],"describe":[151],"our":[152,174,184],"experiments":[153],"Minecraft":[156],"Gazebo":[158],"microworlds":[159],"demonstrate":[161],"efficacy":[163],"technique":[169],"learning.":[171],"test":[173],"approach":[175],"an":[177],"ablated":[178],"learning":[180,193],"(RL)":[181],"version,":[182],"results":[185],"indicate":[186],"this":[187],"form":[188],"expectation":[190],"enhances":[191],"curve":[194],"RL":[196],"while":[197],"being":[198],"more":[199],"generic":[200],"than":[201],"propositional":[202],"representations.":[203]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2026-01-08T20:05:33.558190","created_date":"2025-10-10T00:00:00"}
