{"id":"https://openalex.org/W4393241288","doi":"https://doi.org/10.1109/lra.2024.3382477","title":"Improving the Performance of Learned Controllers in Behavior Trees Using Value Function Estimates at Switching Boundaries","display_name":"Improving the Performance of Learned Controllers in Behavior Trees Using Value Function Estimates at Switching Boundaries","publication_year":2024,"publication_date":"2024-03-27","ids":{"openalex":"https://openalex.org/W4393241288","doi":"https://doi.org/10.1109/lra.2024.3382477"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2024.3382477","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/lra.2024.3382477","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001360476","display_name":"Mart Karta\u0161ev","orcid":"https://orcid.org/0000-0001-8264-611X"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Mart Karta\u0161ev","raw_affiliation_strings":["RPL Lab, Royal Institute of Technology (KTH), Stockholm, Sweden"],"raw_orcid":"https://orcid.org/0000-0001-8264-611X","affiliations":[{"raw_affiliation_string":"RPL Lab, Royal Institute of Technology (KTH), Stockholm, Sweden","institution_ids":["https://openalex.org/I86987016"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070754732","display_name":"Petter \u00d6gren","orcid":"https://orcid.org/0000-0002-7714-928X"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Petter \u00d6gren","raw_affiliation_strings":["RPL Lab, Royal Institute of Technology (KTH), Stockholm, Sweden"],"raw_orcid":"https://orcid.org/0000-0002-7714-928X","affiliations":[{"raw_affiliation_string":"RPL Lab, Royal Institute of Technology (KTH), Stockholm, Sweden","institution_ids":["https://openalex.org/I86987016"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3055,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.60237652,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"9","issue":"5","first_page":"4647","last_page":"4654"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.89410001039505,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.89410001039505,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.8156999945640564,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10820","display_name":"Fuzzy Logic and Control Systems","score":0.8069999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.6500928997993469},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.6171616315841675},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.49005401134490967},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3783680200576782},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.34742555022239685},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.2515485882759094},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.25028595328330994},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.20993733406066895},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.08344033360481262}],"concepts":[{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.6500928997993469},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.6171616315841675},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.49005401134490967},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3783680200576782},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.34742555022239685},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2515485882759094},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.25028595328330994},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.20993733406066895},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.08344033360481262},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2024.3382477","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/lra.2024.3382477","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2007506196","https://openalex.org/W2109910161","https://openalex.org/W2121517924","https://openalex.org/W2132714442","https://openalex.org/W2261683202","https://openalex.org/W2465895732","https://openalex.org/W2521617762","https://openalex.org/W2736601468","https://openalex.org/W2784013554","https://openalex.org/W2889987506","https://openalex.org/W3024044737","https://openalex.org/W3082488836","https://openalex.org/W3145123113","https://openalex.org/W4200408523","https://openalex.org/W4214717370","https://openalex.org/W4285145746","https://openalex.org/W4389667323","https://openalex.org/W6719354989","https://openalex.org/W6741002519","https://openalex.org/W6753526802","https://openalex.org/W6758134627"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W1979597421","https://openalex.org/W2007980826","https://openalex.org/W2061531152","https://openalex.org/W3002753104","https://openalex.org/W2077600819","https://openalex.org/W2142036596","https://openalex.org/W2072657027","https://openalex.org/W2600246793","https://openalex.org/W4238204885"],"abstract_inverted_index":{"Behavior":[0],"trees":[1],"offer":[2],"a":[3,12,116,135],"modular":[4],"approach":[5],"to":[6,84,111,134,167],"developing":[7],"an":[8],"overall":[9,40,75,99,173],"controller":[10,76,100,138,174],"from":[11],"set":[13],"of":[14,48,63,97,108,115,118,121,154],"sub-controllers":[15,21,156],"that":[16,162],"solve":[17],"different":[18],"sub-problems.":[19],"These":[20],"can":[22,101],"be":[23,56,80,102,176],"created":[24],"using":[25],"various":[26],"methods,":[27],"such":[28],"as":[29],"classical":[30],"model-based":[31],"control":[32],"or":[33],"reinforcement":[34],"learning":[35],"(RL).":[36],"To":[37],"achieve":[38],"the":[39,46,49,61,64,74,85,95,98,113,119,122,140,155,172],"goal,":[41],"each":[42],"sub-controller":[43,54,117],"must":[44],"satisfy":[45],"preconditions":[47,62],"next":[50,65,123],"sub-controller.":[51],"Although":[52],"every":[53],"may":[55,77],"locally":[57],"optimal":[58,81,137],"in":[59],"achieving":[60],"one,":[66],"given":[67,179],"some":[68,153,169],"performance":[69,87,96],"metric":[70],"like":[71],"completion":[72],"time,":[73],"still":[78],"not":[79],"with":[82],"respect":[83],"same":[86],"metric.":[88],"In":[89],"this":[90,132,148,180],"paper,":[91],"we":[92,105,164],"demonstrate":[93],"how":[94],"improved":[103],"if":[104,163],"use":[106,168],"approximations":[107],"value":[109],"functions":[110],"inform":[112],"design":[114],"needs":[120],"controller.":[124],"We":[125],"also":[126,150],"show":[127],"how,":[128],"under":[129],"certain":[130],"assumptions,":[131],"leads":[133],"globally":[136,177],"when":[139,152],"process":[141],"is":[142],"executed":[143],"on":[144],"all":[145],"sub-controllers.":[146],"Finally,":[147],"result":[149],"holds":[151],"are":[157,165],"already":[158],"given.":[159],"This":[160],"means":[161],"constrained":[166],"existing":[170],"sub-controllers,":[171],"will":[175],"optimal,":[178],"constraint.":[181]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
