{"id":"https://openalex.org/W2913878882","doi":"https://doi.org/10.1109/lra.2019.2903259","title":"Bi-Directional Value Learning for Risk-Aware Planning Under Uncertainty","display_name":"Bi-Directional Value Learning for Risk-Aware Planning Under Uncertainty","publication_year":2019,"publication_date":"2019-03-06","ids":{"openalex":"https://openalex.org/W2913878882","doi":"https://doi.org/10.1109/lra.2019.2903259","mag":"2913878882"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2019.2903259","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2019.2903259","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1902.05698","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019692184","display_name":"Sung-Kyun Kim","orcid":"https://orcid.org/0000-0003-2460-1153"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sung-Kyun Kim","raw_affiliation_strings":["Robotics Institute, Carnegie Mellon University, Pittsburgh, PA, USA","Robotics Institute, Carnegie Mellon University, Pittsburgh, Pa, USA"],"affiliations":[{"raw_affiliation_string":"Robotics Institute, Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Robotics Institute, Carnegie Mellon University, Pittsburgh, Pa, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113893653","display_name":"Rohan Thakker","orcid":null},"institutions":[{"id":"https://openalex.org/I1334627681","display_name":"Jet Propulsion Laboratory","ror":"https://ror.org/027k65916","country_code":"US","type":"facility","lineage":["https://openalex.org/I122411786","https://openalex.org/I1334627681","https://openalex.org/I4210124779"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rohan Thakker","raw_affiliation_strings":["Jet Propulsion Laboratory, Pasadena, CA, USA","Jet Propulsion Laboratory Pasadena, CA, USA"],"affiliations":[{"raw_affiliation_string":"Jet Propulsion Laboratory, Pasadena, CA, USA","institution_ids":["https://openalex.org/I1334627681"]},{"raw_affiliation_string":"Jet Propulsion Laboratory Pasadena, CA, USA","institution_ids":["https://openalex.org/I1334627681"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042186658","display_name":"Ali\u2010akbar Agha\u2010mohammadi","orcid":"https://orcid.org/0000-0001-5509-1841"},"institutions":[{"id":"https://openalex.org/I1334627681","display_name":"Jet Propulsion Laboratory","ror":"https://ror.org/027k65916","country_code":"US","type":"facility","lineage":["https://openalex.org/I122411786","https://openalex.org/I1334627681","https://openalex.org/I4210124779"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ali-Akbar Agha-Mohammadi","raw_affiliation_strings":["Jet Propulsion Laboratory, Pasadena, CA, USA","Jet Propulsion Laboratory Pasadena, CA, USA"],"affiliations":[{"raw_affiliation_string":"Jet Propulsion Laboratory, Pasadena, CA, USA","institution_ids":["https://openalex.org/I1334627681"]},{"raw_affiliation_string":"Jet Propulsion Laboratory Pasadena, CA, USA","institution_ids":["https://openalex.org/I1334627681"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5019692184"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":1.5402,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.86986482,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"4","issue":"3","first_page":"2493","last_page":"2500"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9399999976158142,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9333000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.8964501023292542},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.7507575154304504},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.7441471815109253},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7300508618354797},{"id":"https://openalex.org/keywords/bellman-equation","display_name":"Bellman equation","score":0.6508626341819763},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6437521576881409},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.5913248062133789},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5588369965553284},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5076128244400024},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.4741342067718506},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4664648771286011},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4498039782047272},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.4158977270126343},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.4087814390659332},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34136033058166504},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.21990862488746643},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1621711552143097},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12568175792694092}],"concepts":[{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.8964501023292542},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.7507575154304504},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.7441471815109253},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7300508618354797},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.6508626341819763},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6437521576881409},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.5913248062133789},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5588369965553284},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5076128244400024},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.4741342067718506},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4664648771286011},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4498039782047272},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.4158977270126343},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.4087814390659332},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34136033058166504},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.21990862488746643},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1621711552143097},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12568175792694092},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/lra.2019.2903259","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2019.2903259","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"mag:2913878882","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1902.05698","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null}],"best_oa_location":{"id":"mag:2913878882","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1902.05698","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7200000286102295,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1557517019","https://openalex.org/W1997840820","https://openalex.org/W2001009060","https://openalex.org/W2053833381","https://openalex.org/W2068945175","https://openalex.org/W2099430963","https://openalex.org/W2128990851","https://openalex.org/W2168359464","https://openalex.org/W2168992242","https://openalex.org/W2339179100","https://openalex.org/W2473222174","https://openalex.org/W2769509614","https://openalex.org/W2781538372","https://openalex.org/W2806880272","https://openalex.org/W2897946272","https://openalex.org/W2911695803","https://openalex.org/W3148740559","https://openalex.org/W6631864160","https://openalex.org/W6678541622","https://openalex.org/W6684973485","https://openalex.org/W6745500190","https://openalex.org/W6929267929"],"related_works":["https://openalex.org/W3104551220","https://openalex.org/W2964126058","https://openalex.org/W2967385712","https://openalex.org/W2795609531","https://openalex.org/W2783797945","https://openalex.org/W2903683378","https://openalex.org/W3111597472","https://openalex.org/W2110322955","https://openalex.org/W78785118","https://openalex.org/W85990829","https://openalex.org/W2883906040","https://openalex.org/W2783782435","https://openalex.org/W2561666900","https://openalex.org/W2462780152","https://openalex.org/W3042298952","https://openalex.org/W2911281373","https://openalex.org/W2963645163","https://openalex.org/W2965787007","https://openalex.org/W2909922236"],"abstract_inverted_index":{"Decision-making":[0],"under":[1],"uncertainty":[2],"is":[3,49,75],"a":[4,21,32,39,68,81,93,116],"crucial":[5],"ability":[6],"for":[7],"autonomous":[8],"systems.":[9],"In":[10,42],"its":[11],"most":[12],"general":[13],"form,":[14],"this":[15],"problem":[16],"can":[17,34],"be":[18,35],"formulated":[19],"as":[20,38],"partially":[22,43],"observable":[23,44],"Markov":[24],"decision":[25],"process":[26,91,103],"(POMDP).":[27],"The":[28,136],"solution":[29],"policy":[30,110],"of":[31,55,118,132,141,149],"POMDP":[33],"implicitly":[36],"encoded":[37],"value":[40,47,73,89,101],"function.":[41],"settings,":[45],"the":[46,56,72,109,127,133,139,142,150],"function":[48,74],"typically":[50],"learned":[51,76],"via":[52,80,111],"forward":[53,100,112],"simulation":[54],"system":[57],"evolution.":[58],"Focusing":[59],"on":[60],"accurate":[61],"and":[62,95,107,120,130],"long-range":[63,94,147],"risk":[64],"assessment,":[65],"we":[66],"propose":[67],"novel":[69],"method,":[70],"where":[71],"in":[77,84,145],"different":[78],"phases":[79],"bi-directional":[82],"search":[83],"belief":[85],"space.":[86],"A":[87,99],"backward":[88],"learning":[90,102],"provides":[92],"risk-aware":[96],"base":[97],"policy.":[98],"ensures":[104],"local":[105],"optimality":[106,131],"updates":[108],"simulations.":[113],"We":[114],"consider":[115],"class":[117],"scalable":[119],"continuous-space":[121],"rover":[122],"navigation":[123],"problems":[124,155],"to":[125],"assess":[126],"safety,":[128],"scalability,":[129],"proposed":[134,143],"algorithm.":[135],"results":[137],"demonstrate":[138],"capabilities":[140],"algorithm":[144],"evaluating":[146],"risk/safety":[148],"planner":[151],"while":[152],"addressing":[153],"continuous":[154],"with":[156],"long":[157],"planning":[158],"horizons.":[159]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
