{"id":"https://openalex.org/W3206157676","doi":"https://doi.org/10.1109/icra48506.2021.9561853","title":"Using Reinforcement Learning to Create Control Barrier Functions for Explicit Risk Mitigation in Adversarial Environments","display_name":"Using Reinforcement Learning to Create Control Barrier Functions for Explicit Risk Mitigation in Adversarial Environments","publication_year":2021,"publication_date":"2021-05-30","ids":{"openalex":"https://openalex.org/W3206157676","doi":"https://doi.org/10.1109/icra48506.2021.9561853","mag":"3206157676"},"language":"en","primary_location":{"id":"doi:10.1109/icra48506.2021.9561853","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra48506.2021.9561853","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:kth:diva-293491","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012980304","display_name":"Edvards Scukins","orcid":"https://orcid.org/0000-0003-4662-441X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Edvards Scukins","raw_affiliation_strings":["SAAB,Aeronautics Division,Link&#x00F6;ping,Sweden,SE-582 54","ping, Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"SAAB,Aeronautics Division,Link&#x00F6;ping,Sweden,SE-582 54","institution_ids":[]},{"raw_affiliation_string":"ping, Sweden","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070754732","display_name":"Petter \u00d6gren","orcid":"https://orcid.org/0000-0002-7714-928X"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Petter Ogren","raw_affiliation_strings":["Royal Institute of Technology (KTH),Robotics, Perception and Learning Lab., School of Electrical Engineering and Computer Science,Stockholm,Sweden,SE-100 44"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Royal Institute of Technology (KTH),Robotics, Perception and Learning Lab., School of Electrical Engineering and Computer Science,Stockholm,Sweden,SE-100 44","institution_ids":["https://openalex.org/I86987016"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":8.7889,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.97175227,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"10734","last_page":"10740"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12158","display_name":"Guidance and Control Systems","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12158","display_name":"Guidance and Control Systems","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9807999730110168,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13371","display_name":"Military Defense Systems Analysis","score":0.9674000144004822,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7511903643608093},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6706158518791199},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.6302071809768677},{"id":"https://openalex.org/keywords/missile","display_name":"Missile","score":0.6000162363052368},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5598888993263245},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5556753873825073},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.5375610589981079},{"id":"https://openalex.org/keywords/adversary","display_name":"Adversary","score":0.5168519616127014},{"id":"https://openalex.org/keywords/risk-analysis","display_name":"Risk analysis (engineering)","score":0.5112905502319336},{"id":"https://openalex.org/keywords/risk-management","display_name":"Risk management","score":0.4475194811820984},{"id":"https://openalex.org/keywords/command-and-control","display_name":"Command and control","score":0.44360607862472534},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.324134886264801},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.2764110267162323},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25499075651168823},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.19295784831047058}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7511903643608093},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6706158518791199},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.6302071809768677},{"id":"https://openalex.org/C2778857364","wikidata":"https://www.wikidata.org/wiki/Q974850","display_name":"Missile","level":2,"score":0.6000162363052368},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5598888993263245},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5556753873825073},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.5375610589981079},{"id":"https://openalex.org/C41065033","wikidata":"https://www.wikidata.org/wiki/Q2825412","display_name":"Adversary","level":2,"score":0.5168519616127014},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.5112905502319336},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.4475194811820984},{"id":"https://openalex.org/C506615639","wikidata":"https://www.wikidata.org/wiki/Q21662260","display_name":"Command and control","level":2,"score":0.44360607862472534},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.324134886264801},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.2764110267162323},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25499075651168823},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.19295784831047058},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icra48506.2021.9561853","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra48506.2021.9561853","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},{"id":"pmh:oai:DiVA.org:kth-293491","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:kth:diva-293491","pdf_url":null,"source":{"id":"https://openalex.org/S4306401559","display_name":"KTH Publication Database DiVA (KTH Royal Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:DiVA.org:kth-293491","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:kth:diva-293491","pdf_url":null,"source":{"id":"https://openalex.org/S4306401559","display_name":"KTH Publication Database DiVA (KTH Royal Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321030","display_name":"VINNOVA","ror":"https://ror.org/01kd5m353"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1985204762","https://openalex.org/W1987725948","https://openalex.org/W2062122188","https://openalex.org/W2101075098","https://openalex.org/W2145339207","https://openalex.org/W2173248099","https://openalex.org/W2222789563","https://openalex.org/W2534060593","https://openalex.org/W2560504659","https://openalex.org/W2586067474","https://openalex.org/W2594829461","https://openalex.org/W2736601468","https://openalex.org/W2891830784","https://openalex.org/W2899771611","https://openalex.org/W2945088828","https://openalex.org/W2949267040","https://openalex.org/W2963575966","https://openalex.org/W2963864421","https://openalex.org/W2964118262","https://openalex.org/W2966735560","https://openalex.org/W2968945909","https://openalex.org/W3005347330","https://openalex.org/W3012097656","https://openalex.org/W3098925401","https://openalex.org/W3106238320","https://openalex.org/W4285719527","https://openalex.org/W4294578467","https://openalex.org/W6647175844","https://openalex.org/W6684921986","https://openalex.org/W6729130418","https://openalex.org/W6733118196","https://openalex.org/W6734215269","https://openalex.org/W6741002519","https://openalex.org/W6756040250","https://openalex.org/W6773842061"],"related_works":["https://openalex.org/W2502115930","https://openalex.org/W2482350142","https://openalex.org/W4246396837","https://openalex.org/W4320018150","https://openalex.org/W4239582170","https://openalex.org/W2918664383","https://openalex.org/W106056076","https://openalex.org/W4320855730","https://openalex.org/W2135200719","https://openalex.org/W2383556788"],"abstract_inverted_index":{"Air":[0],"Combat":[1],"is":[2,103],"a":[3,17,94,99,140],"high-risk":[4],"activity":[5],"carried":[6],"out":[7],"by":[8],"trained":[9],"professionals":[10],"operating":[11],"sophisticated":[12],"equipment.":[13],"During":[14],"this":[15,53,102,160],"activity,":[16],"number":[18],"of":[19,73,143,146,199,208],"trade-offs":[20],"have":[21,39],"to":[22,60,117,129,172,185,202],"be":[23,127,155],"made,":[24],"such":[25,97],"as":[26,89,98,157],"the":[27,68,78,165,174,182,194,197,200,209],"balance":[28],"between":[29,77],"risk":[30,37,183],"and":[31,43,80,179],"efficiency.":[32],"A":[33],"policy":[34],"that":[35,45,66,124,153,204],"minimizes":[36],"could":[38],"very":[40,50],"low":[41],"efficiency,":[42],"one":[44],"maximizes":[46],"efficiency":[47],"may":[48],"involve":[49],"high":[51,113],"risk.In":[52],"study,":[54],"we":[55,107],"use":[56],"Reinforcement":[57],"Learning":[58],"(RL)":[59],"create":[61],"Control":[62],"Barrier":[63],"Functions":[64],"(CBF)":[65],"captures":[67],"current":[69],"risk,":[70,193],"in":[71,132,150,159,167],"terms":[72],"worst-case":[74],"future":[75,206],"separation":[76],"aircraft":[79],"an":[81,109,168],"enemy":[82],"missile.":[83],"CBFs":[84,158],"are":[85],"usually":[86],"designed":[87],"manually":[88],"closed-form":[90],"expressions,":[91],"but":[92],"for":[93],"complex":[95],"system":[96,195],"guided":[100],"missile,":[101],"not":[104],"possible.":[105],"Instead,":[106],"solve":[108],"RL":[110,147],"problem":[111],"using":[112],"fidelity":[114],"simulation":[115],"models":[116],"find":[118],"value":[119,151],"functions":[120,152],"with":[121],"CBF":[122],"properties,":[123],"can":[125,154],"then":[126],"used":[128,156],"guarantee":[130,205],"safety":[131],"real":[133],"air":[134,169],"combat":[135,170],"situations.":[136],"We":[137],"also":[138],"provide":[139],"theoretical":[141],"analysis":[142],"what":[144],"family":[145],"problems":[148],"result":[149],"way.The":[161],"proposed":[162],"approach":[163],"allows":[164],"pilot":[166,201],"scenario":[171],"set":[173],"exposure":[175],"level":[176],"deemed":[177],"acceptable":[178,192],"continuously":[180],"monitor":[181],"related":[184],"his/her":[186],"own":[187],"safety.":[188],"Given":[189],"input":[190],"regarding":[191],"limits":[196],"choices":[198],"those":[203],"satisfaction":[207],"provided":[210],"bound.":[211]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
