{"id":"https://openalex.org/W4223511664","doi":"https://doi.org/10.1145/3529399.3529432","title":"Automatically Learning Fallback Strategies with Model-Free Reinforcement Learning in Safety-Critical Driving Scenarios","display_name":"Automatically Learning Fallback Strategies with Model-Free Reinforcement Learning in Safety-Critical Driving Scenarios","publication_year":2022,"publication_date":"2022-03-11","ids":{"openalex":"https://openalex.org/W4223511664","doi":"https://doi.org/10.1145/3529399.3529432"},"language":"en","primary_location":{"id":"doi:10.1145/3529399.3529432","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3529399.3529432","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 7th International Conference on Machine Learning Technologies (ICMLT)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2204.05196","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065194144","display_name":"Ugo Lecerf","orcid":null},"institutions":[{"id":"https://openalex.org/I1301102746","display_name":"Renault (France)","ror":"https://ror.org/04v98kq37","country_code":"FR","type":"company","lineage":["https://openalex.org/I1301102746"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Ugo Lecerf","raw_affiliation_strings":["Renault Software Labs, France"],"affiliations":[{"raw_affiliation_string":"Renault Software Labs, France","institution_ids":["https://openalex.org/I1301102746"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015957130","display_name":"Christelle Yemdji-Tchassi","orcid":null},"institutions":[{"id":"https://openalex.org/I1301102746","display_name":"Renault (France)","ror":"https://ror.org/04v98kq37","country_code":"FR","type":"company","lineage":["https://openalex.org/I1301102746"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Christelle Yemdji-Tchassi","raw_affiliation_strings":["Renault Software Labs, France"],"affiliations":[{"raw_affiliation_string":"Renault Software Labs, France","institution_ids":["https://openalex.org/I1301102746"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032005688","display_name":"S\u00e9bastien Aubert","orcid":null},"institutions":[{"id":"https://openalex.org/I1301102746","display_name":"Renault (France)","ror":"https://ror.org/04v98kq37","country_code":"FR","type":"company","lineage":["https://openalex.org/I1301102746"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Sebastien Aubert","raw_affiliation_strings":["Renault Software Labs, France"],"affiliations":[{"raw_affiliation_string":"Renault Software Labs, France","institution_ids":["https://openalex.org/I1301102746"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017009335","display_name":"Pietro Michiardi","orcid":"https://orcid.org/0000-0003-4675-7677"},"institutions":[{"id":"https://openalex.org/I1902872","display_name":"EURECOM","ror":"https://ror.org/00sse7z02","country_code":"FR","type":"education","lineage":["https://openalex.org/I1902872","https://openalex.org/I205703379"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Pietro Michiardi","raw_affiliation_strings":["Data Science, EURECOM, France"],"affiliations":[{"raw_affiliation_string":"Data Science, EURECOM, France","institution_ids":["https://openalex.org/I1902872"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5065194144"],"corresponding_institution_ids":["https://openalex.org/I1301102746"],"apc_list":null,"apc_paid":null,"fwci":0.138,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.51605152,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"209","last_page":"215"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9821000099182129,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8704893589019775},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.704479455947876},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3737267255783081},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3544754385948181}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8704893589019775},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.704479455947876},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3737267255783081},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3544754385948181}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3529399.3529432","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3529399.3529432","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 7th International Conference on Machine Learning Technologies (ICMLT)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2204.05196","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.05196","pdf_url":"https://arxiv.org/pdf/2204.05196","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2204.05196","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.05196","pdf_url":"https://arxiv.org/pdf/2204.05196","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.5099999904632568,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W567721252","https://openalex.org/W1771410628","https://openalex.org/W2121092017","https://openalex.org/W2126316555","https://openalex.org/W2145339207","https://openalex.org/W2201581102","https://openalex.org/W2545546008","https://openalex.org/W2607662938","https://openalex.org/W2607713949","https://openalex.org/W2751621024","https://openalex.org/W2761873684","https://openalex.org/W2913668833","https://openalex.org/W2945850646","https://openalex.org/W2950040888","https://openalex.org/W2953021786","https://openalex.org/W2953303875","https://openalex.org/W2970787054","https://openalex.org/W2979869797","https://openalex.org/W2989958156","https://openalex.org/W2996037775","https://openalex.org/W3018207341","https://openalex.org/W3034956653","https://openalex.org/W3119981760","https://openalex.org/W3148740559","https://openalex.org/W4212774754","https://openalex.org/W4214717370","https://openalex.org/W4287867830","https://openalex.org/W4288328070","https://openalex.org/W4288331462","https://openalex.org/W4300799055","https://openalex.org/W4301379696","https://openalex.org/W6687681856"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2138720691","https://openalex.org/W2376932109","https://openalex.org/W4362501864","https://openalex.org/W2001405890"],"abstract_inverted_index":{"When":[0],"learning":[1],"to":[2,25,32,45,60,83,93,97,106],"behave":[3],"in":[4,17,41,78,87],"a":[5,15,30,75],"stochastic":[6],"environment":[7],"where":[8],"safety":[9],"is":[10,20,37,104],"critical,":[11],"such":[12,52],"as":[13,29],"driving":[14],"vehicle":[16],"traffic,":[18],"it":[19,103],"natural":[21],"for":[22,51,57],"human":[23],"drivers":[24],"plan":[26],"fallback":[27,85],"strategies":[28,86,109],"backup":[31],"use":[33,84],"if":[34],"ever":[35],"there":[36],"an":[38,98],"unexpected":[39],"change":[40],"the":[42,47,88,111,120],"environment.":[43],"Knowing":[44],"expect":[46],"unexpected,":[48],"and":[49,63,81],"planning":[50],"outcomes,":[53],"increases":[54],"our":[55],"capability":[56],"being":[58],"robust":[59],"unseen":[61],"scenarios":[62],"may":[64],"help":[65],"prevent":[66],"catastrophic":[67],"failures.":[68],"Control":[69],"of":[70,90],"Autonomous":[71],"Vehicles":[72],"(AVs)":[73],"has":[74],"particular":[76],"interest":[77,89],"knowing":[79],"when":[80],"how":[82],"safety.":[91],"Due":[92],"imperfect":[94],"information":[95],"available":[96],"AV":[99],"about":[100],"its":[101],"environment,":[102],"important":[105],"have":[107,116],"alternate":[108],"at":[110],"ready":[112],"which":[113],"might":[114],"not":[115],"been":[117],"deduced":[118],"from":[119],"original":[121],"training":[122],"data":[123],"distribution.":[124]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
