{"id":"https://openalex.org/W3206683817","doi":"https://doi.org/10.1109/access.2021.3119915","title":"Safe Adaptive Deep Reinforcement Learning for Autonomous Driving in Urban Environments. Additional Filter? How and Where?","display_name":"Safe Adaptive Deep Reinforcement Learning for Autonomous Driving in Urban Environments. Additional Filter? How and Where?","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3206683817","doi":"https://doi.org/10.1109/access.2021.3119915","mag":"3206683817"},"language":"en","primary_location":{"id":"doi:10.1109/access.2021.3119915","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3119915","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09570336.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09570336.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043090172","display_name":"Sina Alighanbari","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Sina Alighanbari","raw_affiliation_strings":["SHEVS lab at the Department of Systems Design Engineering, University of Waterloo, ON, Canada. (e-mail: salighanbari@uwaterloo.ca)","Sina Alighanbari is with SHEVS lab at the Department of Systems Design Engineering, University of Waterloo, ON, Canada"],"raw_orcid":"https://orcid.org/0000-0002-5409-7149","affiliations":[{"raw_affiliation_string":"SHEVS lab at the Department of Systems Design Engineering, University of Waterloo, ON, Canada. (e-mail: salighanbari@uwaterloo.ca)","institution_ids":["https://openalex.org/I151746483"]},{"raw_affiliation_string":"Sina Alighanbari is with SHEVS lab at the Department of Systems Design Engineering, University of Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033006881","display_name":"Nasser L. Azad","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Nasser L. Azad","raw_affiliation_strings":["Faculty of Engineering, Department of Systems Design Engineering, University of Waterloo, Waterloo, ON, Canada"],"raw_orcid":"https://orcid.org/0000-0003-1412-7961","affiliations":[{"raw_affiliation_string":"Faculty of Engineering, Department of Systems Design Engineering, University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5043090172"],"corresponding_institution_ids":["https://openalex.org/I151746483"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.2789,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.56047061,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"9","issue":null,"first_page":"141347","last_page":"141359"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10524","display_name":"Traffic control and management","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7891319990158081},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6774348020553589},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.606794536113739},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.5754551887512207},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5652316808700562},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5348721146583557},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5123025178909302},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.49972009658813477},{"id":"https://openalex.org/keywords/automotive-industry","display_name":"Automotive industry","score":0.47977739572525024},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.42795974016189575},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16267302632331848},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16074687242507935},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.1063598096370697}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7891319990158081},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6774348020553589},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.606794536113739},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.5754551887512207},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5652316808700562},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5348721146583557},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5123025178909302},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.49972009658813477},{"id":"https://openalex.org/C526921623","wikidata":"https://www.wikidata.org/wiki/Q190117","display_name":"Automotive industry","level":2,"score":0.47977739572525024},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.42795974016189575},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16267302632331848},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16074687242507935},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.1063598096370697},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2021.3119915","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3119915","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09570336.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:76e3490880734ef799bb7dbb20fe0760","is_oa":true,"landing_page_url":"https://doaj.org/article/76e3490880734ef799bb7dbb20fe0760","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 9, Pp 141347-141359 (2021)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2021.3119915","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3119915","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09570336.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.8100000023841858,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322622","display_name":"Toyota Motor Corporation","ror":"https://ror.org/02zqm6r10"},{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3206683817.pdf","grobid_xml":"https://content.openalex.org/works/W3206683817.grobid-xml"},"referenced_works_count":68,"referenced_works":["https://openalex.org/W75331681","https://openalex.org/W241118364","https://openalex.org/W1515851193","https://openalex.org/W1554663460","https://openalex.org/W1845972764","https://openalex.org/W1972149633","https://openalex.org/W1999874108","https://openalex.org/W2121863487","https://openalex.org/W2124136621","https://openalex.org/W2134491302","https://openalex.org/W2139137304","https://openalex.org/W2145339207","https://openalex.org/W2173248099","https://openalex.org/W2257979135","https://openalex.org/W2462906003","https://openalex.org/W2534320940","https://openalex.org/W2560504659","https://openalex.org/W2619551236","https://openalex.org/W2795485095","https://openalex.org/W2889711700","https://openalex.org/W2892521964","https://openalex.org/W2903709398","https://openalex.org/W2919820522","https://openalex.org/W2930426397","https://openalex.org/W2948802787","https://openalex.org/W2952720101","https://openalex.org/W2962789054","https://openalex.org/W2962867954","https://openalex.org/W2963525569","https://openalex.org/W2963704386","https://openalex.org/W2963744427","https://openalex.org/W2963864421","https://openalex.org/W2966735560","https://openalex.org/W2968788589","https://openalex.org/W2971188105","https://openalex.org/W2972163183","https://openalex.org/W2977639220","https://openalex.org/W2990123902","https://openalex.org/W2992833799","https://openalex.org/W2996430598","https://openalex.org/W2998563746","https://openalex.org/W3003329097","https://openalex.org/W3098925401","https://openalex.org/W3099352109","https://openalex.org/W3105252106","https://openalex.org/W3117590843","https://openalex.org/W3127561923","https://openalex.org/W3129059695","https://openalex.org/W3142005321","https://openalex.org/W3148402047","https://openalex.org/W4214717370","https://openalex.org/W4289119149","https://openalex.org/W4295719664","https://openalex.org/W4297780563","https://openalex.org/W4388297464","https://openalex.org/W6603061627","https://openalex.org/W6682367392","https://openalex.org/W6684921986","https://openalex.org/W6718836005","https://openalex.org/W6745935785","https://openalex.org/W6762806541","https://openalex.org/W6763688752","https://openalex.org/W6768003243","https://openalex.org/W6772666310","https://openalex.org/W6773319185","https://openalex.org/W6777063277","https://openalex.org/W6790735769","https://openalex.org/W6791266996"],"related_works":["https://openalex.org/W4382644535","https://openalex.org/W2522768275","https://openalex.org/W2352938035","https://openalex.org/W4306904969","https://openalex.org/W2351672553","https://openalex.org/W2373392303","https://openalex.org/W2765894405","https://openalex.org/W1884735063","https://openalex.org/W2372668238","https://openalex.org/W2138720691"],"abstract_inverted_index":{"Autonomous":[0],"driving":[1,9],"(AD)":[2],"provides":[3,69],"a":[4,86,261,289],"reliable":[5],"solution":[6],"for":[7,15,104,200,237,270,288],"safe":[8],"by":[10,100,182,216],"replacing":[11],"human":[12],"drivers":[13],"responsible":[14],"the":[16,66,83,114,140,145,150,177,194,211,221,231,271],"majority":[17],"of":[18,22,61,85,116,147,152,196,205,264],"accidents.":[19],"The":[20,59,281],"emergence":[21],"Machine":[23],"Learning,":[24],"specifically":[25],"Deep":[26,105,183],"Reinforcement":[27],"Learning":[28,185],"(DRL),":[29],"and":[30,75,94,134,155,158,170,186,218,227,253,278],"its":[31,38],"ability":[32],"to":[33,40,65,110,131,176,220,292],"solve":[34],"complex":[35],"games":[36],"proved":[37],"potential":[39],"address":[41],"AD":[42],"challenges.":[43],"However,":[44],"model-free":[45],"methods":[46],"still":[47],"suffer":[48],"from":[49,102],"safety-related":[50],"issues":[51],"that":[52,160],"can":[53],"be":[54],"resolved":[55],"using":[56,197],"safe-DRL":[57],"approaches.":[58],"addition":[60,84],"model-based":[62],"safety":[63,70,87,117,248],"filters":[64,118,148],"learning-based":[67],"algorithms":[68],"bounds":[71],"on":[72,90,139],"their":[73],"performance":[74,99,128,223],"constraint":[76],"satisfaction.":[77],"In":[78],"this":[79,276],"paper,":[80],"we":[81,192],"investigate":[82,193],"filter":[88,249],"based":[89],"Model":[91],"Predictive":[92],"Control":[93],"show":[95],"an":[96],"increase":[97,129,166],"in":[98,149,164,167,173,250,275],"110%":[101],"-75":[103],"Deterministic":[106],"Policy":[107],"Gradient":[108],"(DDPG)":[109],"7.758.":[111],"We":[112,143],"study":[113],"impacts":[115],"(7.758":[119],"mean":[120,137,168,212,225],"reward),":[121],"heuristic":[122],"rules,":[123],"bounded":[124,156,161,251],"additive":[125],"noises":[126],"(0.49%":[127],"comparing":[130,175],"noise-free":[132],"case),":[133],"exploration":[135,154,157,162,252],"(3.425":[136],"reward)":[138],"learning":[141,255],"algorithm.":[142],"compare":[144],"effects":[146],"context":[151],"simulated":[153],"prove":[159],"results":[163,232,236,285],"9.86%":[165],"reward":[169,215,226],"12.95%":[171],"decrease":[172],"std":[174],"other":[178,296],"method.":[179],"Additionally,":[180],"inspired":[181],"Internal":[184],"biological":[187],"mechanisms":[188],"like":[189],"brain":[190],"plasticity,":[191],"idea":[195],"each":[198],"sample":[199],"training":[201],"only":[202],"once":[203],"instead":[204],"utilizing":[206],"stochastic":[207],"batches":[208],"which":[209],"increases":[210],"testing":[213],"accumulated":[214],"1.87%":[217],"leads":[219],"best":[222],"(7.942":[224],"0.048":[228],"std).":[229],"Finally,":[230],"demonstrate":[233],"better":[234],"automotive":[235,284],"our":[238,279],"proposed":[239,244,282],"method":[240],"than":[241],"DDPG.":[242],"Our":[243],"method,":[245],"DDPG":[246],"with":[247,295],"adaptive":[254],"under":[256,266],"noisy":[257],"input":[258],"conditions,":[259],"has":[260],"success":[262],"rate":[263],"100%":[265],"different":[267],"traffic":[268],"densities":[269],"simulation":[272],"environment":[273],"used":[274],"paper":[277],"assumptions.":[280],"method\u2019s":[283],"are":[286],"shown":[287],"braking":[290],"scenario":[291],"avoid":[293],"collision":[294],"road":[297],"users.":[298]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
