{"id":"https://openalex.org/W7135063162","doi":"https://doi.org/10.1109/tits.2026.3670584","title":"Safety-Enhanced Deep Reinforcement Learning for Autonomous Driving: Dare to Make Mistakes to Learn Better and Faster","display_name":"Safety-Enhanced Deep Reinforcement Learning for Autonomous Driving: Dare to Make Mistakes to Learn Better and Faster","publication_year":2026,"publication_date":"2026-03-12","ids":{"openalex":"https://openalex.org/W7135063162","doi":"https://doi.org/10.1109/tits.2026.3670584"},"language":null,"primary_location":{"id":"doi:10.1109/tits.2026.3670584","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2026.3670584","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036776153","display_name":"Zhuoren Li","orcid":"https://orcid.org/0000-0001-6246-3404"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhuoren Li","raw_affiliation_strings":["College of Automotive and Energy Engineering, Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-6246-3404","affiliations":[{"raw_affiliation_string":"College of Automotive and Energy Engineering, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121462328","display_name":"Bo Leng","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Leng","raw_affiliation_strings":["College of Automotive and Energy Engineering, Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0003-3513-1708","affiliations":[{"raw_affiliation_string":"College of Automotive and Energy Engineering, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128867348","display_name":"Lu Xiong","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lu Xiong","raw_affiliation_strings":["College of Automotive and Energy Engineering, Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-1673-2658","affiliations":[{"raw_affiliation_string":"College of Automotive and Energy Engineering, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128833435","display_name":"Arno Eichberger","orcid":null},"institutions":[{"id":"https://openalex.org/I4092182","display_name":"Graz University of Technology","ror":"https://ror.org/00d7xrm67","country_code":"AT","type":"education","lineage":["https://openalex.org/I4092182"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Arno Eichberger","raw_affiliation_strings":["Institute of Automotive Engineering, Graz University of Technology, Graz, Austria"],"raw_orcid":"https://orcid.org/0000-0001-8246-8085","affiliations":[{"raw_affiliation_string":"Institute of Automotive Engineering, Graz University of Technology, Graz, Austria","institution_ids":["https://openalex.org/I4092182"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128826411","display_name":"Chao Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I5681781","display_name":"The University of Adelaide","ror":"https://ror.org/00892tw58","country_code":"AU","type":"education","lineage":["https://openalex.org/I5681781"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Chao Huang","raw_affiliation_strings":["School of Electrical and Mechanical Engineering, The University of Adelaide, Adelaide, SA, Australia"],"raw_orcid":"https://orcid.org/0000-0003-3023-4388","affiliations":[{"raw_affiliation_string":"School of Electrical and Mechanical Engineering, The University of Adelaide, Adelaide, SA, Australia","institution_ids":["https://openalex.org/I5681781"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5128874592","display_name":"Jia Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jia Hu","raw_affiliation_strings":["Key Laboratory of Road and Traffic Engineering of the Ministry of Education, Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-0900-7992","affiliations":[{"raw_affiliation_string":"Key Laboratory of Road and Traffic Engineering of the Ministry of Education, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5036776153"],"corresponding_institution_ids":["https://openalex.org/I116953780"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.44287843,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"27","issue":"5","first_page":"5136","last_page":"5148"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.34850001335144043,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.34850001335144043,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.20990000665187836,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.06480000168085098,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.669700026512146},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.32339999079704285},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.31220000982284546},{"id":"https://openalex.org/keywords/error-driven-learning","display_name":"Error-driven learning","score":0.28130000829696655}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.669700026512146},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5626000165939331},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5246999859809875},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.41200000047683716},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3723999857902527},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.32339999079704285},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.31220000982284546},{"id":"https://openalex.org/C47932503","wikidata":"https://www.wikidata.org/wiki/Q5395689","display_name":"Error-driven learning","level":3,"score":0.28130000829696655},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.2653000056743622},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.24089999496936798}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tits.2026.3670584","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2026.3670584","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G351996751","display_name":null,"funder_award_id":"22120230311","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G5638582070","display_name":null,"funder_award_id":"52232015","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G570345465","display_name":null,"funder_award_id":"52372317","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6754950921","display_name":null,"funder_award_id":"52522219","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8125759999","display_name":null,"funder_award_id":"YDZX20233100004027","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320318553","display_name":"Shanghai Automotive Industry Science and Technology Development Foundation","ror":null},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Deep":[0],"Reinforcement":[1],"Learning":[2],"(DRL)":[3],"is":[4],"becoming":[5],"a":[6,47,72,88,196],"prominent":[7],"method":[8,52,193],"for":[9,58],"autonomous":[10],"driving":[11,20,75,94,103,123,156,198,212],"due":[12],"to":[13,17,70,85,99,116,119],"its":[14],"strong":[15],"capability":[16],"generate":[18],"complex":[19],"policy.":[21],"However,":[22],"DRL":[23,74],"motion":[24,60,113],"planning":[25],"still":[26],"has":[27],"limitations":[28],"in":[29,177],"safety":[30,39,55,104,185,207],"performance":[31,208],"including":[32,79],"learning":[33,51,87],"quality,":[34],"convergence":[35,202],"speed":[36],"and":[37,126,164,179],"the":[38,64,102,121,137,141,148,184,191,205,211],"guarantee.":[40],"To":[41],"this":[42,44],"end,":[43],"work":[45],"proposes":[46],"safety-enhanced":[48],"deep":[49],"reinforcement":[50],"with":[53,160,200],"dynamic":[54,174],"guidance":[56],"(DSG-DRL)":[57],"lane-change":[59],"planning.":[61],"It":[62],"bears":[63],"following":[65],"key":[66],"features:":[67],"1)":[68],"Able":[69,84,98],"learn":[71,120,195],"safer":[73,197],"policy":[76,90,124,199],"by":[77,91,105,173],"additionally":[78],"potentially":[80],"unsafe":[81],"behaviors;":[82],"2)":[83],"accelerate":[86],"safe":[89,122],"making":[92],"dangerous":[93,149],"experiences":[95,157],"impressive;":[96],"3)":[97],"further":[100,182],"enhance":[101],"avoiding":[106],"unexpected":[107],"reckless":[108,168],"action.":[109],"The":[110],"proposed":[111,192],"DSG-DRL":[112],"planner":[114],"dares":[115],"make":[117],"mistakes":[118],"better":[125],"faster.":[127],"By":[128],"evaluating":[129],"anticipated":[130],"risk,":[131],"it":[132],"learns":[133],"not":[134],"only":[135],"from":[136,147],"maneuvers":[138,150],"right":[139],"at":[140],"moments":[142],"of":[143],"collisions,":[144],"but":[145],"also":[146],"leading":[151],"towards":[152],"collisions.":[153],"Besides,":[154],"risk":[155],"are":[158],"enhanced":[159],"additional":[161],"memory":[162],"batches":[163],"sampling":[165],"prioritization.":[166],"Moreover,":[167],"actions":[169],"can":[170,194],"be":[171],"prevented":[172],"constraints":[175],"both":[176],"training":[178],"testing,":[180],"which":[181],"improves":[183],"performance.":[186],"Simulation":[187],"validation":[188],"shows":[189],"that":[190],"faster":[201],"speed,":[203],"achieving":[204],"high":[206],"while":[209],"keeping":[210],"efficiency.":[213]},"counts_by_year":[],"updated_date":"2026-05-08T13:12:06.581006","created_date":"2026-03-13T00:00:00"}
