{"id":"https://openalex.org/W4401414373","doi":"https://doi.org/10.1109/cec60901.2024.10611776","title":"Reinforcement Learning with Safe Action Generation for Autonomous Racing","display_name":"Reinforcement Learning with Safe Action Generation for Autonomous Racing","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4401414373","doi":"https://doi.org/10.1109/cec60901.2024.10611776"},"language":"en","primary_location":{"id":"doi:10.1109/cec60901.2024.10611776","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cec60901.2024.10611776","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Congress on Evolutionary Computation (CEC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080051493","display_name":"Jiacheng Yang","orcid":"https://orcid.org/0009-0002-9581-9088"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiacheng Yang","raw_affiliation_strings":["School of Automation Southeast University,Nanjing,China"],"affiliations":[{"raw_affiliation_string":"School of Automation Southeast University,Nanjing,China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076608243","display_name":"Yuanda Wang","orcid":"https://orcid.org/0000-0001-8002-8131"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanda Wang","raw_affiliation_strings":["School of Automation Southeast University,Nanjing,China"],"affiliations":[{"raw_affiliation_string":"School of Automation Southeast University,Nanjing,China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088413924","display_name":"Lu Dong","orcid":"https://orcid.org/0000-0001-6737-1381"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lu Dong","raw_affiliation_strings":["School of Automation Southeast University,Nanjing,China"],"affiliations":[{"raw_affiliation_string":"School of Automation Southeast University,Nanjing,China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044749695","display_name":"Xin Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Yuan","raw_affiliation_strings":["School of Automation Southeast University,Nanjing,China"],"affiliations":[{"raw_affiliation_string":"School of Automation Southeast University,Nanjing,China","institution_ids":["https://openalex.org/I76569877"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5080051493"],"corresponding_institution_ids":["https://openalex.org/I76569877"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10584848,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"30","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.781358003616333},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.597149133682251},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5866830945014954},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4818078875541687},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42339494824409485},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3655128479003906},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.27563440799713135},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.05695611238479614}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.781358003616333},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.597149133682251},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5866830945014954},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4818078875541687},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42339494824409485},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3655128479003906},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.27563440799713135},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.05695611238479614},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cec60901.2024.10611776","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cec60901.2024.10611776","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Congress on Evolutionary Computation (CEC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2047372702","display_name":null,"funder_award_id":"62103104,62173251,62203113","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6287495588","display_name":null,"funder_award_id":"BK20210215","funder_id":"https://openalex.org/F4320322769","funder_display_name":"Natural Science Foundation of Jiangsu Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322769","display_name":"Natural Science Foundation of Jiangsu Province","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W1574474448","https://openalex.org/W2154844948","https://openalex.org/W2558738305","https://openalex.org/W2586823359","https://openalex.org/W2736601468","https://openalex.org/W2784465508","https://openalex.org/W2869375357","https://openalex.org/W2907214660","https://openalex.org/W2914283047","https://openalex.org/W2948175577","https://openalex.org/W2968983352","https://openalex.org/W2981194798","https://openalex.org/W2999762404","https://openalex.org/W3006463925","https://openalex.org/W3021958118","https://openalex.org/W3044457827","https://openalex.org/W3068678661","https://openalex.org/W3096541271","https://openalex.org/W3096954237","https://openalex.org/W3102621632","https://openalex.org/W3112591948","https://openalex.org/W3126641549","https://openalex.org/W3136325136","https://openalex.org/W3174380524","https://openalex.org/W3201929238","https://openalex.org/W4211094662","https://openalex.org/W4226239849","https://openalex.org/W4226534167","https://openalex.org/W4244493510","https://openalex.org/W4281480521","https://openalex.org/W4281705700","https://openalex.org/W4283793632","https://openalex.org/W4285228542","https://openalex.org/W4286374783","https://openalex.org/W4287203155","https://openalex.org/W4294555834","https://openalex.org/W4312637175","https://openalex.org/W4313478129","https://openalex.org/W4317553716","https://openalex.org/W4366748330","https://openalex.org/W4391307842","https://openalex.org/W4393397186","https://openalex.org/W6634423325","https://openalex.org/W6683397050","https://openalex.org/W6730344819","https://openalex.org/W6738483526","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6747790125","https://openalex.org/W6748839928","https://openalex.org/W6758919432","https://openalex.org/W6768916879","https://openalex.org/W6784643869","https://openalex.org/W6838701874"],"related_works":["https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291","https://openalex.org/W1987513656"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1],"(RL)":[2],"has":[3],"been":[4],"successfully":[5],"applied":[6],"to":[7,60,107,144],"tackle":[8],"many":[9],"complex":[10],"decision-making":[11],"tasks.":[12],"However,":[13],"a":[14,45,52,72],"critical":[15],"problem":[16,48],"is":[17,42,97,105],"the":[18,62,86,89,95,101,113,116,145,148,154,159,165,168],"unsafe":[19,109],"exploration":[20,114],"when":[21],"deploying":[22],"classical":[23],"model-free":[24],"RL":[25,37,117],"methods":[26],"in":[27,91,121],"safety-critical":[28],"systems.":[29],"In":[30],"this":[31],"paper,":[32],"we":[33],"focus":[34],"on":[35],"safe":[36],"for":[38],"autonomous":[39],"racing,":[40],"which":[41],"formulated":[43],"as":[44,99],"multi-objective":[46],"optimization":[47],"(MOP).":[49],"We":[50],"propose":[51],"novel":[53],"mechanism,":[54,150],"named":[55],"Safe":[56],"Action":[57],"Generation":[58],"(SAG),":[59],"address":[61],"above":[63],"challenge.":[64],"The":[65,81,122],"mechanism":[66],"mainly":[67],"consists":[68],"of":[69,88,115,140,156],"two":[70],"modules:":[71],"risk":[73,82],"prediction":[74,83],"module":[75,84,104],"and":[76,93,175],"an":[77,137],"action":[78,102],"generation":[79,103],"module.":[80],"monitors":[85],"state":[87,96],"vehicle":[90,173],"real-time,":[92],"once":[94],"evaluated":[98],"risky,":[100],"activated":[106],"prevent":[108],"behavior":[110],"by":[111,161],"restricting":[112],"agent.":[118],"Extensive":[119],"experiments":[120],"Open":[123],"Racing":[124],"Car":[125],"Simulator":[126],"(TORCS)":[127],"demonstrate":[128],"that":[129],"our":[130,151],"approach":[131,152],"can":[132,171],"complete":[133],"one":[134],"lap":[135],"at":[136],"average":[138],"speed":[139],"108":[141],"km/h,":[142],"Compared":[143],"baseline":[146],"without":[147],"SAG":[149],"reduces":[153],"instances":[155],"driving":[157],"off":[158],"track":[160],"97.7%.":[162],"By":[163],"using":[164],"proposed":[166],"framework,":[167],"learned":[169],"policy":[170],"improve":[172],"safety":[174],"generalization":[176],"performance.":[177]},"counts_by_year":[],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
