{"id":"https://openalex.org/W4405895876","doi":"https://doi.org/10.1109/tcyb.2024.3518697","title":"Risk-Conscious Mutations in Jump-Start Reinforcement Learning for Autonomous Racing Policy","display_name":"Risk-Conscious Mutations in Jump-Start Reinforcement Learning for Autonomous Racing Policy","publication_year":2024,"publication_date":"2024-12-30","ids":{"openalex":"https://openalex.org/W4405895876","doi":"https://doi.org/10.1109/tcyb.2024.3518697","pmid":"https://pubmed.ncbi.nlm.nih.gov/40030835"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2024.3518697","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2024.3518697","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102936751","display_name":"Xiaohui Hou","orcid":"https://orcid.org/0000-0002-5673-2396"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaohui Hou","raw_affiliation_strings":["School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Minggang Gan","orcid":"https://orcid.org/0000-0002-2163-2475"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minggang Gan","raw_affiliation_strings":["School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046442810","display_name":"Wei Wu","orcid":"https://orcid.org/0000-0003-1388-3511"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Wu","raw_affiliation_strings":["School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068593680","display_name":"Shiyue Zhao","orcid":"https://orcid.org/0000-0001-6742-2767"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiyue Zhao","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107939210","display_name":"Yuan Ji","orcid":"https://orcid.org/0000-0002-5991-2421"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yuan Ji","raw_affiliation_strings":["School of Mechanical and Aerospace Engineering, Nanyang Technological University, Nanyang Avenue, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Mechanical and Aerospace Engineering, Nanyang Technological University, Nanyang Avenue, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":null,"display_name":"Jie Chen","orcid":"https://orcid.org/0000-0003-2449-9793"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Chen","raw_affiliation_strings":["National Key Laboratory of Autonomous Intelligent Unmanned Systems, Harbin Institute of Technology, Harbin, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Intelligent Unmanned Systems, Harbin Institute of Technology, Harbin, China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5102936751"],"corresponding_institution_ids":["https://openalex.org/I125839683"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21869131,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"55","issue":"2","first_page":"638","last_page":"648"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9621999859809875,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12810","display_name":"Real-time simulation and control systems","score":0.9465000033378601,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6630873680114746},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5903376340866089},{"id":"https://openalex.org/keywords/jump","display_name":"Jump","score":0.5828506946563721},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.422006756067276},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.3410831689834595},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.340015709400177},{"id":"https://openalex.org/keywords/aeronautics","display_name":"Aeronautics","score":0.3392123579978943},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3078664541244507},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.25866398215293884},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.23895490169525146},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.06370443105697632}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6630873680114746},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5903376340866089},{"id":"https://openalex.org/C2780695682","wikidata":"https://www.wikidata.org/wiki/Q4005959","display_name":"Jump","level":2,"score":0.5828506946563721},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.422006756067276},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3410831689834595},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.340015709400177},{"id":"https://openalex.org/C178802073","wikidata":"https://www.wikidata.org/wiki/Q8421","display_name":"Aeronautics","level":1,"score":0.3392123579978943},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3078664541244507},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.25866398215293884},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.23895490169525146},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.06370443105697632},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcyb.2024.3518697","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2024.3518697","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:40030835","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40030835","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1127291761","display_name":null,"funder_award_id":"62303058","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W159963257","https://openalex.org/W1777783943","https://openalex.org/W1974795838","https://openalex.org/W2020053297","https://openalex.org/W2053918437","https://openalex.org/W2083630125","https://openalex.org/W2100458216","https://openalex.org/W2335306738","https://openalex.org/W2410617946","https://openalex.org/W2771506457","https://openalex.org/W2796775309","https://openalex.org/W2811282447","https://openalex.org/W2908261578","https://openalex.org/W2990733219","https://openalex.org/W3034445502","https://openalex.org/W3112591948","https://openalex.org/W3130292943","https://openalex.org/W3135337759","https://openalex.org/W3168828539","https://openalex.org/W3209083247","https://openalex.org/W4210870706","https://openalex.org/W4220857253","https://openalex.org/W4225495521","https://openalex.org/W4225620867","https://openalex.org/W4225642194","https://openalex.org/W4226116356","https://openalex.org/W4284688875","https://openalex.org/W4285600734","https://openalex.org/W4285805523","https://openalex.org/W4287203155","https://openalex.org/W4294292690","https://openalex.org/W4315797158","https://openalex.org/W4366566350","https://openalex.org/W4366748330","https://openalex.org/W4385322538","https://openalex.org/W4385539610","https://openalex.org/W4387159219","https://openalex.org/W4387526460","https://openalex.org/W4400188071","https://openalex.org/W4402713068","https://openalex.org/W4402808998","https://openalex.org/W6606518713","https://openalex.org/W6746316224","https://openalex.org/W6747473740","https://openalex.org/W6768916879","https://openalex.org/W6810450869","https://openalex.org/W6810739325","https://openalex.org/W6839258344","https://openalex.org/W6848797572","https://openalex.org/W6851269015"],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291","https://openalex.org/W1987513656"],"abstract_inverted_index":{"This":[0],"study":[1],"focuses":[2],"on":[3,110],"trajectory":[4],"planning":[5,34],"and":[6,26,46,59,71,88,135,161],"motion":[7],"control":[8,35,50,95],"policies":[9],"in":[10,41,86,147,158],"autonomous":[11,166],"racing,":[12],"which":[13],"necessitates":[14],"pushing":[15],"the":[16,60,105,117,127,163],"capacity":[17],"boundaries":[18],"of":[19,132,165],"racing":[20],"vehicles":[21],"to":[22,76,99,126],"achieve":[23],"maximum":[24],"speeds":[25],"minimal":[27],"lap":[28],"times.":[29],"We":[30],"propose":[31],"an":[32],"innovative":[33],"framework":[36],"that":[37,97,141],"integrates":[38],"risk-conscious":[39,61],"mutations":[40],"jump-start":[42,56],"reinforcement":[43,65],"learning":[44,58],"(RCM-JSRL)":[45],"nonlinear":[47],"model":[48],"predictive":[49],"(NMPC).":[51],"The":[52],"RCM-JSRL":[53],"algorithm":[54,63],"incorporates":[55],"curriculum":[57],"genetic":[62],"into":[64],"learning,":[66],"leveraging":[67],"prior":[68],"expert":[69],"knowledge":[70],"a":[72,122],"curiosity-driven":[73],"exploration":[74],"mechanism":[75],"enhance":[77],"training":[78,109],"efficiency":[79,152],"while":[80,103],"avoiding":[81],"excessively":[82],"conservative":[83],"policy":[84,124],"generation":[85],"high-complexity":[87],"high-risk":[89],"scenarios.":[90],"NMPC":[91],"generates":[92],"locally":[93],"optimal":[94],"commands":[96],"adhere":[98],"vehicle":[100],"dynamics":[101],"constraints":[102],"following":[104],"designated":[106],"trajectory.":[107],"Following":[108],"track":[111],"maps":[112],"with":[113],"varying":[114],"difficulty":[115],"levels,":[116],"proposed":[118],"controller":[119],"successfully":[120],"executes":[121],"superior":[123],"compared":[125],"guide":[128],"policy,":[129],"providing":[130],"evidence":[131],"its":[133],"effectiveness":[134],"scalability.":[136],"It":[137],"is":[138],"our":[139],"belief":[140],"this":[142],"technology":[143],"can":[144],"be":[145],"applied":[146],"everyday":[148],"driving":[149,167],"scenarios,":[150],"improving":[151],"under":[153],"special":[154],"conditions,":[155],"ensuring":[156],"stability":[157],"critical":[159],"situations,":[160],"broadening":[162],"scope":[164],"applications.":[168]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
