{"id":"https://openalex.org/W7135086063","doi":"https://doi.org/10.1111/exsy.70240","title":"<scp>EGSI</scp> \u2010 <scp>PPO</scp> : An Evolutionary\u2010Guided Self\u2010Imitation Reinforcement Learning Framework for Autonomous Parking","display_name":"<scp>EGSI</scp> \u2010 <scp>PPO</scp> : An Evolutionary\u2010Guided Self\u2010Imitation Reinforcement Learning Framework for Autonomous Parking","publication_year":2026,"publication_date":"2026-03-12","ids":{"openalex":"https://openalex.org/W7135086063","doi":"https://doi.org/10.1111/exsy.70240"},"language":"en","primary_location":{"id":"doi:10.1111/exsy.70240","is_oa":false,"landing_page_url":"https://doi.org/10.1111/exsy.70240","pdf_url":null,"source":{"id":"https://openalex.org/S72232612","display_name":"Expert Systems","issn_l":"0266-4720","issn":["0266-4720","1468-0394"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Expert Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128861411","display_name":"Liang Hou","orcid":null},"institutions":[{"id":"https://openalex.org/I22716506","display_name":"Lanzhou University of Technology","ror":"https://ror.org/03panb555","country_code":"CN","type":"education","lineage":["https://openalex.org/I22716506"]},{"id":"https://openalex.org/I4210096345","display_name":"City University","ror":"https://ror.org/00r1j9q42","country_code":"BD","type":"education","lineage":["https://openalex.org/I4210096345"]},{"id":"https://openalex.org/I4210140336","display_name":"Lanzhou City University","ror":"https://ror.org/03cd4ja39","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210140336"]},{"id":"https://openalex.org/I76214153","display_name":"Lanzhou University","ror":"https://ror.org/01mkqqe32","country_code":"CN","type":"education","lineage":["https://openalex.org/I76214153"]}],"countries":["BD","CN"],"is_corresponding":true,"raw_author_name":"Liang Hou","raw_affiliation_strings":["Gansu Engineering Research Center of Manufacturing Information Lanzhou University of Technology  Lanzhou China","School of Information Engineering Lanzhou City University  Lanzhou China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Gansu Engineering Research Center of Manufacturing Information Lanzhou University of Technology  Lanzhou China","institution_ids":["https://openalex.org/I22716506"]},{"raw_affiliation_string":"School of Information Engineering Lanzhou City University  Lanzhou China","institution_ids":["https://openalex.org/I4210140336","https://openalex.org/I76214153","https://openalex.org/I4210096345"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002467266","display_name":"F Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I22716506","display_name":"Lanzhou University of Technology","ror":"https://ror.org/03panb555","country_code":"CN","type":"education","lineage":["https://openalex.org/I22716506"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fan Zhang","raw_affiliation_strings":["School of Computer and Artificial Intelligence Lanzhou University of Technology  Lanzhou China"],"raw_orcid":"https://orcid.org/0009-0001-3173-6382","affiliations":[{"raw_affiliation_string":"School of Computer and Artificial Intelligence Lanzhou University of Technology  Lanzhou China","institution_ids":["https://openalex.org/I22716506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128890816","display_name":"Jie Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I22716506","display_name":"Lanzhou University of Technology","ror":"https://ror.org/03panb555","country_code":"CN","type":"education","lineage":["https://openalex.org/I22716506"]},{"id":"https://openalex.org/I4210096345","display_name":"City University","ror":"https://ror.org/00r1j9q42","country_code":"BD","type":"education","lineage":["https://openalex.org/I4210096345"]},{"id":"https://openalex.org/I4210140336","display_name":"Lanzhou City University","ror":"https://ror.org/03cd4ja39","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210140336"]},{"id":"https://openalex.org/I76214153","display_name":"Lanzhou University","ror":"https://ror.org/01mkqqe32","country_code":"CN","type":"education","lineage":["https://openalex.org/I76214153"]}],"countries":["BD","CN"],"is_corresponding":false,"raw_author_name":"Jie Cao","raw_affiliation_strings":["Gansu Engineering Research Center of Manufacturing Information Lanzhou University of Technology  Lanzhou China","School of Information Engineering Lanzhou City University  Lanzhou China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Gansu Engineering Research Center of Manufacturing Information Lanzhou University of Technology  Lanzhou China","institution_ids":["https://openalex.org/I22716506"]},{"raw_affiliation_string":"School of Information Engineering Lanzhou City University  Lanzhou China","institution_ids":["https://openalex.org/I4210140336","https://openalex.org/I76214153","https://openalex.org/I4210096345"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128906731","display_name":"Nana Lian","orcid":null},"institutions":[{"id":"https://openalex.org/I22716506","display_name":"Lanzhou University of Technology","ror":"https://ror.org/03panb555","country_code":"CN","type":"education","lineage":["https://openalex.org/I22716506"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nana Lian","raw_affiliation_strings":["School of Computer and Artificial Intelligence Lanzhou University of Technology  Lanzhou China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer and Artificial Intelligence Lanzhou University of Technology  Lanzhou China","institution_ids":["https://openalex.org/I22716506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5128882176","display_name":"Xudong Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210118272","display_name":"Gansu Provincial Maternal and Child Health Hospital","ror":"https://ror.org/02n9as466","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I4210118272"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xudong Liu","raw_affiliation_strings":["Medical Department Gansu Provincial Maternal and Child Health Hospital  Lanzhou China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Medical Department Gansu Provincial Maternal and Child Health Hospital  Lanzhou China","institution_ids":["https://openalex.org/I4210118272"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5128861411"],"corresponding_institution_ids":["https://openalex.org/I22716506","https://openalex.org/I4210096345","https://openalex.org/I4210140336","https://openalex.org/I76214153"],"apc_list":{"value":3860,"currency":"USD","value_usd":3860},"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.52400778,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"43","issue":"4","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.5214999914169312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.5214999914169312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.1451999992132187,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.08129999786615372,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8295999765396118},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6344000101089478},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.5776000022888184},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.4618000090122223},{"id":"https://openalex.org/keywords/evolutionary-algorithm","display_name":"Evolutionary algorithm","score":0.41819998621940613},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.3756999969482422},{"id":"https://openalex.org/keywords/autonomous-system","display_name":"Autonomous system (mathematics)","score":0.3296999931335449},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.3296999931335449}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8295999765396118},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8277000188827515},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6344000101089478},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.5776000022888184},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.4618000090122223},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4458000063896179},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.41819998621940613},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.3756999969482422},{"id":"https://openalex.org/C9628104","wikidata":"https://www.wikidata.org/wiki/Q788009","display_name":"Autonomous system (mathematics)","level":2,"score":0.3296999931335449},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.3296999931335449},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.32199999690055847},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.3203999996185303},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.31119999289512634},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.3100999891757965},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.30169999599456787},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2921999990940094},{"id":"https://openalex.org/C105902424","wikidata":"https://www.wikidata.org/wiki/Q1197129","display_name":"Evolutionary computation","level":2,"score":0.29010000824928284},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.28540000319480896},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.2825999855995178},{"id":"https://openalex.org/C57869625","wikidata":"https://www.wikidata.org/wiki/Q1783502","display_name":"Rate of convergence","level":3,"score":0.27000001072883606},{"id":"https://openalex.org/C8880873","wikidata":"https://www.wikidata.org/wiki/Q187787","display_name":"Genetic algorithm","level":2,"score":0.25040000677108765},{"id":"https://openalex.org/C205875254","wikidata":"https://www.wikidata.org/wiki/Q17156857","display_name":"Decentralised system","level":3,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1111/exsy.70240","is_oa":false,"landing_page_url":"https://doi.org/10.1111/exsy.70240","pdf_url":null,"source":{"id":"https://openalex.org/S72232612","display_name":"Expert Systems","issn_l":"0266-4720","issn":["0266-4720","1468-0394"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Expert Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W3092297010","https://openalex.org/W3098094428","https://openalex.org/W3116329154","https://openalex.org/W3158260269","https://openalex.org/W3214452188","https://openalex.org/W4352977012","https://openalex.org/W4379518963","https://openalex.org/W4385566404","https://openalex.org/W4385758763","https://openalex.org/W4387460941","https://openalex.org/W4388430270","https://openalex.org/W4388579628","https://openalex.org/W4388783832","https://openalex.org/W4392208019","https://openalex.org/W4401120967","https://openalex.org/W4401162484","https://openalex.org/W4402209187","https://openalex.org/W4406250560","https://openalex.org/W4408657315","https://openalex.org/W4408859815","https://openalex.org/W4410915161","https://openalex.org/W4411152984","https://openalex.org/W4412195129","https://openalex.org/W4415281381"],"related_works":[],"abstract_inverted_index":{"ABSTRACT":[0],"With":[1],"advances":[2],"in":[3,34,170,214],"autonomous":[4,7,207],"driving":[5],"technology,":[6],"parking\u2014an":[8],"indispensable":[9],"capability":[10],"of":[11,54,61,105,132,185],"intelligent":[12],"vehicles\u2014has":[13],"emerged":[14],"as":[15],"a":[16,46,115,123],"focal":[17],"point":[18],"for":[19,206],"both":[20],"academia":[21],"and":[22,70,100,113,122,139,164,175,189,200,209],"industry.":[23],"To":[24,108],"mitigate":[25],"the":[26,51,58,72,84,102,129,145,154,182,186,190,211],"slow":[27],"convergence":[28,99,176],"caused":[29],"by":[30,219],"sparse":[31,88,220],"reward":[32,118],"signals":[33,93],"parking":[35,110,173,208],"tasks,":[36],"this":[37,195],"study":[38],"introduces":[39],"Evolutionary\u2010Guided":[40],"Self\u2010Imitation":[41],"Proximal":[42],"Policy":[43],"Optimisation":[44],"(EGSI\u2010PPO),":[45],"novel":[47],"algorithm":[48],"that":[49],"fuses":[50],"exploratory":[52],"diversity":[53,69],"evolutionary":[55,65,187],"strategies":[56],"with":[57,161],"trajectory\u2010guided":[59],"supervision":[60],"self\u2010imitation":[62,85,191],"learning.":[63],"The":[64],"component":[66,86,188],"maintains":[67],"policy":[68,103,146],"enlarges":[71],"search":[73],"space":[74],"through":[75],"population\u2010based":[76],"parallel":[77],"evolution,":[78],"thereby":[79],"enhancing":[80],"global":[81],"exploration,":[82],"while":[83],"transforms":[87],"rewards":[89],"into":[90],"dense":[91],"supervisory":[92],"using":[94],"high\u2010return":[95],"trajectories,":[96],"simultaneously":[97],"accelerating":[98],"guiding":[101],"out":[104],"suboptimal":[106],"traps.":[107],"balance":[109],"accuracy,":[111,174],"efficiency,":[112],"smoothness,":[114],"composite":[116],"multi\u2010objective":[117],"function":[119],"is":[120],"formulated,":[121],"meta\u2010gradient":[124],"weight\u2010balancing":[125],"mechanism":[126],"automatically":[127],"adjusts":[128],"relative":[130],"importance":[131],"each":[133],"sub\u2010objective.":[134],"In":[135],"addition,":[136],"action\u2010level":[137],"smoothing":[138],"physical":[140],"constraints":[141],"are":[142],"imposed":[143],"at":[144],"output":[147],"to":[148],"ensure":[149],"practical":[150],"deployability.":[151],"Experiments":[152],"on":[153],"Webots":[155],"simulation":[156],"platform":[157],"show":[158],"that,":[159],"compared":[160],"SAC,":[162],"DDPG,":[163],"TD3,":[165],"EGSI\u2010PPO":[166],"delivers":[167],"significant":[168],"improvements":[169],"success":[171],"rate,":[172],"speed.":[177],"Ablation":[178],"studies":[179],"further":[180],"confirm":[181],"individual":[183],"contributions":[184],"learning":[192,204],"module.":[193],"Overall,":[194],"work":[196],"provides":[197],"an":[198],"efficient":[199],"robust":[201],"deep":[202],"reinforcement":[203],"solution":[205],"demonstrates":[210],"algorithm's":[212],"potential":[213],"continuous":[215],"control":[216],"tasks":[217],"characterised":[218],"rewards.":[221]},"counts_by_year":[],"updated_date":"2026-03-14T06:41:57.775601","created_date":"2026-03-13T00:00:00"}
