{"id":"https://openalex.org/W4416366111","doi":"https://doi.org/10.1016/j.compeleceng.2025.110836","title":"Prioritized Experience Replay and Four-Trajectory Exploration - Multi-agents Proximal Policy Optimization: Multi-agents Reinforcement Learning-Based service migration strategy under vehicular edge computing","display_name":"Prioritized Experience Replay and Four-Trajectory Exploration - Multi-agents Proximal Policy Optimization: Multi-agents Reinforcement Learning-Based service migration strategy under vehicular edge computing","publication_year":2025,"publication_date":"2025-11-19","ids":{"openalex":"https://openalex.org/W4416366111","doi":"https://doi.org/10.1016/j.compeleceng.2025.110836"},"language":"en","primary_location":{"id":"doi:10.1016/j.compeleceng.2025.110836","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.compeleceng.2025.110836","pdf_url":null,"source":{"id":"https://openalex.org/S121340289","display_name":"Computers & Electrical Engineering","issn_l":"0045-7906","issn":["0045-7906","1879-0755"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers and Electrical Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.compeleceng.2025.110836","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101618343","display_name":"Lei Ye","orcid":"https://orcid.org/0009-0003-1093-6363"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Ye","raw_affiliation_strings":["School of Microelectronics and Communication Engineering, Chongqing University, Chongqing, 400044, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Microelectronics and Communication Engineering, Chongqing University, Chongqing, 400044, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yulan Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yulan Chen","raw_affiliation_strings":["School of Microelectronics and Communication Engineering, Chongqing University, Chongqing, 400044, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Microelectronics and Communication Engineering, Chongqing University, Chongqing, 400044, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056655082","display_name":"Qingwen Han","orcid":"https://orcid.org/0000-0002-1517-7701"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qingwen Han","raw_affiliation_strings":["School of Microelectronics and Communication Engineering, Chongqing University, Chongqing, 400044, China"],"raw_orcid":"https://orcid.org/0000-0002-1517-7701","affiliations":[{"raw_affiliation_string":"School of Microelectronics and Communication Engineering, Chongqing University, Chongqing, 400044, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101624634","display_name":"Lingqiu Zeng","orcid":"https://orcid.org/0000-0002-5133-4153"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lingqiu Zeng","raw_affiliation_strings":["College of Computer Science, Chongqing University, Chongqing, 400044, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science, Chongqing University, Chongqing, 400044, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076324064","display_name":"Kaiwen Ling","orcid":"https://orcid.org/0000-0002-4920-0877"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaiwen Ling","raw_affiliation_strings":["School of Microelectronics and Communication Engineering, Chongqing University, Chongqing, 400044, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Microelectronics and Communication Engineering, Chongqing University, Chongqing, 400044, China","institution_ids":["https://openalex.org/I158842170"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5056655082"],"corresponding_institution_ids":["https://openalex.org/I158842170"],"apc_list":{"value":3100,"currency":"USD","value_usd":3100},"apc_paid":{"value":3100,"currency":"USD","value_usd":3100},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.38513204,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"129","issue":null,"first_page":"110836","last_page":"110836"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.30570000410079956,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.30570000410079956,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10761","display_name":"Vehicular Ad Hoc Networks (VANETs)","score":0.21220000088214874,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.19769999384880066,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8025000095367432},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6039999723434448},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.5485000014305115},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.5349000096321106},{"id":"https://openalex.org/keywords/service","display_name":"Service (business)","score":0.46050000190734863},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.4438999891281128},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.43059998750686646},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.3756999969482422},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.36480000615119934}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8025000095367432},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7340999841690063},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6039999723434448},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.5485000014305115},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5440999865531921},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.5349000096321106},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.46050000190734863},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.4438999891281128},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.43059998750686646},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3756999969482422},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.36480000615119934},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.35499998927116394},{"id":"https://openalex.org/C116537","wikidata":"https://www.wikidata.org/wiki/Q2169973","display_name":"Service provider","level":3,"score":0.34940001368522644},{"id":"https://openalex.org/C47796450","wikidata":"https://www.wikidata.org/wiki/Q508378","display_name":"Intelligent transportation system","level":2,"score":0.3465999960899353},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.33570000529289246},{"id":"https://openalex.org/C140781008","wikidata":"https://www.wikidata.org/wiki/Q1221081","display_name":"Service quality","level":3,"score":0.33340001106262207},{"id":"https://openalex.org/C192448918","wikidata":"https://www.wikidata.org/wiki/Q682677","display_name":"Vehicular ad hoc network","level":4,"score":0.32659998536109924},{"id":"https://openalex.org/C107568181","wikidata":"https://www.wikidata.org/wiki/Q5319000","display_name":"Dynamic priority scheduling","level":3,"score":0.32280001044273376},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.28439998626708984},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28299999237060547},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C207267971","wikidata":"https://www.wikidata.org/wiki/Q120208","display_name":"Emerging technologies","level":2,"score":0.26980000734329224},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.2669000029563904},{"id":"https://openalex.org/C15587899","wikidata":"https://www.wikidata.org/wiki/Q7455812","display_name":"Service system","level":3,"score":0.2612000107765198},{"id":"https://openalex.org/C55416958","wikidata":"https://www.wikidata.org/wiki/Q6206757","display_name":"Job shop scheduling","level":3,"score":0.2578999996185303},{"id":"https://openalex.org/C2777958785","wikidata":"https://www.wikidata.org/wiki/Q17120940","display_name":"Resource efficiency","level":2,"score":0.2563999891281128}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.compeleceng.2025.110836","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.compeleceng.2025.110836","pdf_url":null,"source":{"id":"https://openalex.org/S121340289","display_name":"Computers & Electrical Engineering","issn_l":"0045-7906","issn":["0045-7906","1879-0755"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers and Electrical Engineering","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.compeleceng.2025.110836","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.compeleceng.2025.110836","pdf_url":null,"source":{"id":"https://openalex.org/S121340289","display_name":"Computers & Electrical Engineering","issn_l":"0045-7906","issn":["0045-7906","1879-0755"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers and Electrical Engineering","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1965370830","https://openalex.org/W2050765519","https://openalex.org/W2092939357","https://openalex.org/W2096145798","https://openalex.org/W2344607369","https://openalex.org/W2761862361","https://openalex.org/W2888704015","https://openalex.org/W2889540440","https://openalex.org/W2899462209","https://openalex.org/W2905026759","https://openalex.org/W2906718952","https://openalex.org/W2944311919","https://openalex.org/W3021517781","https://openalex.org/W3033105525","https://openalex.org/W3166424533","https://openalex.org/W4200467649","https://openalex.org/W4286365441","https://openalex.org/W4309487594","https://openalex.org/W4312326088","https://openalex.org/W4313420669","https://openalex.org/W4384787194","https://openalex.org/W4400033848","https://openalex.org/W4403721394","https://openalex.org/W4404515646"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,28,34,90,110,117,131,138,152,202],"improvement":[2],"of":[3,31,38,80,205],"Intelligent":[4],"Transportation":[5],"Systems":[6],"(ITS),":[7],"Vehicular":[8],"Edge":[9],"Computing":[10],"(VEC),":[11],"which":[12,165],"integrates":[13,251],"roadside":[14],"computing":[15,20],"devices,":[16],"can":[17],"provide":[18],"essential":[19],"and":[21,33,52,83,97,104,121,156,184,208,223,234,245,262],"storage":[22],"resources":[23],"for":[24,45,257],"road":[25],"vehicles.":[26],"However,":[27],"high":[29],"mobility":[30],"vehicles":[32],"limited":[35,209],"processing":[36,211],"capacity":[37],"Roadside":[39],"Units":[40],"(RSUs)":[41],"bring":[42],"significant":[43,179],"challenges":[44],"service":[46,64,194,218,264],"migration,":[47],"particularly":[48],"in":[49,151,181,226],"real-time":[50,63,91,182,217],"decisions":[51,183,220],"resource":[53,133,167,260],"scheduling.":[54],"To":[55],"address":[56],"these":[57],"challenges,":[58],"this":[59],"study":[60,190],"proposes":[61,191],"a":[62],"migration":[65,195,219],"strategy":[66,196],"that":[67],"leverages":[68],"Artificial":[69],"Intelligence":[70],"(AI)":[71],"technologies":[72],"specifically":[73],"Deep":[74],"Reinforcement":[75],"Learning":[76],"(DRL)to":[77],"optimize":[78],"Quality":[79],"Service":[81],"(QoS)":[82],"reduce":[84],"response":[85],"latency.":[86],"Firstly,":[87],"to":[88,129,199,201,238,254],"solve":[89,242],"decision":[92],"problem,":[93],"Prioritized":[94,118,153],"Experience":[95,119,154],"Replay":[96,120,155],"Four-Trajectory":[98,122,157],"Exploration":[99,123,158],"(PERFT),":[100],"recurrent":[101,231],"neural":[102,232],"networks,":[103],"attention":[105,235],"mechanisms":[106],"are":[107],"incorporated":[108],"into":[109,148],"Proximal":[111,124,160],"Policy":[112,125,161],"Optimization":[113,126,162],"(PPO)":[114],"algorithm,":[115,164],"yielding":[116],"(PERFT-PPO).":[127],"Then,":[128],"meet":[130],"multi-agents":[132,259],"scheduling":[134,261],"demands":[135],"under":[136,197,221],"VEC,":[137],"Centralized":[139],"Training":[140],"with":[141,252],"Decentralized":[142],"Execution":[143],"(CTDE)":[144],"framework":[145],"is":[146],"integrated":[147],"PERFT-PPO,":[149],"resulting":[150],"Multi-Agent":[159],"(PERFT-MAPPO)":[163],"coordinates":[166],"allocation":[168],"among":[169],"agents":[170],"while":[171],"enhancing":[172],"global":[173],"long-term":[174],"rewards.":[175],"Experimental":[176],"results":[177],"demonstrate":[178],"improvements":[180],"overall":[185],"system":[186],"performance.":[187],"\u2022":[188,213,229,249],"This":[189],"an":[192],"AI-based":[193],"VEC":[198,206,222,258],"adapt":[200],"dynamic":[203,227],"nature":[204],"environments":[207],"RSU":[210],"capacity.":[212],"Single-agent":[214],"PERFT-PPO":[215,253],"solves":[216],"optimizes":[224],"QoS":[225],"environments.":[228],"PERFT,":[230],"network":[233],"enhance":[236],"PPO":[237],"handle":[239],"sequence":[240],"info,":[241],"sparse":[243],"rewards,":[244],"improve":[246],"long-trajectory":[247],"exploration.":[248],"CTDE":[250],"create":[255],"PERFT-MAPPO":[256],"optimized":[263],"migration.":[265]},"counts_by_year":[],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2025-11-19T00:00:00"}
