{"id":"https://openalex.org/W3112262420","doi":"https://doi.org/10.1109/tpds.2020.3042599","title":"Distributed and Collective Deep Reinforcement Learning for Computation Offloading: A Practical Perspective","display_name":"Distributed and Collective Deep Reinforcement Learning for Computation Offloading: A Practical Perspective","publication_year":2020,"publication_date":"2020-12-10","ids":{"openalex":"https://openalex.org/W3112262420","doi":"https://doi.org/10.1109/tpds.2020.3042599","mag":"3112262420"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2020.3042599","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.3042599","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052666042","display_name":"Xiaoyu Qiu","orcid":"https://orcid.org/0000-0002-9322-9060"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaoyu Qiu","raw_affiliation_strings":["School of Data and Computer Science, National Engineering Research Center of Digital Life, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Data and Computer Science, National Engineering Research Center of Digital Life, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102828807","display_name":"Weikun Zhang","orcid":"https://orcid.org/0000-0001-5211-4235"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weikun Zhang","raw_affiliation_strings":["School of Data and Computer Science, National Engineering Research Center of Digital Life, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Data and Computer Science, National Engineering Research Center of Digital Life, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066482792","display_name":"Wuhui Chen","orcid":"https://orcid.org/0000-0003-4430-7904"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wuhui Chen","raw_affiliation_strings":["School of Data and Computer Science, National Engineering Research Center of Digital Life, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Data and Computer Science, National Engineering Research Center of Digital Life, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000582109","display_name":"Zibin Zheng","orcid":"https://orcid.org/0000-0002-7878-4330"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zibin Zheng","raw_affiliation_strings":["School of Data and Computer Science, National Engineering Research Center of Digital Life, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Data and Computer Science, National Engineering Research Center of Digital Life, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5052666042"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":null,"apc_paid":null,"fwci":11.3322,"has_fulltext":false,"cited_by_count":110,"citation_normalized_percentile":{"value":0.98709316,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"32","issue":"5","first_page":"1085","last_page":"1101"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8495974540710449},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8264145851135254},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.6199659705162048},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.5309588313102722},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.5303830504417419},{"id":"https://openalex.org/keywords/mobile-edge-computing","display_name":"Mobile edge computing","score":0.4841614365577698},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4781801998615265},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.4516987204551697},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.43964889645576477},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.4307772219181061},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.41847431659698486},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36106574535369873},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.19266539812088013}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8495974540710449},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8264145851135254},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.6199659705162048},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.5309588313102722},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5303830504417419},{"id":"https://openalex.org/C2776061582","wikidata":"https://www.wikidata.org/wiki/Q25325231","display_name":"Mobile edge computing","level":3,"score":0.4841614365577698},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4781801998615265},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.4516987204551697},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.43964889645576477},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.4307772219181061},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.41847431659698486},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36106574535369873},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.19266539812088013},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2020.3042599","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.3042599","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1596881006","display_name":null,"funder_award_id":"2019QN01X130","funder_id":"https://openalex.org/F4320334009","funder_display_name":"Guangdong Provincial Pearl River Talents Program"},{"id":"https://openalex.org/G3320589821","display_name":null,"funder_award_id":"2018A030313005","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G5917389280","display_name":null,"funder_award_id":"61802450","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8199004219","display_name":null,"funder_award_id":"61722214","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null},{"id":"https://openalex.org/F4320334009","display_name":"Guangdong Provincial Pearl River Talents Program","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":61,"referenced_works":["https://openalex.org/W1575592356","https://openalex.org/W1763200058","https://openalex.org/W1890963104","https://openalex.org/W2069211379","https://openalex.org/W2145339207","https://openalex.org/W2156737235","https://openalex.org/W2171830216","https://openalex.org/W2173248099","https://openalex.org/W2195423816","https://openalex.org/W2336650964","https://openalex.org/W2541884796","https://openalex.org/W2593044849","https://openalex.org/W2596367596","https://openalex.org/W2624989916","https://openalex.org/W2732646932","https://openalex.org/W2736601468","https://openalex.org/W2770968405","https://openalex.org/W2775965637","https://openalex.org/W2786036274","https://openalex.org/W2790435736","https://openalex.org/W2793925626","https://openalex.org/W2798705390","https://openalex.org/W2885631546","https://openalex.org/W2888764732","https://openalex.org/W2889954388","https://openalex.org/W2890075093","https://openalex.org/W2903362341","https://openalex.org/W2910439483","https://openalex.org/W2911573951","https://openalex.org/W2913429011","https://openalex.org/W2918400102","https://openalex.org/W2942608247","https://openalex.org/W2949226003","https://openalex.org/W2951507724","https://openalex.org/W2954039338","https://openalex.org/W2955097190","https://openalex.org/W2962788286","https://openalex.org/W2963334314","https://openalex.org/W2963864421","https://openalex.org/W2963918968","https://openalex.org/W2964043796","https://openalex.org/W2964259004","https://openalex.org/W2964583557","https://openalex.org/W2982316857","https://openalex.org/W2982530739","https://openalex.org/W4231918628","https://openalex.org/W4288363736","https://openalex.org/W4297797010","https://openalex.org/W4318619660","https://openalex.org/W6634413486","https://openalex.org/W6639647829","https://openalex.org/W6683195989","https://openalex.org/W6684921986","https://openalex.org/W6692846177","https://openalex.org/W6703420464","https://openalex.org/W6728757088","https://openalex.org/W6734206676","https://openalex.org/W6735641298","https://openalex.org/W6741002519","https://openalex.org/W6748638692","https://openalex.org/W6756887525"],"related_works":["https://openalex.org/W2092530219","https://openalex.org/W2388464034","https://openalex.org/W2533125852","https://openalex.org/W2140460949","https://openalex.org/W2105580438","https://openalex.org/W2057435755","https://openalex.org/W4306904969","https://openalex.org/W3121798572","https://openalex.org/W3139051647","https://openalex.org/W2902693277"],"abstract_inverted_index":{"Mobile":[0],"edge":[1,17],"computing":[2],"(MEC)":[3],"is":[4,77,98],"a":[5,66,81,124,132,144],"promising":[6],"solution":[7],"to":[8,15,39,69,206],"support":[9],"resource-constrained":[10],"devices":[11],"by":[12,101,105,192,241],"offloading":[13,30,121],"tasks":[14],"the":[16,34,43,60,113,118,169,188,198,208,215,222,230,232],"servers.":[18],"However,":[19],"traditional":[20],"approaches":[21],"(e.g.,":[22],"linear":[23],"programming":[24],"and":[25,91,94,134,146,164,195,203,213,235,245],"game-theory":[26],"methods)":[27],"for":[28],"computation":[29,120],"mainly":[31],"focus":[32,57],"on":[33,58,117],"immediate":[35],"performance,":[36],"potentially":[37],"leading":[38],"performance":[40],"degradation":[41],"in":[42,74],"long":[44],"run.":[45],"Recent":[46],"breakthroughs":[47],"regarding":[48],"deep":[49,201],"reinforcement":[50],"learning":[51],"(DRL)":[52],"provide":[53],"alternative":[54],"methods,":[55],"which":[56,157,180],"maximizing":[59],"cumulative":[61],"reward.":[62],"Nonetheless,":[63],"there":[64],"exists":[65],"large":[67,89],"gap":[68],"deploy":[70],"real":[71],"DRL":[72,83,96,116,136],"applications":[73,114],"MEC.":[75],"This":[76],"because:":[78],"1)":[79,143],"training":[80,97,148,183],"well-performed":[82],"agent":[84],"typically":[85],"requires":[86],"data":[87,162],"with":[88,140,229],"quantities":[90],"high":[92,189],"diversity,":[93],"2)":[95,172],"usually":[99],"accompanied":[100],"huge":[102],"costs":[103,234,238],"caused":[104,191],"trial-and-error.":[106],"To":[107],"address":[108],"this":[109],"mismatch,":[110],"we":[111,130],"study":[112],"of":[115,200,210,224],"multi-user":[119],"problem":[122],"from":[123,153,187],"more":[125],"practical":[126],"perspective.":[127],"In":[128],"particular,":[129],"propose":[131],"distributed":[133,145,193],"collective":[135,147],"algorithm":[137],"called":[138,176],"DC-DRL":[139],"several":[141],"improvements:":[142],"scheme":[149],"that":[150],"assimilates":[151],"knowledge":[152],"multiple":[154,211],"MEC":[155],"environments,":[156],"not":[158],"only":[159],"greatly":[160],"increases":[161],"amount":[163],"diversity":[165],"but":[166],"also":[167],"spreads":[168],"exploration":[170,233],"costs,":[171],"an":[173],"updating":[174],"method":[175],"adaptive":[177],"n-step":[178],"learning,":[179],"can":[181],"improve":[182],"efficiency":[184],"without":[185],"suffering":[186],"variance":[190],"training,":[194],"3)":[196],"combining":[197],"advantages":[199],"neuroevolution":[202],"policy":[204],"gradient":[205],"maximize":[207],"utilization":[209],"environments":[212],"prevent":[214],"premature":[216],"convergence.":[217],"Lastly,":[218],"evaluation":[219],"results":[220],"demonstrate":[221],"effectiveness":[223],"our":[225],"proposed":[226],"algorithm.":[227],"Compared":[228],"baselines,":[231],"final":[236],"system":[237],"are":[239],"reduced":[240],"at":[242],"least":[243],"43":[244],"9.4":[246],"percent,":[247],"respectively.":[248]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":20},{"year":2023,"cited_by_count":30},{"year":2022,"cited_by_count":27},{"year":2021,"cited_by_count":13}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
