{"id":"https://openalex.org/W4405022221","doi":"https://doi.org/10.1109/lra.2024.3511408","title":"Hierarchical Deep Reinforcement Learning for Computation Offloading in Autonomous Multi-Robot Systems","display_name":"Hierarchical Deep Reinforcement Learning for Computation Offloading in Autonomous Multi-Robot Systems","publication_year":2024,"publication_date":"2024-12-04","ids":{"openalex":"https://openalex.org/W4405022221","doi":"https://doi.org/10.1109/lra.2024.3511408"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2024.3511408","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2024.3511408","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100865935","display_name":"Wen Gao","orcid":"https://orcid.org/0009-0002-0139-2627"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wen Gao","raw_affiliation_strings":["School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0009-0002-0139-2627","affiliations":[{"raw_affiliation_string":"School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100701166","display_name":"Zhiwen Yu","orcid":"https://orcid.org/0000-0002-9905-3238"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiwen Yu","raw_affiliation_strings":["School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0000-0002-9905-3238","affiliations":[{"raw_affiliation_string":"School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100456543","display_name":"Liang Wang","orcid":"https://orcid.org/0000-0002-5897-4401"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Wang","raw_affiliation_strings":["School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0000-0002-5897-4401","affiliations":[{"raw_affiliation_string":"School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061725051","display_name":"Helei Cui","orcid":"https://orcid.org/0000-0003-1946-5361"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Helei Cui","raw_affiliation_strings":["School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0000-0003-1946-5361","affiliations":[{"raw_affiliation_string":"School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078005520","display_name":"Bin Guo","orcid":"https://orcid.org/0000-0001-6097-2467"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Guo","raw_affiliation_strings":["School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China"],"raw_orcid":"https://orcid.org/0000-0001-6097-2467","affiliations":[{"raw_affiliation_string":"School of Computer Science, Northwestern Polytechnical University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101862104","display_name":"Hui Xiong","orcid":"https://orcid.org/0000-0001-6016-6465"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]},{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Hui Xiong","raw_affiliation_strings":["Thust of the Artificial Intelligence, The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-6016-6465","affiliations":[{"raw_affiliation_string":"Thust of the Artificial Intelligence, The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":["https://openalex.org/I200769079","https://openalex.org/I889458895"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100865935"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":null,"apc_paid":null,"fwci":0.8116,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.69574038,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":"10","issue":"1","first_page":"540","last_page":"547"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9212999939918518,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9212999939918518,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8084529638290405},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6192977428436279},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5579817295074463},{"id":"https://openalex.org/keywords/autonomous-robot","display_name":"Autonomous robot","score":0.556640625},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5551173090934753},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5271643996238708},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.5104050040245056},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.42159903049468994},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3739722967147827},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3320491313934326}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8084529638290405},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6192977428436279},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5579817295074463},{"id":"https://openalex.org/C2778835581","wikidata":"https://www.wikidata.org/wiki/Q2916098","display_name":"Autonomous robot","level":4,"score":0.556640625},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5551173090934753},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5271643996238708},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.5104050040245056},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.42159903049468994},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3739722967147827},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3320491313934326},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2024.3511408","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2024.3511408","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G425168253","display_name":null,"funder_award_id":"61960206008","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7715781798","display_name":null,"funder_award_id":"62372383","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W2617547828","https://openalex.org/W2736601468","https://openalex.org/W2889987506","https://openalex.org/W2962747795","https://openalex.org/W3095315965","https://openalex.org/W3099689767","https://openalex.org/W3116115872","https://openalex.org/W3133496440","https://openalex.org/W3182045899","https://openalex.org/W4210530701","https://openalex.org/W4283206588","https://openalex.org/W4313291432","https://openalex.org/W4321488123","https://openalex.org/W4328007710","https://openalex.org/W4361804634","https://openalex.org/W4388756484","https://openalex.org/W4389370848","https://openalex.org/W4391467970","https://openalex.org/W4393305235","https://openalex.org/W4396594868","https://openalex.org/W4400770592","https://openalex.org/W6741002519","https://openalex.org/W6753526802"],"related_works":["https://openalex.org/W2122871747","https://openalex.org/W3114279067","https://openalex.org/W2930863966","https://openalex.org/W2126211886","https://openalex.org/W3153786280","https://openalex.org/W3127551068","https://openalex.org/W4220829754","https://openalex.org/W2165180011","https://openalex.org/W3165944253","https://openalex.org/W2351343564"],"abstract_inverted_index":{"To":[0],"ensure":[1],"system":[2,34],"responsiveness,":[3],"some":[4],"compute-intensive":[5],"tasks":[6,82],"are":[7],"usually":[8],"offloaded":[9],"to":[10,20,44,71,122,155],"cloud":[11],"or":[12],"edge":[13],"computing":[14,22,130],"devices.":[15,131],"In":[16,86,112],"environments":[17],"where":[18],"connection":[19],"external":[21],"facilities":[23],"is":[24],"unavailable,":[25],"computation":[26,57],"offloading":[27],"among":[28],"members":[29],"within":[30,83],"an":[31,84,150],"autonomous":[32],"multi-robot":[33],"(AMRS)":[35],"becomes":[36],"a":[37,64],"solution.":[38],"The":[39],"challenge":[40],"lies":[41],"in":[42],"how":[43],"maximize":[45],"the":[46,77,89,93,108,114,124,144],"use":[47],"of":[48,80,95,126,129,142,152],"other":[49],"members'":[50],"idle":[51],"resources":[52],"without":[53],"disrupting":[54],"their":[55],"local":[56],"tasks.":[58],"Therefore,":[59],"this":[60,87],"study":[61],"proposes":[62],"HRL-AMRS,":[63],"hierarchical":[65],"deep":[66],"reinforcement":[67],"learning":[68],"framework":[69,145],"designed":[70],"distribute":[72],"computational":[73,81,104],"loads":[74],"and":[75,140],"reduce":[76],"processing":[78,110,147],"time":[79],"AMRS.":[85],"framework,":[88],"high-level":[90],"must":[91],"consider":[92],"impact":[94],"data":[96],"loading":[97],"scales":[98],"determined":[99],"by":[100,149],"low-level":[101,115],"under":[102],"varying":[103],"device":[105],"states":[106,128],"on":[107],"actual":[109],"times.":[111],"addition,":[113],"employs":[116],"Long":[117],"Short-Term":[118],"Memory":[119],"(LSTM)":[120],"networks":[121],"enhance":[123],"understanding":[125],"time-series":[127],"Experimental":[132],"results":[133],"show":[134],"that,":[135],"across":[136],"various":[137],"task":[138],"sizes":[139],"numbers":[141],"robots,":[143],"reduces":[146],"times":[148],"average":[151],"4.32%":[153],"compared":[154],"baseline":[156],"methods.":[157]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3}],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
