{"id":"https://openalex.org/W4415934829","doi":"https://doi.org/10.1109/tc.2025.3628924","title":"HeShare: Energy-Aware and Efficient Multi-Task GPU Sharing in Heterogeneous GPU-Based Computing Systems","display_name":"HeShare: Energy-Aware and Efficient Multi-Task GPU Sharing in Heterogeneous GPU-Based Computing Systems","publication_year":2025,"publication_date":"2025-11-05","ids":{"openalex":"https://openalex.org/W4415934829","doi":"https://doi.org/10.1109/tc.2025.3628924"},"language":null,"primary_location":{"id":"doi:10.1109/tc.2025.3628924","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2025.3628924","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001957036","display_name":"Zhuolong Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhuolong Jiang","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010791300","display_name":"Zinuo Cai","orcid":"https://orcid.org/0000-0001-9373-8474"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zinuo Cai","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001679454","display_name":"Hongyu Zhao","orcid":"https://orcid.org/0000-0003-3213-9923"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongyu Zhao","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002957686","display_name":"Bo Zhang","orcid":"https://orcid.org/0009-0002-8545-1013"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baoheng Zhang","raw_affiliation_strings":["Aerospace System Engineering Shanghai, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Aerospace System Engineering Shanghai, Shanghai, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083523912","display_name":"Tianqi Wu","orcid":"https://orcid.org/0000-0002-1545-3462"},"institutions":[{"id":"https://openalex.org/I4210129465","display_name":"Wuhan Ship Development & Design Institute","ror":"https://ror.org/02mcdae06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210129465"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianqi Wu","raw_affiliation_strings":["China Ship Scientific Research Center, Jiangsu, China","China Ship Scientific Research Center"],"affiliations":[{"raw_affiliation_string":"China Ship Scientific Research Center, Jiangsu, China","institution_ids":["https://openalex.org/I4210129465"]},{"raw_affiliation_string":"China Ship Scientific Research Center","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075358199","display_name":"Yiming Qiang","orcid":"https://orcid.org/0009-0002-7110-7342"},"institutions":[{"id":"https://openalex.org/I4210129465","display_name":"Wuhan Ship Development & Design Institute","ror":"https://ror.org/02mcdae06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210129465"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yiming Qiang","raw_affiliation_strings":["China Ship Scientific Research Center, Jiangsu, China","China Ship Scientific Research Center"],"affiliations":[{"raw_affiliation_string":"China Ship Scientific Research Center, Jiangsu, China","institution_ids":["https://openalex.org/I4210129465"]},{"raw_affiliation_string":"China Ship Scientific Research Center","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101955065","display_name":"Ruichen Ma","orcid":"https://orcid.org/0009-0004-6210-8022"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruhui Ma","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049487451","display_name":"Haibing Guan","orcid":"https://orcid.org/0000-0002-4714-7400"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haibing Guan","raw_affiliation_strings":["School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014716105","display_name":"Rajkumar Buyya","orcid":"https://orcid.org/0000-0001-9754-6496"},"institutions":[{"id":"https://openalex.org/I165779595","display_name":"The University of Melbourne","ror":"https://ror.org/01ej9dk98","country_code":"AU","type":"education","lineage":["https://openalex.org/I165779595"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Rajkumar Buyya","raw_affiliation_strings":["Cloud Computing and Distributed Systems (CLOUDS) Laboratory, School of Computing and Information Systems, The University of Melbourne, Melbourne, VIC, Australia","Cloud Computing and Distributed Systems (CLOUDS) Laboratory, School of Computing and Information Systems, The University of Melbourne, Australia"],"affiliations":[{"raw_affiliation_string":"Cloud Computing and Distributed Systems (CLOUDS) Laboratory, School of Computing and Information Systems, The University of Melbourne, Melbourne, VIC, Australia","institution_ids":["https://openalex.org/I165779595"]},{"raw_affiliation_string":"Cloud Computing and Distributed Systems (CLOUDS) Laboratory, School of Computing and Information Systems, The University of Melbourne, Australia","institution_ids":["https://openalex.org/I165779595"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5001957036"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":9.9426,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.97992978,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"75","issue":"3","first_page":"776","last_page":"787"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.5582000017166138,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.5582000017166138,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.2903999984264374,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.06210000067949295,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/symmetric-multiprocessor-system","display_name":"Symmetric multiprocessor system","score":0.6233999729156494},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6179999709129333},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.6021999716758728},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.5958999991416931},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.43299999833106995},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4147000014781952},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.4074999988079071},{"id":"https://openalex.org/keywords/shared-resource","display_name":"Shared resource","score":0.3801000118255615},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.35280001163482666}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8835999965667725},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.6299999952316284},{"id":"https://openalex.org/C172430144","wikidata":"https://www.wikidata.org/wiki/Q17111997","display_name":"Symmetric multiprocessor system","level":2,"score":0.6233999729156494},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6179999709129333},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.6021999716758728},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.5958999991416931},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.43299999833106995},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.41499999165534973},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4147000014781952},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.4074999988079071},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.3801000118255615},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.35280001163482666},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.33730000257492065},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.33410000801086426},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.33340001106262207},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3330000042915344},{"id":"https://openalex.org/C2984118289","wikidata":"https://www.wikidata.org/wiki/Q29954","display_name":"Power consumption","level":3,"score":0.31349998712539673},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.2856000065803528},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.2822999954223633},{"id":"https://openalex.org/C55416958","wikidata":"https://www.wikidata.org/wiki/Q6206757","display_name":"Job shop scheduling","level":3,"score":0.28029999136924744},{"id":"https://openalex.org/C38725249","wikidata":"https://www.wikidata.org/wiki/Q913876","display_name":"Time-sharing","level":2,"score":0.27489998936653137},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.2689000070095062},{"id":"https://openalex.org/C2984822820","wikidata":"https://www.wikidata.org/wiki/Q1123036","display_name":"Processor scheduling","level":3,"score":0.26269999146461487},{"id":"https://openalex.org/C111873713","wikidata":"https://www.wikidata.org/wiki/Q1641413","display_name":"Job scheduler","level":3,"score":0.258899986743927},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.2574000060558319},{"id":"https://openalex.org/C107568181","wikidata":"https://www.wikidata.org/wiki/Q5319000","display_name":"Dynamic priority scheduling","level":3,"score":0.2522999942302704}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tc.2025.3628924","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2025.3628924","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W2050127041","https://openalex.org/W2194775991","https://openalex.org/W2563621803","https://openalex.org/W2751165078","https://openalex.org/W2919897868","https://openalex.org/W2963163009","https://openalex.org/W2963446712","https://openalex.org/W2982479996","https://openalex.org/W3016928194","https://openalex.org/W3022298203","https://openalex.org/W3034966030","https://openalex.org/W3115175310","https://openalex.org/W3216416559","https://openalex.org/W4206943884","https://openalex.org/W4304192541","https://openalex.org/W4385245566","https://openalex.org/W4386038523","https://openalex.org/W4387934926","https://openalex.org/W4388116548","https://openalex.org/W4390075082","https://openalex.org/W4401386998","https://openalex.org/W4403842265","https://openalex.org/W4404133812","https://openalex.org/W4407197043","https://openalex.org/W4411800438"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,11,53,76,179],"rapid":[2],"growth":[3],"of":[4,78],"artificial":[5],"intelligence":[6],"and":[7,24,36,58,72,84,102,117,146,160,173,189,202],"large-scale":[8,22],"model":[9],"computing,":[10],"demand":[12],"for":[13,21,81,122,163],"GPUs":[14,32,90,138],"in":[15,55,93],"datacenters":[16],"continues":[17],"to":[18,46,52,68,99,139,178],"increase,":[19],"especially":[20],"training":[23],"inference":[25],"tasks.":[26],"Heterogeneous":[27],"multi-GPU":[28],"systems,":[29],"which":[30],"integrate":[31],"with":[33],"varying":[34],"types":[35],"computational":[37],"capabilities,":[38],"have":[39],"become":[40],"critical":[41],"computing":[42],"resources.":[43],"This":[44],"leads":[45],"two":[47],"main":[48],"challenges.":[49],"First,":[50,124],"due":[51],"differences":[54],"GPU":[56,94,120,152],"performance":[57],"power":[59],"consumption,":[60,172],"task":[61,129,134,175],"scheduling":[62,130],"involves":[63],"a":[64,141,151,197],"complex":[65],"multi-objective":[66],"optimization":[67,154],"balance":[69,142,198],"energy":[70,144,171,185,200],"efficiency":[71,201],"performance.":[73,147,176,203],"More":[74],"importantly,":[75],"lack":[77],"coordinated":[79],"mechanisms":[80],"multi-task":[82],"sharing":[83,153],"energy-efficient":[85],"resource":[86,167],"management":[87],"across":[88,136],"heterogeneous":[89,119],"can":[91],"result":[92],"overload":[95],"or":[96],"underutilization,":[97],"leading":[98],"wasted":[100],"resources":[101],"potential":[103],"system":[104],"risks.":[105],"<p":[106],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[107],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">To":[108],"address":[109],"these":[110],"challenges,":[111],"we":[112,125,149,182],"propose":[113],"HESHARE,":[114],"an":[115,127],"energy-aware":[116,128],"efficient":[118],"framework":[121],"datacenters.":[123],"design":[126],"strategy":[131],"that":[132,156],"optimizes":[133],"allocation":[135],"different":[137],"achieve":[140],"between":[143,199],"consumption":[145],"Second,":[148],"introduce":[150],"mechanism":[155],"adaptively":[157],"configures":[158],"MPS":[159],"DVFS":[161],"settings":[162],"each":[164],"GPU,":[165],"enhancing":[166],"utilization,":[168],"reducing":[169],"overall":[170],"ensuring":[174],"Compared":[177],"state-of-the-art":[180],"framework,":[181],"reduce":[183],"average":[184],"costs":[186],"by":[187,194],"26%":[188],"improve":[190],"job":[191],"completion":[192],"time":[193],"31%,":[195],"achieving":[196]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-26T15:22:09.906841","created_date":"2025-11-05T00:00:00"}
