{"id":"https://openalex.org/W7133506911","doi":"https://doi.org/10.48550/arxiv.2603.02885","title":"MuxTune: Efficient Multi-Task LLM Fine-Tuning in Multi-Tenant Datacenters via Spatial-Temporal Backbone Multiplexing","display_name":"MuxTune: Efficient Multi-Task LLM Fine-Tuning in Multi-Tenant Datacenters via Spatial-Temporal Backbone Multiplexing","publication_year":2026,"publication_date":"2026-03-03","ids":{"openalex":"https://openalex.org/W7133506911","doi":"https://doi.org/10.48550/arxiv.2603.02885"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.02885","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02885","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.02885","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128074366","display_name":"Chunyu Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xue, Chunyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128106701","display_name":"Yi Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Yi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128127037","display_name":"Weihao Cui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Weihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128103150","display_name":"Quan Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Quan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012349805","display_name":"Shulai Zhang","orcid":"https://orcid.org/0000-0002-0802-7203"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shulai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128075543","display_name":"Bingsheng He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Bingsheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128082937","display_name":"Minyi Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Minyi","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5128074366"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.6266999840736389,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.6266999840736389,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.1062999963760376,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.05739999935030937,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.4943999946117401},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4878999888896942},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.48660001158714294},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.46149998903274536},{"id":"https://openalex.org/keywords/multiplexing","display_name":"Multiplexing","score":0.41749998927116394},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.40149998664855957},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.38679999113082886},{"id":"https://openalex.org/keywords/service","display_name":"Service (business)","score":0.3596999943256378},{"id":"https://openalex.org/keywords/personalization","display_name":"Personalization","score":0.35280001163482666},{"id":"https://openalex.org/keywords/shared-resource","display_name":"Shared resource","score":0.35199999809265137}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8299000263214111},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5907999873161316},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.5127999782562256},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.4943999946117401},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4878999888896942},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.48660001158714294},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.46149998903274536},{"id":"https://openalex.org/C19275194","wikidata":"https://www.wikidata.org/wiki/Q222903","display_name":"Multiplexing","level":2,"score":0.41749998927116394},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.40149998664855957},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.38679999113082886},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3709000051021576},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.3596999943256378},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.35280001163482666},{"id":"https://openalex.org/C51332947","wikidata":"https://www.wikidata.org/wiki/Q1172305","display_name":"Shared resource","level":2,"score":0.35199999809265137},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3434000015258789},{"id":"https://openalex.org/C17020691","wikidata":"https://www.wikidata.org/wiki/Q139677","display_name":"Operator (biology)","level":5,"score":0.3391999900341034},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.33230000734329224},{"id":"https://openalex.org/C2779965156","wikidata":"https://www.wikidata.org/wiki/Q5227350","display_name":"Data sharing","level":3,"score":0.3260999917984009},{"id":"https://openalex.org/C88796919","wikidata":"https://www.wikidata.org/wiki/Q1142907","display_name":"Backbone network","level":2,"score":0.32350000739097595},{"id":"https://openalex.org/C557945733","wikidata":"https://www.wikidata.org/wiki/Q389772","display_name":"Data transmission","level":2,"score":0.322299987077713},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.3172999918460846},{"id":"https://openalex.org/C2775941552","wikidata":"https://www.wikidata.org/wiki/Q25212305","display_name":"Isolation (microbiology)","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.29760000109672546},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2939999997615814},{"id":"https://openalex.org/C50661577","wikidata":"https://www.wikidata.org/wiki/Q901831","display_name":"Time-division multiplexing","level":3,"score":0.29330000281333923},{"id":"https://openalex.org/C193702766","wikidata":"https://www.wikidata.org/wiki/Q1414548","display_name":"Concurrency","level":2,"score":0.2800000011920929},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.27810001373291016},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.27070000767707825},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.26919999718666077},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.26179999113082886},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.25999999046325684},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C72414096","wikidata":"https://www.wikidata.org/wiki/Q1367461","display_name":"Mass customization","level":3,"score":0.2556999921798706},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.2554999887943268},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.2540999948978424},{"id":"https://openalex.org/C116537","wikidata":"https://www.wikidata.org/wiki/Q2169973","display_name":"Service provider","level":3,"score":0.2508000135421753},{"id":"https://openalex.org/C61455927","wikidata":"https://www.wikidata.org/wiki/Q1030529","display_name":"Blossom algorithm","level":3,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.02885","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02885","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.02885","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02885","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Parameter-Efficient":[0],"Fine-Tuning":[1],"(PEFT)":[2],"is":[3,79],"widely":[4],"applied":[5],"as":[6],"the":[7,82],"backend":[8],"of":[9,72,125],"fine-tuning":[10,65],"APIs":[11],"for":[12,25,91],"large":[13],"language":[14],"model":[15],"(LLM)":[16],"customization":[17],"in":[18,53,87,135],"datacenters.":[19],"Service":[20],"providers":[21],"deploy":[22],"separate":[23],"instances":[24],"individual":[26],"PEFT":[27,74,105],"tasks,":[28],"giving":[29],"rise":[30],"to":[31,80,145,157,166],"prominent":[32],"resource":[33],"inefficiencies,":[34],"including":[35],"(1)":[36],"GPU":[37],"underutilization":[38],"from":[39,47],"small-scale,":[40],"PEFT-native":[41],"operators":[42],"and":[43,50,94,115,127,130,161],"(2)":[44],"device":[45],"stalls":[46],"communication":[48],"delays":[49],"data":[51,143],"dependencies":[52],"parallelized":[54],"execution.":[55],"To":[56],"address":[57],"these":[58],"issues,":[59],"this":[60],"paper":[61],"presents":[62],"MuxTune,":[63],"a":[64,88,123],"system":[66],"that":[67,153],"enables":[68],"resource-efficient":[69],"concurrent":[70],"execution":[71,134],"multiple":[73],"tasks.":[75],"The":[76],"key":[77],"idea":[78],"multiplex":[81],"backbone":[83,101],"across":[84],"independent":[85],"tasks":[86,121],"spatial-temporal":[89],"manner":[90],"improved":[92],"utilization":[93],"reduced":[95],"stalls.":[96],"Building":[97],"on":[98],"flexible,":[99],"modularized":[100],"sharing":[102],"via":[103],"unified":[104],"representations,":[106],"MuxTune":[107,140,154],"proposes":[108],"hierarchical":[109],"co-scheduling":[110],"scheme":[111],"with":[112],"task,":[113],"operator,":[114],"data-level":[116],"optimizations.":[117],"Specifically,":[118],"it":[119],"fuses":[120],"through":[122],"hybrid":[124,137],"spatial":[126],"temporal":[128],"multiplexing,":[129],"orchestrates":[131],"multi-task":[132],"operator":[133],"two-tiered":[136],"parallelism.":[138],"Additionally,":[139],"employs":[141],"chunk-based":[142],"alignment":[144],"mitigate":[146],"inter-task":[147],"ineffective":[148],"tokens.":[149],"Experimental":[150],"results":[151],"demonstrate":[152],"achieves":[155],"up":[156],"$2.33\\times$":[158],"higher":[159],"throughput":[160],"$5.29\\times$":[162],"memory":[163],"reduction":[164],"compared":[165],"three":[167],"state-of-the-art":[168],"baselines.":[169]},"counts_by_year":[],"updated_date":"2026-03-05T07:36:02.291473","created_date":"2026-03-05T00:00:00"}
