{"id":"https://openalex.org/W7160100082","doi":"https://doi.org/10.48550/arxiv.2605.00515","title":"SpaceMoE: Realizing Distributed Mixture-of-Experts Inference over Space Networks","display_name":"SpaceMoE: Realizing Distributed Mixture-of-Experts Inference over Space Networks","publication_year":2026,"publication_date":"2026-05-01","ids":{"openalex":"https://openalex.org/W7160100082","doi":"https://doi.org/10.48550/arxiv.2605.00515"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.00515","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.00515","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.00515","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135099173","display_name":"Zhanwei Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhanwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135141022","display_name":"Huiling Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Huiling","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135275299","display_name":"Min Sheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sheng, Min","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135239868","display_name":"Khaled B. Letaief","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Letaief, Khaled B.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135145742","display_name":"Kaibin Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Kaibin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12042","display_name":"Satellite Communication Systems","score":0.5076000094413757,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12042","display_name":"Satellite Communication Systems","score":0.5076000094413757,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11896","display_name":"Opportunistic and Delay-Tolerant Networks","score":0.2524000108242035,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.05510000139474869,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5097000002861023},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4691999852657318},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.43540000915527344},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.41280001401901245},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.40959998965263367},{"id":"https://openalex.org/keywords/network-architecture","display_name":"Network architecture","score":0.39410001039505005},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.3917999863624573},{"id":"https://openalex.org/keywords/network-topology","display_name":"Network topology","score":0.3880000114440918},{"id":"https://openalex.org/keywords/constellation","display_name":"Constellation","score":0.3846000134944916},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.3785000145435333}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7791000008583069},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.598800003528595},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5097000002861023},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4691999852657318},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.43540000915527344},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.41280001401901245},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.40959998965263367},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.39410001039505005},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.3917999863624573},{"id":"https://openalex.org/C199845137","wikidata":"https://www.wikidata.org/wiki/Q145490","display_name":"Network topology","level":2,"score":0.3880000114440918},{"id":"https://openalex.org/C70352696","wikidata":"https://www.wikidata.org/wiki/Q8928","display_name":"Constellation","level":2,"score":0.3846000134944916},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3785000145435333},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3716999888420105},{"id":"https://openalex.org/C19269812","wikidata":"https://www.wikidata.org/wiki/Q26540","display_name":"Satellite","level":2,"score":0.366100013256073},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3573000133037567},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.35420000553131104},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.3528999984264374},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.3431999981403351},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.3149999976158142},{"id":"https://openalex.org/C77270119","wikidata":"https://www.wikidata.org/wiki/Q1655198","display_name":"Software-defined networking","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C184896649","wikidata":"https://www.wikidata.org/wiki/Q290066","display_name":"Routing table","level":4,"score":0.30169999599456787},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.30140000581741333},{"id":"https://openalex.org/C187107819","wikidata":"https://www.wikidata.org/wiki/Q835696","display_name":"NASA Deep Space Network","level":3,"score":0.3001999855041504},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.299699991941452},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.2921999990940094},{"id":"https://openalex.org/C104060986","wikidata":"https://www.wikidata.org/wiki/Q180046","display_name":"Space exploration","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C190793597","wikidata":"https://www.wikidata.org/wiki/Q189768","display_name":"Application layer","level":3,"score":0.2709999978542328},{"id":"https://openalex.org/C2779784338","wikidata":"https://www.wikidata.org/wiki/Q967145","display_name":"Satellite constellation","level":3,"score":0.26989999413490295},{"id":"https://openalex.org/C192126672","wikidata":"https://www.wikidata.org/wiki/Q1068715","display_name":"Telecommunications network","level":2,"score":0.26899999380111694},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.2635999917984009},{"id":"https://openalex.org/C121308736","wikidata":"https://www.wikidata.org/wiki/Q149918","display_name":"Communications satellite","level":3,"score":0.2517000138759613},{"id":"https://openalex.org/C44010500","wikidata":"https://www.wikidata.org/wiki/Q1422567","display_name":"Source routing","level":5,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.00515","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.00515","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.00515","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.00515","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.8458163738250732,"display_name":"Affordable and clean energy"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Leveraging":[0],"continuous":[1],"solar":[2],"energy":[3],"harvesting":[4],"at":[5,247],"high":[6],"efficiency,":[7],"space":[8,27],"data":[9],"centers":[10],"are":[11,34,129],"envisioned":[12],"as":[13],"a":[14,50,54,70,118,182,220,228,231,240,249],"promising":[15],"platform":[16],"for":[17,200],"executing":[18],"energy-intensive":[19],"large":[20],"language":[21],"models":[22],"(LLMs).":[23],"Recognizing":[24],"this":[25,38,102,191],"advantage,":[26],"and":[28,63,76,89,141,195,257],"AI":[29],"conglomerates":[30],"(e.g.,":[31],"SpaceX,":[32],"Google)":[33],"actively":[35],"investing":[36],"in":[37,53,123],"vision.":[39],"One":[40],"key":[41],"challenge,":[42],"however,":[43],"is":[44],"the":[45,59,84,106,114,154,162,171,175],"efficient":[46],"distributed":[47,115],"deployment":[48],"of":[49,109,117,166],"large-scale":[51],"LLM":[52],"satellite":[55,139,172,229],"network":[56,90],"due":[57],"to":[58,69,80,95,138,150,169,204,227],"limited":[60],"onboard":[61],"computing":[62],"communication":[64,164],"resources.":[65],"This":[66],"gives":[67],"rise":[68],"placement":[71,127,203,259],"problem":[72,199],"that":[73,83,244],"involves":[74],"partitioning":[75],"mapping":[77],"model":[78,87,122],"components":[79],"satellites":[81,151],"such":[82],"fundamentally":[85],"different":[86],"architecture":[88],"topology":[91],"can":[92],"be":[93,225],"reconciled":[94],"ensure":[96],"low-latency":[97],"token":[98],"generation.":[99],"To":[100],"address":[101],"problem,":[103],"we":[104,160,193],"present":[105],"Space":[107],"Network":[108],"Mixture-of-Experts":[110],"(SpaceMoE)":[111],"framework":[112],"targeting":[113],"execution":[116],"popular":[119],"mixture-of-experts":[120],"(MoE)":[121],"space.":[124],"The":[125,213],"proposed":[126],"strategies":[128],"two-level:":[130],"(1)":[131],"layer":[132,158],"placement,":[133,145,159],"which":[134,146],"assigns":[135,147],"MoE":[136,187],"layers":[137],"subnets;":[140],"(2)":[142],"intra-layer":[143,201],"expert":[144,202,223],"individual":[148],"experts":[149,206],"associated":[152],"with":[153,207,234,254],"same":[155],"layer/subnet.":[156],"For":[157],"exploit":[161],"ring-like":[163],"pattern":[165],"autoregressive":[167],"inference":[168],"partition":[170],"constellation":[173,242],"along":[174],"orbiting":[176],"direction":[177],"into":[178],"subnets":[179],"arranged":[180],"on":[181,190,230],"ring,":[183],"each":[184],"hosting":[185],"one":[186],"layer.":[188],"Based":[189],"architecture,":[192],"formulate":[194],"solve":[196],"an":[197,217],"optimization":[198],"map":[205],"heterogeneous":[208],"activation":[209],"probabilities":[210],"onto":[211],"satellites.":[212],"derived":[214],"strategy":[215],"reveals":[216],"intuitive":[218],"principle:":[219],"frequently":[221],"activated":[222],"should":[224],"mapped":[226],"routing":[232],"path":[233],"low":[235],"expected":[236],"latency.":[237],"Experiments":[238],"over":[239],"thousand-satellite":[241],"show":[243],"SpaceMoE":[245],"achieves":[246],"least":[248],"threefold":[250],"latency":[251],"reduction":[252],"compared":[253],"conventional":[255],"random":[256],"ablation-based":[258],"strategies.":[260]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-05T00:00:00"}
