{"id":"https://openalex.org/W7148446660","doi":"https://doi.org/10.48550/arxiv.2604.00368","title":"TENT: A Declarative Slice Spraying Engine for Performant and Resilient Data Movement in Disaggregated LLM Serving","display_name":"TENT: A Declarative Slice Spraying Engine for Performant and Resilient Data Movement in Disaggregated LLM Serving","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148446660","doi":"https://doi.org/10.48550/arxiv.2604.00368"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.00368","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00368","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.00368","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132796231","display_name":"Feng Ren","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ren, Feng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132782270","display_name":"Ruoyu Qin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qin, Ruoyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132801236","display_name":"Teng Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Teng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036856464","display_name":"Shangming Cai","orcid":"https://orcid.org/0000-0002-0902-7774"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Shangming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132791092","display_name":"Zheng Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132780365","display_name":"Chao Lei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei, Chao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027029641","display_name":"Dejiang Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Dejiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132809447","display_name":"Ke Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Ke","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132734942","display_name":"Zheming Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zheming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132765757","display_name":"Jialei Cui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Jialei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132765515","display_name":"Weixiao Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Weixiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132824537","display_name":"Yikai Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Yikai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132783441","display_name":"Yineng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yineng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132789506","display_name":"Hao Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132822769","display_name":"Xiang Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Xiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033814924","display_name":"Yuhao Fu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Yuhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132820736","display_name":"Jinlei Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Jinlei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132802570","display_name":"Yongwei Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yongwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132821939","display_name":"Mingxing Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Mingxing","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":19,"corresponding_author_ids":["https://openalex.org/A5132796231"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.4848000109195709,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.4848000109195709,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.26260000467300415,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.035999998450279236,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stream-control-transmission-protocol","display_name":"Stream Control Transmission Protocol","score":0.5946999788284302},{"id":"https://openalex.org/keywords/remote-direct-memory-access","display_name":"Remote direct memory access","score":0.4733000099658966},{"id":"https://openalex.org/keywords/liveness","display_name":"Liveness","score":0.4490000009536743},{"id":"https://openalex.org/keywords/marshalling","display_name":"Marshalling","score":0.4198000133037567},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.4092999994754791},{"id":"https://openalex.org/keywords/ranging","display_name":"Ranging","score":0.33629998564720154},{"id":"https://openalex.org/keywords/forwarding-plane","display_name":"Forwarding plane","score":0.3325999975204468},{"id":"https://openalex.org/keywords/blocking","display_name":"Blocking (statistics)","score":0.3264000117778778},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.31779998540878296}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8116999864578247},{"id":"https://openalex.org/C90377713","wikidata":"https://www.wikidata.org/wiki/Q576997","display_name":"Stream Control Transmission Protocol","level":3,"score":0.5946999788284302},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.516700029373169},{"id":"https://openalex.org/C130795937","wikidata":"https://www.wikidata.org/wiki/Q2561570","display_name":"Remote direct memory access","level":2,"score":0.4733000099658966},{"id":"https://openalex.org/C15569618","wikidata":"https://www.wikidata.org/wiki/Q3561421","display_name":"Liveness","level":2,"score":0.4490000009536743},{"id":"https://openalex.org/C206019424","wikidata":"https://www.wikidata.org/wiki/Q373671","display_name":"Marshalling","level":2,"score":0.4198000133037567},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.4092999994754791},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.36559998989105225},{"id":"https://openalex.org/C115051666","wikidata":"https://www.wikidata.org/wiki/Q6522493","display_name":"Ranging","level":2,"score":0.33629998564720154},{"id":"https://openalex.org/C10597312","wikidata":"https://www.wikidata.org/wiki/Q5473302","display_name":"Forwarding plane","level":3,"score":0.3325999975204468},{"id":"https://openalex.org/C144745244","wikidata":"https://www.wikidata.org/wiki/Q4927286","display_name":"Blocking (statistics)","level":2,"score":0.3264000117778778},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.31779998540878296},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.3176000118255615},{"id":"https://openalex.org/C183469790","wikidata":"https://www.wikidata.org/wiki/Q333501","display_name":"Crash","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C22684755","wikidata":"https://www.wikidata.org/wiki/Q847526","display_name":"Queueing theory","level":2,"score":0.2992999851703644},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.29840001463890076},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.2822999954223633},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.2806999981403351},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.27709999680519104},{"id":"https://openalex.org/C2779013668","wikidata":"https://www.wikidata.org/wiki/Q826798","display_name":"NonStop","level":2,"score":0.2768999934196472},{"id":"https://openalex.org/C150202949","wikidata":"https://www.wikidata.org/wiki/Q107602","display_name":"Pointer (user interface)","level":2,"score":0.2754000127315521},{"id":"https://openalex.org/C65813073","wikidata":"https://www.wikidata.org/wiki/Q1622420","display_name":"High availability","level":2,"score":0.27320000529289246},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.2718000113964081},{"id":"https://openalex.org/C553261973","wikidata":"https://www.wikidata.org/wiki/Q14579","display_name":"Linux kernel","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.26499998569488525},{"id":"https://openalex.org/C20574231","wikidata":"https://www.wikidata.org/wiki/Q844605","display_name":"Backward compatibility","level":2,"score":0.2535000145435333},{"id":"https://openalex.org/C31395832","wikidata":"https://www.wikidata.org/wiki/Q1318674","display_name":"Testbed","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.00368","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00368","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.00368","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00368","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.410592645406723,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modern":[0],"GPU":[1],"clusters":[2,189],"are":[3],"built":[4],"upon":[5],"a":[6,32,47,96,118],"complex":[7],"hierarchy":[8],"of":[9,44,107],"heterogeneous":[10,115],"interconnects,":[11],"ranging":[12],"from":[13,103],"multi-rail":[14,76],"RDMA":[15],"to":[16,63,79,84,110,211],"proprietary":[17],"fabrics":[18],"such":[19],"as":[20,169],"Multi-Node":[21],"NVLink":[22],"and":[23,82,137,153,177,200,215],"Ascend":[24],"UB.":[25],"Orchestrating":[26],"these":[27],"diverse":[28],"links":[29,141],"effectively":[30],"remains":[31],"critical":[33,48],"challenge":[34],"in":[35,230],"disaggregated":[36],"LLM":[37,175,203],"serving.":[38],"Operating":[39],"Mooncake":[40,197,221],"TE":[41],"on":[42,65,143,186],"thousands":[43],"GPUs":[45],"exposed":[46],"limitation":[49],"shared":[50],"by":[51,159,234],"existing":[52],"frameworks:":[53],"imperative,":[54],"statically":[55],"bound":[56],"path":[57],"selection.":[58],"This":[59,147],"rigidity":[60],"forces":[61],"engines":[62],"rely":[64],"state-blind":[66],"striping":[67],"that":[68,99,191],"ignores":[69],"congestion":[70],"signals,":[71],"creating":[72],"communication":[73],"silos,":[74],"wasting":[75],"bandwidth":[77],"due":[78],"head-of-line":[80,151],"blocking,":[81],"leading":[83],"operational":[85],"fragility":[86],"where":[87],"routine":[88],"faults":[89],"require":[90],"manual":[91],"intervention.":[92],"We":[93],"present":[94],"TENT,":[95],"data-movement":[97],"engine":[98],"decouples":[100],"transfer":[101,126],"intent":[102],"physical":[104],"execution.":[105],"Instead":[106],"locking":[108],"workloads":[109],"fixed":[111],"backends,":[112],"TENT":[113,129,167,192,208,226],"unifies":[114],"interconnects":[116],"into":[117,134],"single":[119],"dynamic":[120],"resource":[121],"pool.":[122],"Applications":[123],"simply":[124],"declare":[125],"intents,":[127],"while":[128],"dynamically":[130],"decomposes":[131],"elephant":[132],"flows":[133],"fine-grained":[135],"slices":[136,161],"\"sprays\"":[138],"them":[139],"across":[140],"based":[142],"instantaneous":[144],"link":[145],"quality.":[146],"telemetry-driven":[148],"orchestration":[149],"eliminates":[150],"blocking":[152],"enables":[154],"transparent,":[155],"sub-50":[156],"ms":[157],"self-healing":[158],"rerouting":[160],"around":[162],"failures":[163],"without":[164],"application":[165],"logic.":[166],"serves":[168],"the":[170],"production":[171],"data":[172],"plane":[173],"for":[174],"inference":[176,204],"RL":[178,224],"pipelines":[179],"at":[180],"multiple":[181],"industrial":[182],"sites.":[183],"Our":[184],"evaluation":[185],"H800":[187],"HGX":[188],"shows":[190],"outperforms":[193],"state-of-the-art":[194],"baselines,":[195],"including":[196],"TE,":[198],"NIXL,":[199],"UCCL.":[201],"In":[202,223],"with":[205],"SGLang":[206],"HiCache,":[207],"achieves":[209],"up":[210],"1.36x":[212],"higher":[213],"throughput":[214],"26%":[216],"lower":[217],"P90":[218],"TTFT":[219],"than":[220],"TE.":[222],"pipelines,":[225],"accelerates":[227],"parameter":[228],"updates":[229],"Moonshot":[231],"Checkpoint":[232],"Engine":[233],"20-26%.":[235]},"counts_by_year":[],"updated_date":"2026-04-03T16:44:17.987007","created_date":"2026-04-03T00:00:00"}
