{"id":"https://openalex.org/W7140319919","doi":"https://doi.org/10.48550/arxiv.2603.22691","title":"Rank-Aware Resource Scheduling for Tightly-Coupled MPI Workloads on Kubernetes","display_name":"Rank-Aware Resource Scheduling for Tightly-Coupled MPI Workloads on Kubernetes","publication_year":2026,"publication_date":"2026-03-24","ids":{"openalex":"https://openalex.org/W7140319919","doi":"https://doi.org/10.48550/arxiv.2603.22691"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22691","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22691","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22691","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125299483","display_name":"Tianfang Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xie, Tianfang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5125299483"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.822700023651123,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.822700023651123,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.04699999839067459,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.03229999914765358,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cpu-shielding","display_name":"CPU shielding","score":0.816100001335144},{"id":"https://openalex.org/keywords/central-processing-unit","display_name":"Central processing unit","score":0.57669997215271},{"id":"https://openalex.org/keywords/provisioning","display_name":"Provisioning","score":0.5278000235557556},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5145000219345093},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.4083000123500824},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.3303999900817871},{"id":"https://openalex.org/keywords/pci-express","display_name":"PCI Express","score":0.2980000078678131}],"concepts":[{"id":"https://openalex.org/C180613757","wikidata":"https://www.wikidata.org/wiki/Q5013757","display_name":"CPU shielding","level":3,"score":0.816100001335144},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7976999878883362},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.57669997215271},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5378999710083008},{"id":"https://openalex.org/C172191483","wikidata":"https://www.wikidata.org/wiki/Q1071806","display_name":"Provisioning","level":2,"score":0.5278000235557556},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5145000219345093},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.43309998512268066},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.4083000123500824},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3743000030517578},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.3303999900817871},{"id":"https://openalex.org/C64270927","wikidata":"https://www.wikidata.org/wiki/Q206924","display_name":"PCI Express","level":3,"score":0.2980000078678131},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C19012869","wikidata":"https://www.wikidata.org/wiki/Q578372","display_name":"Response time","level":2,"score":0.27489998936653137},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.27379998564720154},{"id":"https://openalex.org/C107568181","wikidata":"https://www.wikidata.org/wiki/Q5319000","display_name":"Dynamic priority scheduling","level":3,"score":0.26429998874664307},{"id":"https://openalex.org/C2780870223","wikidata":"https://www.wikidata.org/wiki/Q1004415","display_name":"Runtime system","level":2,"score":0.26330000162124634},{"id":"https://openalex.org/C29140674","wikidata":"https://www.wikidata.org/wiki/Q206637","display_name":"Computer cluster","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22691","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22691","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22691","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22691","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.4143337607383728,"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Fully":[0],"provisioned":[1,158],"Message":[2],"Passing":[3],"Interface":[4],"(MPI)":[5],"parallelism":[6],"achieves":[7],"near-optimal":[8],"wall-clock":[9],"time":[10],"for":[11,23,79],"Computational":[12],"Fluid":[13],"Dynamics":[14],"(CFD)":[15],"solvers.":[16],"This":[17],"work":[18],"addresses":[19],"a":[20,57,135],"complementary":[21],"question":[22],"shared,":[24],"cloud-managed":[25],"clusters:":[26],"can":[27],"fine-grained":[28],"CPU":[29,60,81,91,122,133,159],"provisioning":[30],"reduce":[31],"resource":[32,48],"reservation":[33],"of":[34,165],"low-load":[35],"subdomains,":[36],"improving":[37],"cluster":[38],"packing":[39],"efficiency":[40],"without":[41,83],"unacceptably":[42],"degrading":[43],"performance?":[44],"We":[45,69],"propose":[46],"rank-aware":[47],"scheduling":[49,166],"on":[50,114,144,171],"Kubernetes,":[51],"mapping":[52],"each":[53],"MPI":[54,142],"rank":[55],"to":[56,64],"pod":[58,84],"whose":[59],"request":[61],"is":[62,123,149],"proportional":[63,132,147],"its":[65],"subdomain":[66],"cell":[67],"count.":[68],"also":[70],"demonstrate":[71],"In-Place":[72],"Pod":[73],"Vertical":[74],"Scaling":[75],"(Kubernetes":[76],"v1.35":[77],"GA)":[78],"mid-simulation":[80],"adjustment":[82],"restart.":[85],"Three":[86],"findings":[87],"emerge.":[88],"First,":[89],"hard":[90],"limits":[92],"via":[93],"the":[94,127],"Linux":[95],"CFS":[96],"bandwidth":[97],"controller":[98],"cause":[99],"78x":[100],"slowdown":[101],"through":[102],"cascading":[103],"stalls":[104],"at":[105,140],"MPI_Allreduce":[106],"barriers;":[107],"requests-only":[108],"allocation":[109,148,154],"eliminates":[110],"throttling":[111],"entirely.":[112],"Second,":[113],"non-burstable":[115],"c5.xlarge":[116,174],"instances,":[117],"concentric":[118],"decomposition":[119],"with":[120],"equal":[121,153],"19%":[124],"faster":[125,151],"than":[126,152],"Scotch":[128],"baseline,":[129],"while":[130,155],"adding":[131],"yields":[134],"further":[136],"3%":[137],"improvement.":[138],"Third,":[139],"16":[141],"ranks":[143],"101K-cell":[145],"meshes,":[146],"20%":[150],"reducing":[156],"sparse-subdomain":[157],"by":[160],"82%,":[161],"freeing":[162],"6.5":[163],"vCPU":[164],"headroom.":[167],"Experiments":[168],"are":[169,185],"conducted":[170],"AWS":[172],"EC2":[173],"clusters":[175],"(4-16":[176],"ranks)":[177],"running":[178],"k3s":[179],"v1.35.":[180],"All":[181],"scripts":[182],"and":[183],"data":[184],"released":[186],"as":[187],"open":[188],"source.":[189]},"counts_by_year":[],"updated_date":"2026-03-26T06:10:45.909354","created_date":"2026-03-26T00:00:00"}
