{"id":"https://openalex.org/W7162466499","doi":"https://doi.org/10.48550/arxiv.2605.24006","title":"A Tabular Schedule Abstraction for Communication-Aware Evaluation of Pipeline-Parallel LLM Training","display_name":"A Tabular Schedule Abstraction for Communication-Aware Evaluation of Pipeline-Parallel LLM Training","publication_year":2026,"publication_date":"2026-05-19","ids":{"openalex":"https://openalex.org/W7162466499","doi":"https://doi.org/10.48550/arxiv.2605.24006"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.24006","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.24006","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.24006","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093393016","display_name":"Daniel Barley","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barley, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137058030","display_name":"Jonathan Leis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Leis, Jonathan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049729482","display_name":"Benjamin Klenk","orcid":"https://orcid.org/0000-0001-7657-3049"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Klenk, Benjamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5014251134","display_name":"Holger Fr\u00f6ning","orcid":"https://orcid.org/0000-0001-9562-0680"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fr\u00f6ning, Holger","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.8654000163078308,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.8654000163078308,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.04490000009536743,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.010900000110268593,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/schedule","display_name":"Schedule","score":0.7508000135421753},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6955999732017517},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.6635000109672546},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5407000184059143},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4878999888896942},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4077000021934509},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.40459999442100525}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.835099995136261},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.7508000135421753},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6955999732017517},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.6635000109672546},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5407000184059143},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4878999888896942},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4077000021934509},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.40459999442100525},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.39489999413490295},{"id":"https://openalex.org/C157915830","wikidata":"https://www.wikidata.org/wiki/Q2928001","display_name":"Bubble","level":2,"score":0.39070001244544983},{"id":"https://openalex.org/C53833338","wikidata":"https://www.wikidata.org/wiki/Q1061424","display_name":"Context switch","level":2,"score":0.37630000710487366},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3522000014781952},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.34630000591278076},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3449000120162964},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.3440000116825104},{"id":"https://openalex.org/C110251889","wikidata":"https://www.wikidata.org/wiki/Q1569697","display_name":"Model checking","level":2,"score":0.2939999997615814},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.28060001134872437},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.28049999475479126},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.2791999876499176}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.24006","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.24006","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.24006","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.24006","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Pipeline":[0],"parallelism":[1],"is":[2,25,125,138,180],"a":[3,49,54,120],"key":[4],"technique":[5],"for":[6],"distributed":[7],"training":[8],"of":[9,186],"large":[10],"language":[11],"models":[12,28],"because":[13],"it":[14],"reduces":[15],"per-device":[16],"parameter":[17],"and":[18,42,53,65,77,113,132],"activation":[19],"memory.":[20],"However,":[21],"comparing":[22],"pipeline":[23,177],"schedules":[24],"difficult:":[26],"analytical":[27],"expose":[29],"structural":[30,100],"quantities":[31],"such":[32],"as":[33],"bubble":[34,104],"ratios,":[35],"while":[36,136],"end-to-end":[37],"hardware":[38],"experiments":[39],"are":[40,94,115],"costly":[41],"system-specific.":[43],"In":[44],"this":[45,70],"work,":[46],"we":[47,72],"introduce":[48],"tabular":[50],"schedule":[51,63,92,178],"abstraction":[52],"unified":[55],"multi-abstraction":[56],"methodology":[57],"that":[58,91],"connects":[59],"formula-based":[60],"reasoning,":[61],"idealized":[62],"tables,":[64],"communication-aware":[66],"execution":[67,189],"simulation.":[68],"Using":[69],"framework,":[71],"compare":[73],"GPipe,":[74],"1F1B,":[75],"Chimera,":[76],"Hanayo":[78,137],"in":[79,133,140,173,183],"its":[80,141],"restricted":[81,143],"regime":[82],"across":[83],"multiple":[84],"modeled":[85,188],"system":[86],"configurations.":[87],"Our":[88],"results":[89],"show":[90],"rankings":[93],"not":[95,161],"abstraction-invariant:":[96],"communication":[97],"can":[98],"negate":[99],"advantages":[101],"suggested":[102],"by":[103],"analysis":[105],"alone.":[106],"Under":[107],"the":[108,163,184,187],"assumptions":[109],"considered":[110],"here,":[111],"GPipe":[112],"1F1B":[114,118],"runtime-equivalent,":[116],"but":[117,146,168],"achieves":[119],"lower":[121],"activation-memory":[122],"peak.":[123],"Chimera":[124],"advantageous":[126],"mainly":[127],"at":[128],"low":[129],"microbatch":[130],"counts":[131],"communication-favorable":[134],"regimes,":[135],"effective":[139],"intended":[142],"operating":[144],"point":[145],"remains":[147],"sensitive":[148],"to":[149],"network":[150],"bottlenecks.":[151],"We":[152],"further":[153],"study":[154],"an":[155],"asymmetric":[156],"Chimera-style":[157],"placement,":[158],"which":[159],"does":[160],"reduce":[162],"global":[164],"peak":[165],"memory":[166],"requirement":[167],"reveals":[169],"limited":[170],"runtime":[171],"gains":[172],"shallow":[174],"pipelines.":[175],"Overall,":[176],"quality":[179],"meaningful":[181],"only":[182],"context":[185],"environment.":[190]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-27T00:00:00"}
