{"id":"https://openalex.org/W4406755573","doi":"https://doi.org/10.48550/arxiv.2501.12407","title":"The Streaming Batch Model for Efficient and Fault-Tolerant Heterogeneous Execution","display_name":"The Streaming Batch Model for Efficient and Fault-Tolerant Heterogeneous Execution","publication_year":2025,"publication_date":"2025-01-16","ids":{"openalex":"https://openalex.org/W4406755573","doi":"https://doi.org/10.48550/arxiv.2501.12407"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2501.12407","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.12407","pdf_url":"https://arxiv.org/pdf/2501.12407","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2501.12407","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075193455","display_name":"Frank Sifei Luan","orcid":"https://orcid.org/0000-0001-8709-6823"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Luan, Frank Sifei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011833703","display_name":"Ziming Mao","orcid":"https://orcid.org/0009-0006-5985-0968"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Ron Yifeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111045826","display_name":"R. Wang","orcid":"https://orcid.org/0009-0008-3671-4028"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Yile","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089635779","display_name":"Chi\u2010Wei Lin","orcid":"https://orcid.org/0000-0002-5178-5448"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mao, Ziming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018727500","display_name":"Amog Kamsetty","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Charlotte","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100353673","display_name":"Hao Chen","orcid":"https://orcid.org/0009-0001-6480-7976"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kamsetty, Amog","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048194625","display_name":"Cheng Su","orcid":"https://orcid.org/0009-0003-3281-7904"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116004356","display_name":"Balaji Veeramani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Cheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026638199","display_name":"Scott Lee","orcid":"https://orcid.org/0000-0003-4584-6758"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Veeramani, Balaji","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036448834","display_name":"SangBin Cho","orcid":"https://orcid.org/0009-0006-8695-5941"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Scott","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116004355","display_name":"Clark Zinzow","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cho, SangBin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064891668","display_name":"Eric Liang","orcid":"https://orcid.org/0000-0002-3760-6845"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zinzow, Clark","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041920173","display_name":"Ion Stoica","orcid":"https://orcid.org/0000-0002-5373-0088"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Eric","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076479697","display_name":"Stephanie Wang","orcid":"https://orcid.org/0000-0001-5960-5491"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stoica, Ion","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Wang, Stephanie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Stephanie","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":15,"corresponding_author_ids":["https://openalex.org/A5075193455"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9789000153541565,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6866472959518433},{"id":"https://openalex.org/keywords/fault-tolerance","display_name":"Fault tolerance","score":0.5429667234420776},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.49184107780456543},{"id":"https://openalex.org/keywords/streaming-data","display_name":"Streaming data","score":0.4559434652328491},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4076882600784302},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.10258761048316956}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6866472959518433},{"id":"https://openalex.org/C63540848","wikidata":"https://www.wikidata.org/wiki/Q3140932","display_name":"Fault tolerance","level":2,"score":0.5429667234420776},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.49184107780456543},{"id":"https://openalex.org/C2777611316","wikidata":"https://www.wikidata.org/wiki/Q39045282","display_name":"Streaming data","level":2,"score":0.4559434652328491},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4076882600784302},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.10258761048316956}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2501.12407","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.12407","pdf_url":"https://arxiv.org/pdf/2501.12407","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2501.12407","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2501.12407","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2501.12407","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.12407","pdf_url":"https://arxiv.org/pdf/2501.12407","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4406755573.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2384129116","https://openalex.org/W2144438995","https://openalex.org/W1577886464","https://openalex.org/W2164896586","https://openalex.org/W1593559483","https://openalex.org/W2108334564","https://openalex.org/W2111125783","https://openalex.org/W2100367016"],"abstract_inverted_index":{"While":[0],"ML":[1,147],"model":[2],"training":[3,133],"and":[4,48,60,65,92,122],"inference":[5,114],"are":[6],"both":[7],"GPU-intensive,":[8],"CPU-based":[9,35],"data":[10,17,148],"processing":[11,18,26,124],"is":[12,72],"often":[13],"the":[14,22,52,77],"bottleneck.":[15],"Distributed":[16],"systems":[19],"based":[20],"on":[21,46,111],"batch":[23,54,59,106,113,121],"or":[24,42],"stream":[25,123],"models":[27,137],"assume":[28],"homogeneous":[29],"resource":[30],"requirements.":[31],"They":[32],"excel":[33],"at":[34],"computation":[36],"but":[37,84],"either":[38],"under-utilize":[39],"heterogeneous":[40,67,95,112,128],"resources":[41],"impose":[43],"high":[44],"overheads":[45],"failure":[47],"reconfiguration.":[49],"We":[50,100],"introduce":[51],"streaming":[53,61,105],"model,":[55],"a":[56,104],"hybrid":[57],"of":[58,79],"that":[62,108],"enables":[63],"efficient":[64],"fault-tolerant":[66],"execution.":[68],"The":[69],"key":[70],"idea":[71],"to":[73,81,85,88,119,145],"use":[74],"partitions":[75,87],"as":[76,139],"unit":[78],"execution":[80],"achieve":[82],"elasticity,":[83],"allow":[86],"be":[89],"dynamically":[90],"created":[91],"streamed":[93],"between":[94],"operators":[96],"for":[97,135],"memory-efficient":[98],"pipelining.":[99],"present":[101],"Ray":[102,130],"Data,":[103],"system":[107],"improves":[109,132],"throughput":[110,134],"pipelines":[115],"by":[116,142],"2.5-12$\\times$":[117],"compared":[118,144],"traditional":[120],"systems.":[125],"By":[126],"leveraging":[127],"clusters,":[129],"Data":[131],"multimodal":[136],"such":[138],"Stable":[140],"Diffusion":[141],"31%":[143],"single-node":[146],"loaders.":[149]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
